diff --git "a/wandb/run-20220322_102259-2z8qc0km/files/wandb-summary.json" "b/wandb/run-20220322_102259-2z8qc0km/files/wandb-summary.json" --- "a/wandb/run-20220322_102259-2z8qc0km/files/wandb-summary.json" +++ "b/wandb/run-20220322_102259-2z8qc0km/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.3902, "train/learning_rate": 8.180281690140844e-06, "train/epoch": 18.5, "train/global_step": 16500, "_runtime": 103049, "_timestamp": 1648047628, "_step": 16510, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 5.0, 6.0, 11.0, 6.0, 7.0, 11.0, 16.0, 15.0, 18.0, 10.0, 24.0, 27.0, 26.0, 29.0, 32.0, 29.0, 38.0, 39.0, 53.0, 30.0, 42.0, 33.0, 49.0, 42.0, 48.0, 44.0, 35.0, 23.0, 34.0, 38.0, 23.0, 21.0, 16.0, 20.0, 17.0, 12.0, 14.0, 8.0, 13.0, 10.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-7.036826133728027, -6.846851825714111, -6.656877517700195, -6.4669036865234375, -6.2769293785095215, -6.0869550704956055, -5.8969807624816895, -5.707006454467773, -5.517032623291016, -5.3270583152771, -5.137084007263184, -4.947110176086426, -4.75713586807251, -4.567161560058594, -4.377187252044678, -4.187212944030762, -3.997238874435425, -3.807264566421509, -3.617290496826172, -3.427316188812256, -3.237342119216919, -3.047367811203003, -2.857393741607666, -2.66741943359375, -2.477445125579834, -2.287470817565918, -2.097496747970581, -1.907522439956665, -1.7175483703613281, -1.527574062347412, -1.3375998735427856, -1.1476256847381592, -0.9576516151428223, -0.7676774263381958, -0.5777032375335693, -0.3877289891242981, -0.19775480031967163, -0.007780611515045166, 0.18219363689422607, 0.37216782569885254, 0.562142014503479, 0.7521162033081055, 0.9420903921127319, 1.1320645809173584, 1.3220388889312744, 1.5120129585266113, 1.7019872665405273, 1.8919614553451538, 2.0819356441497803, 2.2719099521636963, 2.461884021759033, 2.651858329772949, 2.841832399368286, 3.031806707382202, 3.221780776977539, 3.411755084991455, 3.601729393005371, 3.791703701019287, 3.981677770614624, 4.171651840209961, 4.361626148223877, 4.551600456237793, 4.741574764251709, 4.931549072265625, 5.121522903442383]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 5.0, 11.0, 8.0, 13.0, 9.0, 15.0, 22.0, 19.0, 18.0, 30.0, 24.0, 22.0, 28.0, 39.0, 35.0, 31.0, 36.0, 39.0, 35.0, 24.0, 49.0, 40.0, 52.0, 37.0, 43.0, 43.0, 33.0, 29.0, 23.0, 19.0, 27.0, 23.0, 25.0, 21.0, 17.0, 11.0, 9.0, 7.0, 12.0, 7.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.8797221183776855, -5.683355331420898, -5.4869890213012695, -5.290622234344482, -5.0942559242248535, -4.897889137268066, -4.7015228271484375, -4.50515604019165, -4.308789253234863, -4.112422466278076, -3.9160561561584473, -3.71968936920166, -3.523322820663452, -3.326956272125244, -3.130589723587036, -2.934223175048828, -2.73785662651062, -2.541490077972412, -2.345123529434204, -2.148756980895996, -1.952390193939209, -1.756023645401001, -1.559657096862793, -1.3632904291152954, -1.1669238805770874, -0.9705572724342346, -0.7741906642913818, -0.5778241157531738, -0.38145750761032104, -0.18509089946746826, 0.011275649070739746, 0.2076423168182373, 0.4040088653564453, 0.6003754734992981, 0.7967420816421509, 0.9931086301803589, 1.1894752979278564, 1.3858418464660645, 1.5822083950042725, 1.77857506275177, 1.974941611289978, 2.1713082790374756, 2.3676748275756836, 2.5640413761138916, 2.7604079246520996, 2.9567747116088867, 3.1531410217285156, 3.3495078086853027, 3.5458743572235107, 3.7422409057617188, 3.9386074542999268, 4.134974002838135, 4.331340789794922, 4.527707099914551, 4.724073886871338, 4.920440673828125, 5.116806983947754, 5.313173770904541, 5.50954008102417, 5.705906867980957, 5.902273178100586, 6.098639965057373, 6.29500675201416, 6.491373062133789, 6.687739849090576]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 9.0, 15.0, 25.0, 38.0, 53.0, 90.0, 153.0, 220.0, 426.0, 648.0, 1093.0, 1805.0, 3065.0, 5048.0, 8386.0, 14186.0, 24264.0, 40731.0, 68891.0, 118114.0, 200098.0, 338691.0, 544984.0, 741635.0, 735598.0, 536658.0, 331270.0, 196674.0, 115194.0, 67644.0, 39817.0, 23580.0, 14242.0, 8411.0, 4927.0, 2923.0, 1821.0, 1138.0, 682.0, 379.0, 241.0, 154.0, 92.0, 72.0, 36.0, 20.0, 15.0, 8.0, 8.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.4071044921875, -8.126708984375, -7.8463134765625, -7.56591796875, -7.2855224609375, -7.005126953125, -6.7247314453125, -6.4443359375, -6.1639404296875, -5.883544921875, -5.6031494140625, -5.32275390625, -5.0423583984375, -4.761962890625, -4.4815673828125, -4.201171875, -3.9207763671875, -3.640380859375, -3.3599853515625, -3.07958984375, -2.7991943359375, -2.518798828125, -2.2384033203125, -1.9580078125, -1.6776123046875, -1.397216796875, -1.1168212890625, -0.83642578125, -0.5560302734375, -0.275634765625, 0.0047607421875, 0.28515625, 0.5655517578125, 0.845947265625, 1.1263427734375, 1.40673828125, 1.6871337890625, 1.967529296875, 2.2479248046875, 2.5283203125, 2.8087158203125, 3.089111328125, 3.3695068359375, 3.64990234375, 3.9302978515625, 4.210693359375, 4.4910888671875, 4.771484375, 5.0518798828125, 5.332275390625, 5.6126708984375, 5.89306640625, 6.1734619140625, 6.453857421875, 6.7342529296875, 7.0146484375, 7.2950439453125, 7.575439453125, 7.8558349609375, 8.13623046875, 8.4166259765625, 8.697021484375, 8.9774169921875, 9.2578125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0, 10.0, 11.0, 9.0, 16.0, 10.0, 20.0, 15.0, 14.0, 25.0, 33.0, 38.0, 45.0, 34.0, 41.0, 32.0, 41.0, 33.0, 44.0, 38.0, 38.0, 64.0, 25.0, 51.0, 38.0, 37.0, 22.0, 32.0, 25.0, 21.0, 29.0, 18.0, 14.0, 15.0, 15.0, 11.0, 11.0, 9.0, 6.0, 6.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.70703125, -6.48779296875, -6.2685546875, -6.04931640625, -5.830078125, -5.61083984375, -5.3916015625, -5.17236328125, -4.953125, -4.73388671875, -4.5146484375, -4.29541015625, -4.076171875, -3.85693359375, -3.6376953125, -3.41845703125, -3.19921875, -2.97998046875, -2.7607421875, -2.54150390625, -2.322265625, -2.10302734375, -1.8837890625, -1.66455078125, -1.4453125, -1.22607421875, -1.0068359375, -0.78759765625, -0.568359375, -0.34912109375, -0.1298828125, 0.08935546875, 0.30859375, 0.52783203125, 0.7470703125, 0.96630859375, 1.185546875, 1.40478515625, 1.6240234375, 1.84326171875, 2.0625, 2.28173828125, 2.5009765625, 2.72021484375, 2.939453125, 3.15869140625, 3.3779296875, 3.59716796875, 3.81640625, 4.03564453125, 4.2548828125, 4.47412109375, 4.693359375, 4.91259765625, 5.1318359375, 5.35107421875, 5.5703125, 5.78955078125, 6.0087890625, 6.22802734375, 6.447265625, 6.66650390625, 6.8857421875, 7.10498046875, 7.32421875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 14.0, 17.0, 20.0, 34.0, 47.0, 85.0, 137.0, 205.0, 362.0, 528.0, 833.0, 1422.0, 2268.0, 3870.0, 6162.0, 10069.0, 16208.0, 27101.0, 44303.0, 72380.0, 118635.0, 186435.0, 288004.0, 419578.0, 562755.0, 634296.0, 568682.0, 429489.0, 295549.0, 191251.0, 120886.0, 75082.0, 46071.0, 27901.0, 16988.0, 10115.0, 6240.0, 3871.0, 2388.0, 1481.0, 915.0, 594.0, 380.0, 225.0, 154.0, 82.0, 56.0, 37.0, 23.0, 26.0, 12.0, 3.0, 4.0, 2.0, 4.0, 3.0], "bins": [-7.57421875, -7.34832763671875, -7.1224365234375, -6.89654541015625, -6.670654296875, -6.44476318359375, -6.2188720703125, -5.99298095703125, -5.76708984375, -5.54119873046875, -5.3153076171875, -5.08941650390625, -4.863525390625, -4.63763427734375, -4.4117431640625, -4.18585205078125, -3.9599609375, -3.73406982421875, -3.5081787109375, -3.28228759765625, -3.056396484375, -2.83050537109375, -2.6046142578125, -2.37872314453125, -2.15283203125, -1.92694091796875, -1.7010498046875, -1.47515869140625, -1.249267578125, -1.02337646484375, -0.7974853515625, -0.57159423828125, -0.345703125, -0.11981201171875, 0.1060791015625, 0.33197021484375, 0.557861328125, 0.78375244140625, 1.0096435546875, 1.23553466796875, 1.46142578125, 1.68731689453125, 1.9132080078125, 2.13909912109375, 2.364990234375, 2.59088134765625, 2.8167724609375, 3.04266357421875, 3.2685546875, 3.49444580078125, 3.7203369140625, 3.94622802734375, 4.172119140625, 4.39801025390625, 4.6239013671875, 4.84979248046875, 5.07568359375, 5.30157470703125, 5.5274658203125, 5.75335693359375, 5.979248046875, 6.20513916015625, 6.4310302734375, 6.65692138671875, 6.8828125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 5.0, 18.0, 18.0, 16.0, 23.0, 24.0, 41.0, 41.0, 63.0, 57.0, 74.0, 79.0, 127.0, 116.0, 131.0, 145.0, 183.0, 200.0, 205.0, 220.0, 215.0, 215.0, 239.0, 203.0, 211.0, 187.0, 151.0, 126.0, 105.0, 113.0, 106.0, 77.0, 74.0, 52.0, 46.0, 35.0, 26.0, 18.0, 21.0, 11.0, 11.0, 7.0, 4.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-3.205078125, -3.113067626953125, -3.02105712890625, -2.929046630859375, -2.8370361328125, -2.745025634765625, -2.65301513671875, -2.561004638671875, -2.468994140625, -2.376983642578125, -2.28497314453125, -2.192962646484375, -2.1009521484375, -2.008941650390625, -1.91693115234375, -1.824920654296875, -1.73291015625, -1.640899658203125, -1.54888916015625, -1.456878662109375, -1.3648681640625, -1.272857666015625, -1.18084716796875, -1.088836669921875, -0.996826171875, -0.904815673828125, -0.81280517578125, -0.720794677734375, -0.6287841796875, -0.536773681640625, -0.44476318359375, -0.352752685546875, -0.2607421875, -0.168731689453125, -0.07672119140625, 0.015289306640625, 0.1072998046875, 0.199310302734375, 0.29132080078125, 0.383331298828125, 0.475341796875, 0.567352294921875, 0.65936279296875, 0.751373291015625, 0.8433837890625, 0.935394287109375, 1.02740478515625, 1.119415283203125, 1.21142578125, 1.303436279296875, 1.39544677734375, 1.487457275390625, 1.5794677734375, 1.671478271484375, 1.76348876953125, 1.855499267578125, 1.947509765625, 2.039520263671875, 2.13153076171875, 2.223541259765625, 2.3155517578125, 2.407562255859375, 2.49957275390625, 2.591583251953125, 2.68359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 7.0, 10.0, 4.0, 10.0, 23.0, 27.0, 29.0, 28.0, 29.0, 48.0, 52.0, 46.0, 41.0, 51.0, 55.0, 49.0, 50.0, 56.0, 48.0, 48.0, 42.0, 31.0, 34.0, 34.0, 26.0, 19.0, 22.0, 20.0, 12.0, 9.0, 9.0, 7.0, 9.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.538727760314941, -8.252422332763672, -7.9661173820495605, -7.679812431335449, -7.39350700378418, -7.107202053070068, -6.820897102355957, -6.5345916748046875, -6.248286247253418, -5.961981296539307, -5.675675868988037, -5.389370918273926, -5.103065490722656, -4.816760540008545, -4.530455589294434, -4.244150161743164, -3.9578452110290527, -3.6715400218963623, -3.385234832763672, -3.0989298820495605, -2.812624454498291, -2.5263195037841797, -2.2400143146514893, -1.9537091255187988, -1.6674039363861084, -1.381098747253418, -1.0947935581207275, -0.8084884881973267, -0.5221832990646362, -0.2358781099319458, 0.05042695999145508, 0.3367321491241455, 0.6230373382568359, 0.9093425273895264, 1.1956477165222168, 1.4819527864456177, 1.768257975578308, 2.054563045501709, 2.3408682346343994, 2.62717342376709, 2.9134786128997803, 3.1997838020324707, 3.486088991165161, 3.7723941802978516, 4.058699131011963, 4.345004558563232, 4.631309509277344, 4.917614936828613, 5.203919887542725, 5.490224838256836, 5.7765302658081055, 6.062835216522217, 6.349140644073486, 6.635445594787598, 6.921751022338867, 7.2080559730529785, 7.49436092376709, 7.780665874481201, 8.066970825195312, 8.353276252746582, 8.639581680297852, 8.925887107849121, 9.212191581726074, 9.498497009277344, 9.784802436828613]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 9.0, 10.0, 6.0, 10.0, 7.0, 14.0, 22.0, 15.0, 22.0, 16.0, 29.0, 14.0, 27.0, 21.0, 19.0, 31.0, 25.0, 27.0, 33.0, 27.0, 34.0, 38.0, 34.0, 42.0, 31.0, 35.0, 17.0, 29.0, 31.0, 23.0, 26.0, 27.0, 27.0, 28.0, 27.0, 27.0, 16.0, 19.0, 11.0, 11.0, 10.0, 8.0, 12.0, 6.0, 14.0, 6.0, 6.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0], "bins": [-6.0501508712768555, -5.855575084686279, -5.660998821258545, -5.466423034667969, -5.271846771240234, -5.077270984649658, -4.882694721221924, -4.688118934631348, -4.493542671203613, -4.298966884613037, -4.104390621185303, -3.9098145961761475, -3.715238571166992, -3.520662546157837, -3.3260865211486816, -3.1315107345581055, -2.93693470954895, -2.742358684539795, -2.5477826595306396, -2.3532066345214844, -2.158630609512329, -1.9640545845031738, -1.769478678703308, -1.5749026536941528, -1.3803266286849976, -1.1857506036758423, -0.991174578666687, -0.7965986132621765, -0.6020225882530212, -0.40744656324386597, -0.21287059783935547, -0.018294572830200195, 0.17628145217895508, 0.37085747718811035, 0.5654335021972656, 0.7600094676017761, 0.9545854926109314, 1.1491615772247314, 1.3437374830245972, 1.5383135080337524, 1.7328895330429077, 1.927465558052063, 2.1220414638519287, 2.316617488861084, 2.5111935138702393, 2.7057695388793945, 2.90034556388855, 3.094921588897705, 3.2894976139068604, 3.4840736389160156, 3.678649663925171, 3.873225688934326, 4.067801475524902, 4.262377738952637, 4.456953525543213, 4.651529788970947, 4.846105575561523, 5.0406813621521, 5.235257625579834, 5.42983341217041, 5.6244096755981445, 5.818985462188721, 6.013561725616455, 6.208137512207031, 6.402713775634766]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 13.0, 17.0, 15.0, 31.0, 43.0, 56.0, 80.0, 116.0, 153.0, 239.0, 355.0, 453.0, 730.0, 1086.0, 1756.0, 2728.0, 4359.0, 7425.0, 11917.0, 20947.0, 35506.0, 58704.0, 92868.0, 135501.0, 171616.0, 165847.0, 124798.0, 83030.0, 51308.0, 30883.0, 18086.0, 10586.0, 6357.0, 3913.0, 2384.0, 1510.0, 1001.0, 673.0, 467.0, 320.0, 192.0, 134.0, 113.0, 74.0, 54.0, 24.0, 24.0, 15.0, 15.0, 10.0, 8.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.158203125, -3.059112548828125, -2.96002197265625, -2.860931396484375, -2.7618408203125, -2.662750244140625, -2.56365966796875, -2.464569091796875, -2.365478515625, -2.266387939453125, -2.16729736328125, -2.068206787109375, -1.9691162109375, -1.870025634765625, -1.77093505859375, -1.671844482421875, -1.57275390625, -1.473663330078125, -1.37457275390625, -1.275482177734375, -1.1763916015625, -1.077301025390625, -0.97821044921875, -0.879119873046875, -0.780029296875, -0.680938720703125, -0.58184814453125, -0.482757568359375, -0.3836669921875, -0.284576416015625, -0.18548583984375, -0.086395263671875, 0.0126953125, 0.111785888671875, 0.21087646484375, 0.309967041015625, 0.4090576171875, 0.508148193359375, 0.60723876953125, 0.706329345703125, 0.805419921875, 0.904510498046875, 1.00360107421875, 1.102691650390625, 1.2017822265625, 1.300872802734375, 1.39996337890625, 1.499053955078125, 1.59814453125, 1.697235107421875, 1.79632568359375, 1.895416259765625, 1.9945068359375, 2.093597412109375, 2.19268798828125, 2.291778564453125, 2.390869140625, 2.489959716796875, 2.58905029296875, 2.688140869140625, 2.7872314453125, 2.886322021484375, 2.98541259765625, 3.084503173828125, 3.18359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 7.0, 2.0, 6.0, 10.0, 6.0, 7.0, 9.0, 13.0, 11.0, 24.0, 16.0, 18.0, 22.0, 26.0, 25.0, 20.0, 28.0, 23.0, 32.0, 32.0, 23.0, 36.0, 29.0, 48.0, 54.0, 33.0, 41.0, 31.0, 38.0, 30.0, 29.0, 23.0, 34.0, 17.0, 31.0, 20.0, 18.0, 24.0, 19.0, 15.0, 20.0, 10.0, 9.0, 8.0, 7.0, 5.0, 6.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.8671875, -6.64410400390625, -6.4210205078125, -6.19793701171875, -5.974853515625, -5.75177001953125, -5.5286865234375, -5.30560302734375, -5.08251953125, -4.85943603515625, -4.6363525390625, -4.41326904296875, -4.190185546875, -3.96710205078125, -3.7440185546875, -3.52093505859375, -3.2978515625, -3.07476806640625, -2.8516845703125, -2.62860107421875, -2.405517578125, -2.18243408203125, -1.9593505859375, -1.73626708984375, -1.51318359375, -1.29010009765625, -1.0670166015625, -0.84393310546875, -0.620849609375, -0.39776611328125, -0.1746826171875, 0.04840087890625, 0.271484375, 0.49456787109375, 0.7176513671875, 0.94073486328125, 1.163818359375, 1.38690185546875, 1.6099853515625, 1.83306884765625, 2.05615234375, 2.27923583984375, 2.5023193359375, 2.72540283203125, 2.948486328125, 3.17156982421875, 3.3946533203125, 3.61773681640625, 3.8408203125, 4.06390380859375, 4.2869873046875, 4.51007080078125, 4.733154296875, 4.95623779296875, 5.1793212890625, 5.40240478515625, 5.62548828125, 5.84857177734375, 6.0716552734375, 6.29473876953125, 6.517822265625, 6.74090576171875, 6.9639892578125, 7.18707275390625, 7.41015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 4.0, 0.0, 4.0, 6.0, 12.0, 14.0, 5.0, 17.0, 21.0, 20.0, 28.0, 48.0, 66.0, 81.0, 140.0, 189.0, 362.0, 583.0, 1359.0, 3132.0, 8409.0, 25112.0, 316926.0, 646664.0, 28897.0, 9670.0, 3529.0, 1467.0, 694.0, 391.0, 230.0, 137.0, 88.0, 64.0, 39.0, 23.0, 21.0, 20.0, 16.0, 5.0, 15.0, 8.0, 15.0, 5.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.1171875, -8.803466796875, -8.48974609375, -8.176025390625, -7.8623046875, -7.548583984375, -7.23486328125, -6.921142578125, -6.607421875, -6.293701171875, -5.97998046875, -5.666259765625, -5.3525390625, -5.038818359375, -4.72509765625, -4.411376953125, -4.09765625, -3.783935546875, -3.47021484375, -3.156494140625, -2.8427734375, -2.529052734375, -2.21533203125, -1.901611328125, -1.587890625, -1.274169921875, -0.96044921875, -0.646728515625, -0.3330078125, -0.019287109375, 0.29443359375, 0.608154296875, 0.921875, 1.235595703125, 1.54931640625, 1.863037109375, 2.1767578125, 2.490478515625, 2.80419921875, 3.117919921875, 3.431640625, 3.745361328125, 4.05908203125, 4.372802734375, 4.6865234375, 5.000244140625, 5.31396484375, 5.627685546875, 5.94140625, 6.255126953125, 6.56884765625, 6.882568359375, 7.1962890625, 7.510009765625, 7.82373046875, 8.137451171875, 8.451171875, 8.764892578125, 9.07861328125, 9.392333984375, 9.7060546875, 10.019775390625, 10.33349609375, 10.647216796875, 10.9609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 7.0, 6.0, 5.0, 17.0, 15.0, 16.0, 20.0, 16.0, 20.0, 24.0, 27.0, 33.0, 25.0, 44.0, 26.0, 35.0, 36.0, 47.0, 42.0, 53.0, 41.0, 47.0, 45.0, 39.0, 35.0, 25.0, 33.0, 31.0, 18.0, 18.0, 21.0, 22.0, 15.0, 14.0, 14.0, 10.0, 10.0, 12.0, 8.0, 1.0, 8.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.625, -5.44781494140625, -5.2706298828125, -5.09344482421875, -4.916259765625, -4.73907470703125, -4.5618896484375, -4.38470458984375, -4.20751953125, -4.03033447265625, -3.8531494140625, -3.67596435546875, -3.498779296875, -3.32159423828125, -3.1444091796875, -2.96722412109375, -2.7900390625, -2.61285400390625, -2.4356689453125, -2.25848388671875, -2.081298828125, -1.90411376953125, -1.7269287109375, -1.54974365234375, -1.37255859375, -1.19537353515625, -1.0181884765625, -0.84100341796875, -0.663818359375, -0.48663330078125, -0.3094482421875, -0.13226318359375, 0.044921875, 0.22210693359375, 0.3992919921875, 0.57647705078125, 0.753662109375, 0.93084716796875, 1.1080322265625, 1.28521728515625, 1.46240234375, 1.63958740234375, 1.8167724609375, 1.99395751953125, 2.171142578125, 2.34832763671875, 2.5255126953125, 2.70269775390625, 2.8798828125, 3.05706787109375, 3.2342529296875, 3.41143798828125, 3.588623046875, 3.76580810546875, 3.9429931640625, 4.12017822265625, 4.29736328125, 4.47454833984375, 4.6517333984375, 4.82891845703125, 5.006103515625, 5.18328857421875, 5.3604736328125, 5.53765869140625, 5.71484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 10.0, 12.0, 16.0, 12.0, 20.0, 22.0, 40.0, 61.0, 115.0, 184.0, 359.0, 590.0, 1278.0, 2653.0, 6903.0, 20541.0, 150653.0, 816031.0, 32014.0, 9858.0, 3739.0, 1561.0, 804.0, 400.0, 223.0, 141.0, 92.0, 53.0, 41.0, 28.0, 24.0, 8.0, 15.0, 16.0, 12.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7587890625, -1.7041168212890625, -1.649444580078125, -1.5947723388671875, -1.54010009765625, -1.4854278564453125, -1.430755615234375, -1.3760833740234375, -1.3214111328125, -1.2667388916015625, -1.212066650390625, -1.1573944091796875, -1.10272216796875, -1.0480499267578125, -0.993377685546875, -0.9387054443359375, -0.884033203125, -0.8293609619140625, -0.774688720703125, -0.7200164794921875, -0.66534423828125, -0.6106719970703125, -0.555999755859375, -0.5013275146484375, -0.4466552734375, -0.3919830322265625, -0.337310791015625, -0.2826385498046875, -0.22796630859375, -0.1732940673828125, -0.118621826171875, -0.0639495849609375, -0.00927734375, 0.0453948974609375, 0.100067138671875, 0.1547393798828125, 0.20941162109375, 0.2640838623046875, 0.318756103515625, 0.3734283447265625, 0.4281005859375, 0.4827728271484375, 0.537445068359375, 0.5921173095703125, 0.64678955078125, 0.7014617919921875, 0.756134033203125, 0.8108062744140625, 0.865478515625, 0.9201507568359375, 0.974822998046875, 1.0294952392578125, 1.08416748046875, 1.1388397216796875, 1.193511962890625, 1.2481842041015625, 1.3028564453125, 1.3575286865234375, 1.412200927734375, 1.4668731689453125, 1.52154541015625, 1.5762176513671875, 1.630889892578125, 1.6855621337890625, 1.740234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 6.0, 14.0, 20.0, 26.0, 40.0, 53.0, 80.0, 94.0, 115.0, 94.0, 95.0, 89.0, 71.0, 61.0, 33.0, 21.0, 21.0, 17.0, 15.0, 11.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001354217529296875, -0.00013138726353645325, -0.000127352774143219, -0.00012331828474998474, -0.00011928379535675049, -0.00011524930596351624, -0.00011121481657028198, -0.00010718032717704773, -0.00010314583778381348, -9.911134839057922e-05, -9.507685899734497e-05, -9.104236960411072e-05, -8.700788021087646e-05, -8.297339081764221e-05, -7.893890142440796e-05, -7.49044120311737e-05, -7.086992263793945e-05, -6.68354332447052e-05, -6.280094385147095e-05, -5.8766454458236694e-05, -5.473196506500244e-05, -5.069747567176819e-05, -4.6662986278533936e-05, -4.262849688529968e-05, -3.859400749206543e-05, -3.455951809883118e-05, -3.0525028705596924e-05, -2.649053931236267e-05, -2.2456049919128418e-05, -1.8421560525894165e-05, -1.4387071132659912e-05, -1.035258173942566e-05, -6.318092346191406e-06, -2.2836029529571533e-06, 1.7508864402770996e-06, 5.7853758335113525e-06, 9.819865226745605e-06, 1.3854354619979858e-05, 1.788884401321411e-05, 2.1923333406448364e-05, 2.5957822799682617e-05, 2.999231219291687e-05, 3.402680158615112e-05, 3.8061290979385376e-05, 4.209578037261963e-05, 4.613026976585388e-05, 5.0164759159088135e-05, 5.419924855232239e-05, 5.823373794555664e-05, 6.22682273387909e-05, 6.630271673202515e-05, 7.03372061252594e-05, 7.437169551849365e-05, 7.84061849117279e-05, 8.244067430496216e-05, 8.647516369819641e-05, 9.050965309143066e-05, 9.454414248466492e-05, 9.857863187789917e-05, 0.00010261312127113342, 0.00010664761066436768, 0.00011068210005760193, 0.00011471658945083618, 0.00011875107884407043, 0.0001227855682373047]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 8.0, 6.0, 11.0, 15.0, 42.0, 50.0, 49.0, 73.0, 148.0, 175.0, 285.0, 398.0, 558.0, 828.0, 1325.0, 1932.0, 2975.0, 4513.0, 7295.0, 11719.0, 18920.0, 31940.0, 54104.0, 89972.0, 140776.0, 186983.0, 175637.0, 123899.0, 76544.0, 45651.0, 27422.0, 16393.0, 10040.0, 6264.0, 3996.0, 2562.0, 1728.0, 1107.0, 726.0, 493.0, 318.0, 214.0, 144.0, 114.0, 58.0, 49.0, 37.0, 24.0, 15.0, 5.0, 8.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.97802734375, -0.9473114013671875, -0.916595458984375, -0.8858795166015625, -0.85516357421875, -0.8244476318359375, -0.793731689453125, -0.7630157470703125, -0.7322998046875, -0.7015838623046875, -0.670867919921875, -0.6401519775390625, -0.60943603515625, -0.5787200927734375, -0.548004150390625, -0.5172882080078125, -0.486572265625, -0.4558563232421875, -0.425140380859375, -0.3944244384765625, -0.36370849609375, -0.3329925537109375, -0.302276611328125, -0.2715606689453125, -0.2408447265625, -0.2101287841796875, -0.179412841796875, -0.1486968994140625, -0.11798095703125, -0.0872650146484375, -0.056549072265625, -0.0258331298828125, 0.0048828125, 0.0355987548828125, 0.066314697265625, 0.0970306396484375, 0.12774658203125, 0.1584625244140625, 0.189178466796875, 0.2198944091796875, 0.2506103515625, 0.2813262939453125, 0.312042236328125, 0.3427581787109375, 0.37347412109375, 0.4041900634765625, 0.434906005859375, 0.4656219482421875, 0.496337890625, 0.5270538330078125, 0.557769775390625, 0.5884857177734375, 0.61920166015625, 0.6499176025390625, 0.680633544921875, 0.7113494873046875, 0.7420654296875, 0.7727813720703125, 0.803497314453125, 0.8342132568359375, 0.86492919921875, 0.8956451416015625, 0.926361083984375, 0.9570770263671875, 0.98779296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 10.0, 16.0, 23.0, 11.0, 31.0, 27.0, 41.0, 53.0, 63.0, 88.0, 86.0, 76.0, 89.0, 70.0, 67.0, 45.0, 52.0, 33.0, 19.0, 13.0, 17.0, 14.0, 10.0, 8.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50732421875, -0.4929771423339844, -0.47863006591796875, -0.4642829895019531, -0.4499359130859375, -0.4355888366699219, -0.42124176025390625, -0.4068946838378906, -0.392547607421875, -0.3782005310058594, -0.36385345458984375, -0.3495063781738281, -0.3351593017578125, -0.3208122253417969, -0.30646514892578125, -0.2921180725097656, -0.27777099609375, -0.2634239196777344, -0.24907684326171875, -0.23472976684570312, -0.2203826904296875, -0.20603561401367188, -0.19168853759765625, -0.17734146118164062, -0.162994384765625, -0.14864730834960938, -0.13430023193359375, -0.11995315551757812, -0.1056060791015625, -0.09125900268554688, -0.07691192626953125, -0.06256484985351562, -0.0482177734375, -0.033870697021484375, -0.01952362060546875, -0.005176544189453125, 0.0091705322265625, 0.023517608642578125, 0.03786468505859375, 0.052211761474609375, 0.066558837890625, 0.08090591430664062, 0.09525299072265625, 0.10960006713867188, 0.1239471435546875, 0.13829421997070312, 0.15264129638671875, 0.16698837280273438, 0.18133544921875, 0.19568252563476562, 0.21002960205078125, 0.22437667846679688, 0.2387237548828125, 0.2530708312988281, 0.26741790771484375, 0.2817649841308594, 0.296112060546875, 0.3104591369628906, 0.32480621337890625, 0.3391532897949219, 0.3535003662109375, 0.3678474426269531, 0.38219451904296875, 0.3965415954589844, 0.410888671875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 0.0, 1.0, 5.0, 2.0, 8.0, 6.0, 10.0, 15.0, 20.0, 25.0, 23.0, 44.0, 37.0, 52.0, 46.0, 46.0, 39.0, 56.0, 52.0, 45.0, 60.0, 56.0, 41.0, 57.0, 36.0, 35.0, 25.0, 26.0, 31.0, 19.0, 15.0, 17.0, 18.0, 6.0, 10.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.392671585083008, -8.107319831848145, -7.821968078613281, -7.536616325378418, -7.251265048980713, -6.96591329574585, -6.680561542510986, -6.395209789276123, -6.109858512878418, -5.824506759643555, -5.539155006408691, -5.253803253173828, -4.968451976776123, -4.68310022354126, -4.3977484703063965, -4.112396717071533, -3.82704496383667, -3.5416932106018066, -3.2563416957855225, -2.970989942550659, -2.685638427734375, -2.4002866744995117, -2.1149349212646484, -1.8295832872390747, -1.544231653213501, -1.2588800191879272, -0.9735283255577087, -0.6881766319274902, -0.4028249979019165, -0.11747336387634277, 0.1678783893585205, 0.45323002338409424, 0.738581657409668, 1.0239332914352417, 1.3092849254608154, 1.5946366786956787, 1.8799883127212524, 2.165339946746826, 2.4506916999816895, 2.7360434532165527, 3.021394968032837, 3.3067467212677, 3.5920982360839844, 3.8774499893188477, 4.162801742553711, 4.448153495788574, 4.7335052490234375, 5.018856525421143, 5.304208278656006, 5.589560031890869, 5.874911785125732, 6.1602630615234375, 6.445614814758301, 6.730966567993164, 7.016318321228027, 7.301670074462891, 7.587021827697754, 7.872373580932617, 8.15772533416748, 8.443077087402344, 8.728428840637207, 9.01378059387207, 9.299131393432617, 9.58448314666748, 9.869834899902344]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 9.0, 12.0, 8.0, 10.0, 7.0, 10.0, 19.0, 15.0, 17.0, 20.0, 24.0, 20.0, 24.0, 21.0, 19.0, 28.0, 26.0, 25.0, 30.0, 31.0, 30.0, 37.0, 45.0, 37.0, 29.0, 38.0, 20.0, 27.0, 30.0, 29.0, 28.0, 25.0, 26.0, 30.0, 25.0, 31.0, 16.0, 15.0, 16.0, 7.0, 17.0, 7.0, 14.0, 8.0, 9.0, 10.0, 5.0, 8.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-5.8974504470825195, -5.703672885894775, -5.509895324707031, -5.316117286682129, -5.122339725494385, -4.928562164306641, -4.734784126281738, -4.541006565093994, -4.34722900390625, -4.153451442718506, -3.9596736431121826, -3.7658958435058594, -3.5721182823181152, -3.378340721130371, -3.184562921524048, -2.9907851219177246, -2.7970075607299805, -2.6032299995422363, -2.409452199935913, -2.21567440032959, -2.0218968391418457, -1.828119158744812, -1.6343414783477783, -1.4405637979507446, -1.246786117553711, -1.0530084371566772, -0.8592307567596436, -0.6654530763626099, -0.47167539596557617, -0.2778977155685425, -0.08412003517150879, 0.1096576452255249, 0.3034348487854004, 0.4972125291824341, 0.6909902095794678, 0.8847678899765015, 1.0785455703735352, 1.2723232507705688, 1.4661009311676025, 1.6598786115646362, 1.85365629196167, 2.047433853149414, 2.2412116527557373, 2.4349894523620605, 2.6287670135498047, 2.822544574737549, 3.016322374343872, 3.2101001739501953, 3.4038777351379395, 3.5976552963256836, 3.791433095932007, 3.98521089553833, 4.178988456726074, 4.372766017913818, 4.5665435791015625, 4.760321617126465, 4.954099178314209, 5.147876739501953, 5.3416547775268555, 5.5354323387146, 5.729209899902344, 5.922987461090088, 6.116765022277832, 6.310543060302734, 6.5043206214904785]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 4.0, 8.0, 9.0, 12.0, 27.0, 34.0, 56.0, 86.0, 124.0, 187.0, 329.0, 535.0, 803.0, 1290.0, 1863.0, 2965.0, 4453.0, 6665.0, 10130.0, 15101.0, 22388.0, 31619.0, 43896.0, 57802.0, 73623.0, 89098.0, 99300.0, 103746.0, 100582.0, 90696.0, 76845.0, 60918.0, 46748.0, 33824.0, 23904.0, 16507.0, 11346.0, 7401.0, 4816.0, 3116.0, 2069.0, 1315.0, 831.0, 535.0, 327.0, 230.0, 138.0, 92.0, 65.0, 39.0, 28.0, 15.0, 13.0, 10.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.13671875, -5.9425048828125, -5.748291015625, -5.5540771484375, -5.35986328125, -5.1656494140625, -4.971435546875, -4.7772216796875, -4.5830078125, -4.3887939453125, -4.194580078125, -4.0003662109375, -3.80615234375, -3.6119384765625, -3.417724609375, -3.2235107421875, -3.029296875, -2.8350830078125, -2.640869140625, -2.4466552734375, -2.25244140625, -2.0582275390625, -1.864013671875, -1.6697998046875, -1.4755859375, -1.2813720703125, -1.087158203125, -0.8929443359375, -0.69873046875, -0.5045166015625, -0.310302734375, -0.1160888671875, 0.078125, 0.2723388671875, 0.466552734375, 0.6607666015625, 0.85498046875, 1.0491943359375, 1.243408203125, 1.4376220703125, 1.6318359375, 1.8260498046875, 2.020263671875, 2.2144775390625, 2.40869140625, 2.6029052734375, 2.797119140625, 2.9913330078125, 3.185546875, 3.3797607421875, 3.573974609375, 3.7681884765625, 3.96240234375, 4.1566162109375, 4.350830078125, 4.5450439453125, 4.7392578125, 4.9334716796875, 5.127685546875, 5.3218994140625, 5.51611328125, 5.7103271484375, 5.904541015625, 6.0987548828125, 6.29296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 9.0, 13.0, 16.0, 18.0, 23.0, 24.0, 20.0, 20.0, 24.0, 26.0, 28.0, 32.0, 29.0, 37.0, 27.0, 34.0, 40.0, 48.0, 28.0, 40.0, 40.0, 46.0, 26.0, 42.0, 33.0, 34.0, 28.0, 29.0, 20.0, 22.0, 23.0, 19.0, 7.0, 12.0, 12.0, 10.0, 8.0, 9.0, 6.0, 5.0, 9.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.53515625, -6.31201171875, -6.0888671875, -5.86572265625, -5.642578125, -5.41943359375, -5.1962890625, -4.97314453125, -4.75, -4.52685546875, -4.3037109375, -4.08056640625, -3.857421875, -3.63427734375, -3.4111328125, -3.18798828125, -2.96484375, -2.74169921875, -2.5185546875, -2.29541015625, -2.072265625, -1.84912109375, -1.6259765625, -1.40283203125, -1.1796875, -0.95654296875, -0.7333984375, -0.51025390625, -0.287109375, -0.06396484375, 0.1591796875, 0.38232421875, 0.60546875, 0.82861328125, 1.0517578125, 1.27490234375, 1.498046875, 1.72119140625, 1.9443359375, 2.16748046875, 2.390625, 2.61376953125, 2.8369140625, 3.06005859375, 3.283203125, 3.50634765625, 3.7294921875, 3.95263671875, 4.17578125, 4.39892578125, 4.6220703125, 4.84521484375, 5.068359375, 5.29150390625, 5.5146484375, 5.73779296875, 5.9609375, 6.18408203125, 6.4072265625, 6.63037109375, 6.853515625, 7.07666015625, 7.2998046875, 7.52294921875, 7.74609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 3.0, 3.0, 11.0, 10.0, 19.0, 37.0, 59.0, 79.0, 124.0, 208.0, 345.0, 572.0, 888.0, 1278.0, 2122.0, 3202.0, 4914.0, 7216.0, 10579.0, 15479.0, 22188.0, 31261.0, 42002.0, 55495.0, 69601.0, 83687.0, 93932.0, 98957.0, 97905.0, 90203.0, 78487.0, 63734.0, 49843.0, 37714.0, 26827.0, 19203.0, 13309.0, 9265.0, 6262.0, 4074.0, 2681.0, 1749.0, 1108.0, 734.0, 437.0, 297.0, 186.0, 105.0, 65.0, 46.0, 18.0, 16.0, 9.0, 7.0, 3.0, 4.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-7.10546875, -6.874755859375, -6.64404296875, -6.413330078125, -6.1826171875, -5.951904296875, -5.72119140625, -5.490478515625, -5.259765625, -5.029052734375, -4.79833984375, -4.567626953125, -4.3369140625, -4.106201171875, -3.87548828125, -3.644775390625, -3.4140625, -3.183349609375, -2.95263671875, -2.721923828125, -2.4912109375, -2.260498046875, -2.02978515625, -1.799072265625, -1.568359375, -1.337646484375, -1.10693359375, -0.876220703125, -0.6455078125, -0.414794921875, -0.18408203125, 0.046630859375, 0.27734375, 0.508056640625, 0.73876953125, 0.969482421875, 1.2001953125, 1.430908203125, 1.66162109375, 1.892333984375, 2.123046875, 2.353759765625, 2.58447265625, 2.815185546875, 3.0458984375, 3.276611328125, 3.50732421875, 3.738037109375, 3.96875, 4.199462890625, 4.43017578125, 4.660888671875, 4.8916015625, 5.122314453125, 5.35302734375, 5.583740234375, 5.814453125, 6.045166015625, 6.27587890625, 6.506591796875, 6.7373046875, 6.968017578125, 7.19873046875, 7.429443359375, 7.66015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 10.0, 8.0, 12.0, 11.0, 19.0, 12.0, 19.0, 21.0, 21.0, 26.0, 28.0, 25.0, 32.0, 32.0, 54.0, 33.0, 46.0, 42.0, 32.0, 47.0, 55.0, 42.0, 31.0, 42.0, 31.0, 30.0, 31.0, 21.0, 29.0, 17.0, 22.0, 21.0, 12.0, 18.0, 17.0, 9.0, 2.0, 7.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 4.0], "bins": [-6.05859375, -5.89837646484375, -5.7381591796875, -5.57794189453125, -5.417724609375, -5.25750732421875, -5.0972900390625, -4.93707275390625, -4.77685546875, -4.61663818359375, -4.4564208984375, -4.29620361328125, -4.135986328125, -3.97576904296875, -3.8155517578125, -3.65533447265625, -3.4951171875, -3.33489990234375, -3.1746826171875, -3.01446533203125, -2.854248046875, -2.69403076171875, -2.5338134765625, -2.37359619140625, -2.21337890625, -2.05316162109375, -1.8929443359375, -1.73272705078125, -1.572509765625, -1.41229248046875, -1.2520751953125, -1.09185791015625, -0.931640625, -0.77142333984375, -0.6112060546875, -0.45098876953125, -0.290771484375, -0.13055419921875, 0.0296630859375, 0.18988037109375, 0.35009765625, 0.51031494140625, 0.6705322265625, 0.83074951171875, 0.990966796875, 1.15118408203125, 1.3114013671875, 1.47161865234375, 1.6318359375, 1.79205322265625, 1.9522705078125, 2.11248779296875, 2.272705078125, 2.43292236328125, 2.5931396484375, 2.75335693359375, 2.91357421875, 3.07379150390625, 3.2340087890625, 3.39422607421875, 3.554443359375, 3.71466064453125, 3.8748779296875, 4.03509521484375, 4.1953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 4.0, 5.0, 11.0, 15.0, 26.0, 37.0, 53.0, 75.0, 100.0, 157.0, 192.0, 272.0, 365.0, 529.0, 745.0, 1087.0, 1511.0, 2252.0, 3362.0, 4827.0, 7098.0, 10601.0, 15959.0, 23828.0, 34793.0, 49702.0, 69037.0, 89656.0, 107879.0, 117714.0, 115955.0, 103002.0, 83461.0, 62793.0, 44949.0, 31232.0, 21062.0, 14159.0, 9614.0, 6480.0, 4388.0, 2962.0, 2032.0, 1367.0, 992.0, 652.0, 464.0, 308.0, 240.0, 166.0, 125.0, 90.0, 57.0, 43.0, 34.0, 14.0, 15.0, 6.0, 3.0, 5.0, 5.0, 2.0], "bins": [-2.103515625, -2.0374755859375, -1.971435546875, -1.9053955078125, -1.83935546875, -1.7733154296875, -1.707275390625, -1.6412353515625, -1.5751953125, -1.5091552734375, -1.443115234375, -1.3770751953125, -1.31103515625, -1.2449951171875, -1.178955078125, -1.1129150390625, -1.046875, -0.9808349609375, -0.914794921875, -0.8487548828125, -0.78271484375, -0.7166748046875, -0.650634765625, -0.5845947265625, -0.5185546875, -0.4525146484375, -0.386474609375, -0.3204345703125, -0.25439453125, -0.1883544921875, -0.122314453125, -0.0562744140625, 0.009765625, 0.0758056640625, 0.141845703125, 0.2078857421875, 0.27392578125, 0.3399658203125, 0.406005859375, 0.4720458984375, 0.5380859375, 0.6041259765625, 0.670166015625, 0.7362060546875, 0.80224609375, 0.8682861328125, 0.934326171875, 1.0003662109375, 1.06640625, 1.1324462890625, 1.198486328125, 1.2645263671875, 1.33056640625, 1.3966064453125, 1.462646484375, 1.5286865234375, 1.5947265625, 1.6607666015625, 1.726806640625, 1.7928466796875, 1.85888671875, 1.9249267578125, 1.990966796875, 2.0570068359375, 2.123046875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 6.0, 11.0, 9.0, 16.0, 14.0, 17.0, 12.0, 24.0, 27.0, 43.0, 41.0, 47.0, 51.0, 44.0, 47.0, 76.0, 59.0, 63.0, 57.0, 53.0, 33.0, 47.0, 39.0, 36.0, 26.0, 16.0, 22.0, 16.0, 10.0, 10.0, 12.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0003790855407714844, -0.00036915019154548645, -0.0003592148423194885, -0.0003492794930934906, -0.0003393441438674927, -0.00032940879464149475, -0.0003194734454154968, -0.0003095380961894989, -0.000299602746963501, -0.00028966739773750305, -0.0002797320485115051, -0.0002697966992855072, -0.0002598613500595093, -0.00024992600083351135, -0.00023999065160751343, -0.0002300553023815155, -0.00022011995315551758, -0.00021018460392951965, -0.00020024925470352173, -0.0001903139054775238, -0.00018037855625152588, -0.00017044320702552795, -0.00016050785779953003, -0.0001505725085735321, -0.00014063715934753418, -0.00013070181012153625, -0.00012076646089553833, -0.0001108311116695404, -0.00010089576244354248, -9.096041321754456e-05, -8.102506399154663e-05, -7.10897147655487e-05, -6.115436553955078e-05, -5.1219016313552856e-05, -4.128366708755493e-05, -3.134831786155701e-05, -2.1412968635559082e-05, -1.1477619409561157e-05, -1.5422701835632324e-06, 8.393079042434692e-06, 1.8328428268432617e-05, 2.8263777494430542e-05, 3.819912672042847e-05, 4.813447594642639e-05, 5.8069825172424316e-05, 6.800517439842224e-05, 7.794052362442017e-05, 8.787587285041809e-05, 9.781122207641602e-05, 0.00010774657130241394, 0.00011768192052841187, 0.0001276172697544098, 0.00013755261898040771, 0.00014748796820640564, 0.00015742331743240356, 0.0001673586666584015, 0.00017729401588439941, 0.00018722936511039734, 0.00019716471433639526, 0.0002071000635623932, 0.0002170354127883911, 0.00022697076201438904, 0.00023690611124038696, 0.0002468414604663849, 0.0002567768096923828]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 17.0, 28.0, 41.0, 47.0, 58.0, 114.0, 146.0, 219.0, 315.0, 496.0, 720.0, 1090.0, 1761.0, 2663.0, 4158.0, 6432.0, 10313.0, 15811.0, 24547.0, 37252.0, 54223.0, 75992.0, 98758.0, 117228.0, 125069.0, 119478.0, 101575.0, 79427.0, 56964.0, 39604.0, 26543.0, 16829.0, 10875.0, 7030.0, 4462.0, 2812.0, 1834.0, 1228.0, 781.0, 502.0, 356.0, 208.0, 198.0, 94.0, 85.0, 48.0, 40.0, 26.0, 12.0, 8.0, 10.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.1171875, -2.047943115234375, -1.97869873046875, -1.909454345703125, -1.8402099609375, -1.770965576171875, -1.70172119140625, -1.632476806640625, -1.563232421875, -1.493988037109375, -1.42474365234375, -1.355499267578125, -1.2862548828125, -1.217010498046875, -1.14776611328125, -1.078521728515625, -1.00927734375, -0.940032958984375, -0.87078857421875, -0.801544189453125, -0.7322998046875, -0.663055419921875, -0.59381103515625, -0.524566650390625, -0.455322265625, -0.386077880859375, -0.31683349609375, -0.247589111328125, -0.1783447265625, -0.109100341796875, -0.03985595703125, 0.029388427734375, 0.0986328125, 0.167877197265625, 0.23712158203125, 0.306365966796875, 0.3756103515625, 0.444854736328125, 0.51409912109375, 0.583343505859375, 0.652587890625, 0.721832275390625, 0.79107666015625, 0.860321044921875, 0.9295654296875, 0.998809814453125, 1.06805419921875, 1.137298583984375, 1.20654296875, 1.275787353515625, 1.34503173828125, 1.414276123046875, 1.4835205078125, 1.552764892578125, 1.62200927734375, 1.691253662109375, 1.760498046875, 1.829742431640625, 1.89898681640625, 1.968231201171875, 2.0374755859375, 2.106719970703125, 2.17596435546875, 2.245208740234375, 2.314453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 3.0, 4.0, 2.0, 5.0, 9.0, 9.0, 6.0, 10.0, 8.0, 12.0, 16.0, 9.0, 17.0, 32.0, 30.0, 17.0, 37.0, 32.0, 41.0, 45.0, 50.0, 59.0, 52.0, 33.0, 35.0, 48.0, 48.0, 41.0, 51.0, 28.0, 26.0, 28.0, 38.0, 24.0, 18.0, 19.0, 13.0, 13.0, 11.0, 7.0, 6.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.93212890625, -0.9007186889648438, -0.8693084716796875, -0.8378982543945312, -0.806488037109375, -0.7750778198242188, -0.7436676025390625, -0.7122573852539062, -0.68084716796875, -0.6494369506835938, -0.6180267333984375, -0.5866165161132812, -0.555206298828125, -0.5237960815429688, -0.4923858642578125, -0.46097564697265625, -0.4295654296875, -0.39815521240234375, -0.3667449951171875, -0.33533477783203125, -0.303924560546875, -0.27251434326171875, -0.2411041259765625, -0.20969390869140625, -0.17828369140625, -0.14687347412109375, -0.1154632568359375, -0.08405303955078125, -0.052642822265625, -0.02123260498046875, 0.0101776123046875, 0.04158782958984375, 0.072998046875, 0.10440826416015625, 0.1358184814453125, 0.16722869873046875, 0.198638916015625, 0.23004913330078125, 0.2614593505859375, 0.29286956787109375, 0.32427978515625, 0.35569000244140625, 0.3871002197265625, 0.41851043701171875, 0.449920654296875, 0.48133087158203125, 0.5127410888671875, 0.5441513061523438, 0.5755615234375, 0.6069717407226562, 0.6383819580078125, 0.6697921752929688, 0.701202392578125, 0.7326126098632812, 0.7640228271484375, 0.7954330444335938, 0.82684326171875, 0.8582534790039062, 0.8896636962890625, 0.9210739135742188, 0.952484130859375, 0.9838943481445312, 1.0153045654296875, 1.0467147827148438, 1.078125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 2.0, 2.0, 7.0, 6.0, 13.0, 16.0, 13.0, 14.0, 27.0, 52.0, 27.0, 38.0, 42.0, 30.0, 45.0, 65.0, 67.0, 60.0, 50.0, 49.0, 47.0, 48.0, 31.0, 31.0, 31.0, 28.0, 26.0, 24.0, 26.0, 16.0, 14.0, 11.0, 11.0, 8.0, 5.0, 7.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.949705123901367, -7.6665358543396, -7.383366584777832, -7.100197792053223, -6.817028522491455, -6.5338592529296875, -6.250690460205078, -5.9675211906433105, -5.684351921081543, -5.401182651519775, -5.118013381958008, -4.834844589233398, -4.551675319671631, -4.268506050109863, -3.985337018966675, -3.7021679878234863, -3.4189987182617188, -3.135829448699951, -2.8526604175567627, -2.569491386413574, -2.2863221168518066, -2.003152847290039, -1.7199838161468506, -1.4368146657943726, -1.1536455154418945, -0.8704763650894165, -0.5873072147369385, -0.30413806438446045, -0.020968914031982422, 0.2622002363204956, 0.5453693866729736, 0.8285385370254517, 1.1117067337036133, 1.3948758840560913, 1.6780450344085693, 1.9612141847610474, 2.2443833351135254, 2.527552604675293, 2.8107216358184814, 3.09389066696167, 3.3770599365234375, 3.660229206085205, 3.9433982372283936, 4.226567268371582, 4.50973653793335, 4.792905807495117, 5.076074600219727, 5.359243869781494, 5.642413139343262, 5.925582408905029, 6.208751678466797, 6.491920471191406, 6.775089740753174, 7.058259010314941, 7.341427803039551, 7.624597072601318, 7.907766342163086, 8.190935134887695, 8.474104881286621, 8.75727367401123, 9.040443420410156, 9.323612213134766, 9.606781005859375, 9.8899507522583, 10.17311954498291]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 4.0, 4.0, 5.0, 2.0, 7.0, 5.0, 14.0, 13.0, 12.0, 14.0, 11.0, 23.0, 16.0, 25.0, 22.0, 18.0, 24.0, 26.0, 24.0, 25.0, 29.0, 42.0, 45.0, 36.0, 41.0, 39.0, 30.0, 35.0, 44.0, 32.0, 26.0, 23.0, 26.0, 30.0, 29.0, 17.0, 24.0, 25.0, 23.0, 16.0, 24.0, 11.0, 13.0, 9.0, 7.0, 5.0, 13.0, 6.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.554723262786865, -6.333518981933594, -6.112314701080322, -5.891110420227051, -5.6699066162109375, -5.448702335357666, -5.2274980545043945, -5.006293773651123, -4.785089492797852, -4.56388521194458, -4.342680931091309, -4.121477127075195, -3.900272846221924, -3.6790685653686523, -3.457864284515381, -3.2366600036621094, -3.015456199645996, -2.7942519187927246, -2.5730478763580322, -2.3518435955047607, -2.1306395530700684, -1.9094352722167969, -1.6882309913635254, -1.4670268297195435, -1.2458226680755615, -1.0246185064315796, -0.8034142851829529, -0.5822100639343262, -0.36100590229034424, -0.1398017406463623, 0.08140254020690918, 0.3026067018508911, 0.5238113403320312, 0.7450155019760132, 0.9662197232246399, 1.1874239444732666, 1.4086281061172485, 1.6298322677612305, 1.851036548614502, 2.0722408294677734, 2.293444871902466, 2.5146491527557373, 2.7358531951904297, 2.957057476043701, 3.1782617568969727, 3.399465799331665, 3.6206700801849365, 3.841874122619629, 4.0630784034729, 4.284282684326172, 4.505486965179443, 4.726691246032715, 4.947895050048828, 5.1690993309021, 5.390303611755371, 5.611507892608643, 5.832712173461914, 6.0539164543151855, 6.275120735168457, 6.49632453918457, 6.717528820037842, 6.938733100891113, 7.159937381744385, 7.381141662597656, 7.6023454666137695]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 8.0, 13.0, 12.0, 23.0, 35.0, 51.0, 94.0, 126.0, 208.0, 296.0, 421.0, 598.0, 846.0, 1328.0, 1984.0, 3121.0, 4622.0, 7129.0, 11211.0, 17120.0, 26055.0, 41001.0, 63578.0, 100176.0, 157193.0, 246514.0, 371457.0, 517290.0, 613742.0, 595686.0, 477882.0, 334096.0, 216962.0, 138681.0, 87851.0, 55827.0, 35670.0, 22892.0, 14625.0, 9475.0, 6253.0, 4135.0, 2657.0, 1751.0, 1195.0, 796.0, 546.0, 347.0, 242.0, 148.0, 112.0, 72.0, 39.0, 25.0, 24.0, 23.0, 7.0, 6.0, 8.0, 4.0, 4.0], "bins": [-6.19921875, -6.004638671875, -5.81005859375, -5.615478515625, -5.4208984375, -5.226318359375, -5.03173828125, -4.837158203125, -4.642578125, -4.447998046875, -4.25341796875, -4.058837890625, -3.8642578125, -3.669677734375, -3.47509765625, -3.280517578125, -3.0859375, -2.891357421875, -2.69677734375, -2.502197265625, -2.3076171875, -2.113037109375, -1.91845703125, -1.723876953125, -1.529296875, -1.334716796875, -1.14013671875, -0.945556640625, -0.7509765625, -0.556396484375, -0.36181640625, -0.167236328125, 0.02734375, 0.221923828125, 0.41650390625, 0.611083984375, 0.8056640625, 1.000244140625, 1.19482421875, 1.389404296875, 1.583984375, 1.778564453125, 1.97314453125, 2.167724609375, 2.3623046875, 2.556884765625, 2.75146484375, 2.946044921875, 3.140625, 3.335205078125, 3.52978515625, 3.724365234375, 3.9189453125, 4.113525390625, 4.30810546875, 4.502685546875, 4.697265625, 4.891845703125, 5.08642578125, 5.281005859375, 5.4755859375, 5.670166015625, 5.86474609375, 6.059326171875, 6.25390625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 6.0, 10.0, 13.0, 10.0, 19.0, 14.0, 20.0, 29.0, 24.0, 26.0, 19.0, 24.0, 30.0, 34.0, 49.0, 35.0, 36.0, 48.0, 33.0, 41.0, 41.0, 48.0, 34.0, 38.0, 28.0, 50.0, 28.0, 29.0, 20.0, 14.0, 24.0, 19.0, 17.0, 14.0, 17.0, 15.0, 12.0, 6.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8984375, -6.683837890625, -6.46923828125, -6.254638671875, -6.0400390625, -5.825439453125, -5.61083984375, -5.396240234375, -5.181640625, -4.967041015625, -4.75244140625, -4.537841796875, -4.3232421875, -4.108642578125, -3.89404296875, -3.679443359375, -3.46484375, -3.250244140625, -3.03564453125, -2.821044921875, -2.6064453125, -2.391845703125, -2.17724609375, -1.962646484375, -1.748046875, -1.533447265625, -1.31884765625, -1.104248046875, -0.8896484375, -0.675048828125, -0.46044921875, -0.245849609375, -0.03125, 0.183349609375, 0.39794921875, 0.612548828125, 0.8271484375, 1.041748046875, 1.25634765625, 1.470947265625, 1.685546875, 1.900146484375, 2.11474609375, 2.329345703125, 2.5439453125, 2.758544921875, 2.97314453125, 3.187744140625, 3.40234375, 3.616943359375, 3.83154296875, 4.046142578125, 4.2607421875, 4.475341796875, 4.68994140625, 4.904541015625, 5.119140625, 5.333740234375, 5.54833984375, 5.762939453125, 5.9775390625, 6.192138671875, 6.40673828125, 6.621337890625, 6.8359375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 12.0, 16.0, 22.0, 27.0, 44.0, 76.0, 100.0, 164.0, 244.0, 373.0, 580.0, 866.0, 1357.0, 2111.0, 3339.0, 5074.0, 8057.0, 12975.0, 19988.0, 32457.0, 50827.0, 80887.0, 126251.0, 193286.0, 288152.0, 410257.0, 533690.0, 594974.0, 543537.0, 422506.0, 300959.0, 200473.0, 131439.0, 84079.0, 53559.0, 33779.0, 21180.0, 13185.0, 8551.0, 5234.0, 3338.0, 2180.0, 1421.0, 933.0, 611.0, 400.0, 246.0, 166.0, 100.0, 68.0, 53.0, 32.0, 19.0, 11.0, 13.0, 4.0, 4.0, 3.0], "bins": [-6.5625, -6.36688232421875, -6.1712646484375, -5.97564697265625, -5.780029296875, -5.58441162109375, -5.3887939453125, -5.19317626953125, -4.99755859375, -4.80194091796875, -4.6063232421875, -4.41070556640625, -4.215087890625, -4.01947021484375, -3.8238525390625, -3.62823486328125, -3.4326171875, -3.23699951171875, -3.0413818359375, -2.84576416015625, -2.650146484375, -2.45452880859375, -2.2589111328125, -2.06329345703125, -1.86767578125, -1.67205810546875, -1.4764404296875, -1.28082275390625, -1.085205078125, -0.88958740234375, -0.6939697265625, -0.49835205078125, -0.302734375, -0.10711669921875, 0.0885009765625, 0.28411865234375, 0.479736328125, 0.67535400390625, 0.8709716796875, 1.06658935546875, 1.26220703125, 1.45782470703125, 1.6534423828125, 1.84906005859375, 2.044677734375, 2.24029541015625, 2.4359130859375, 2.63153076171875, 2.8271484375, 3.02276611328125, 3.2183837890625, 3.41400146484375, 3.609619140625, 3.80523681640625, 4.0008544921875, 4.19647216796875, 4.39208984375, 4.58770751953125, 4.7833251953125, 4.97894287109375, 5.174560546875, 5.37017822265625, 5.5657958984375, 5.76141357421875, 5.95703125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 9.0, 8.0, 11.0, 15.0, 13.0, 31.0, 36.0, 30.0, 52.0, 41.0, 58.0, 86.0, 93.0, 110.0, 153.0, 151.0, 194.0, 189.0, 232.0, 239.0, 225.0, 246.0, 250.0, 245.0, 209.0, 186.0, 166.0, 150.0, 124.0, 112.0, 67.0, 59.0, 69.0, 44.0, 45.0, 34.0, 23.0, 19.0, 16.0, 6.0, 10.0, 5.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.66156005859375, -2.5672607421875, -2.47296142578125, -2.378662109375, -2.28436279296875, -2.1900634765625, -2.09576416015625, -2.00146484375, -1.90716552734375, -1.8128662109375, -1.71856689453125, -1.624267578125, -1.52996826171875, -1.4356689453125, -1.34136962890625, -1.2470703125, -1.15277099609375, -1.0584716796875, -0.96417236328125, -0.869873046875, -0.77557373046875, -0.6812744140625, -0.58697509765625, -0.49267578125, -0.39837646484375, -0.3040771484375, -0.20977783203125, -0.115478515625, -0.02117919921875, 0.0731201171875, 0.16741943359375, 0.26171875, 0.35601806640625, 0.4503173828125, 0.54461669921875, 0.638916015625, 0.73321533203125, 0.8275146484375, 0.92181396484375, 1.01611328125, 1.11041259765625, 1.2047119140625, 1.29901123046875, 1.393310546875, 1.48760986328125, 1.5819091796875, 1.67620849609375, 1.7705078125, 1.86480712890625, 1.9591064453125, 2.05340576171875, 2.147705078125, 2.24200439453125, 2.3363037109375, 2.43060302734375, 2.52490234375, 2.61920166015625, 2.7135009765625, 2.80780029296875, 2.902099609375, 2.99639892578125, 3.0906982421875, 3.18499755859375, 3.279296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 2.0, 14.0, 9.0, 17.0, 14.0, 11.0, 23.0, 22.0, 23.0, 26.0, 23.0, 48.0, 27.0, 45.0, 36.0, 39.0, 38.0, 48.0, 45.0, 51.0, 44.0, 45.0, 41.0, 34.0, 41.0, 39.0, 29.0, 19.0, 22.0, 18.0, 10.0, 14.0, 12.0, 10.0, 9.0, 12.0, 6.0, 4.0, 9.0, 5.0, 4.0, 3.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.414489269256592, -6.176285266876221, -5.93808126449585, -5.6998772621154785, -5.461672782897949, -5.223468780517578, -4.985264778137207, -4.747060775756836, -4.508856773376465, -4.270652770996094, -4.032448768615723, -3.7942445278167725, -3.5560405254364014, -3.3178365230560303, -3.07963228225708, -2.841428279876709, -2.603224277496338, -2.365020275115967, -2.1268162727355957, -1.8886120319366455, -1.6504080295562744, -1.4122040271759033, -1.1739999055862427, -0.935795783996582, -0.6975917816162109, -0.45938771963119507, -0.2211836576461792, 0.01702040433883667, 0.25522446632385254, 0.49342846870422363, 0.7316325902938843, 0.9698367118835449, 1.2080411911010742, 1.4462451934814453, 1.684449315071106, 1.9226534366607666, 2.1608574390411377, 2.399061441421509, 2.637265682220459, 2.87546968460083, 3.113673686981201, 3.3518776893615723, 3.5900816917419434, 3.8282859325408936, 4.066490173339844, 4.304694175720215, 4.542898178100586, 4.781102180480957, 5.019306182861328, 5.257510185241699, 5.49571418762207, 5.733918190002441, 5.9721221923828125, 6.210326194763184, 6.448530673980713, 6.686734676361084, 6.924938678741455, 7.163142681121826, 7.401346683502197, 7.639550685882568, 7.877755165100098, 8.115959167480469, 8.35416316986084, 8.592367172241211, 8.830571174621582]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 8.0, 4.0, 14.0, 21.0, 12.0, 10.0, 14.0, 14.0, 24.0, 20.0, 20.0, 25.0, 31.0, 35.0, 29.0, 37.0, 37.0, 37.0, 39.0, 34.0, 33.0, 34.0, 41.0, 32.0, 34.0, 33.0, 32.0, 28.0, 27.0, 29.0, 38.0, 28.0, 20.0, 15.0, 26.0, 15.0, 14.0, 8.0, 9.0, 10.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.124462127685547, -6.89511775970459, -6.665773391723633, -6.436429023742676, -6.207084655761719, -5.977740287780762, -5.7483954429626465, -5.5190510749816895, -5.289706707000732, -5.060362339019775, -4.831017971038818, -4.601673603057861, -4.372328758239746, -4.142984390258789, -3.913640022277832, -3.684295654296875, -3.454951286315918, -3.225606918334961, -2.996262550354004, -2.7669179439544678, -2.5375735759735107, -2.3082292079925537, -2.0788846015930176, -1.8495402336120605, -1.6201958656311035, -1.3908514976501465, -1.1615070104599, -0.9321625828742981, -0.7028181552886963, -0.47347378730773926, -0.24412930011749268, -0.014784812927246094, 0.21455955505371094, 0.44390398263931274, 0.6732484102249146, 0.9025928378105164, 1.1319372653961182, 1.3612816333770752, 1.5906261205673218, 1.8199706077575684, 2.0493149757385254, 2.2786593437194824, 2.5080037117004395, 2.7373483180999756, 2.9666926860809326, 3.1960370540618896, 3.425381660461426, 3.654726028442383, 3.88407039642334, 4.113414764404297, 4.342759132385254, 4.572103500366211, 4.801447868347168, 5.030792236328125, 5.26013708114624, 5.489481449127197, 5.718825817108154, 5.948170185089111, 6.177514553070068, 6.406858921051025, 6.636203765869141, 6.865548133850098, 7.094892501831055, 7.324236869812012, 7.553581237792969]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 12.0, 18.0, 39.0, 53.0, 88.0, 150.0, 243.0, 377.0, 583.0, 969.0, 1501.0, 2463.0, 3820.0, 5987.0, 9129.0, 14116.0, 21121.0, 31295.0, 43934.0, 59307.0, 76544.0, 93143.0, 105318.0, 110732.0, 105246.0, 93425.0, 76073.0, 58445.0, 43026.0, 30538.0, 21270.0, 14069.0, 9263.0, 6002.0, 3799.0, 2503.0, 1560.0, 867.0, 577.0, 382.0, 219.0, 135.0, 76.0, 50.0, 38.0, 22.0, 8.0, 10.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.453125, -3.346832275390625, -3.24053955078125, -3.134246826171875, -3.0279541015625, -2.921661376953125, -2.81536865234375, -2.709075927734375, -2.602783203125, -2.496490478515625, -2.39019775390625, -2.283905029296875, -2.1776123046875, -2.071319580078125, -1.96502685546875, -1.858734130859375, -1.75244140625, -1.646148681640625, -1.53985595703125, -1.433563232421875, -1.3272705078125, -1.220977783203125, -1.11468505859375, -1.008392333984375, -0.902099609375, -0.795806884765625, -0.68951416015625, -0.583221435546875, -0.4769287109375, -0.370635986328125, -0.26434326171875, -0.158050537109375, -0.0517578125, 0.054534912109375, 0.16082763671875, 0.267120361328125, 0.3734130859375, 0.479705810546875, 0.58599853515625, 0.692291259765625, 0.798583984375, 0.904876708984375, 1.01116943359375, 1.117462158203125, 1.2237548828125, 1.330047607421875, 1.43634033203125, 1.542633056640625, 1.64892578125, 1.755218505859375, 1.86151123046875, 1.967803955078125, 2.0740966796875, 2.180389404296875, 2.28668212890625, 2.392974853515625, 2.499267578125, 2.605560302734375, 2.71185302734375, 2.818145751953125, 2.9244384765625, 3.030731201171875, 3.13702392578125, 3.243316650390625, 3.349609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 10.0, 14.0, 14.0, 11.0, 7.0, 18.0, 18.0, 23.0, 20.0, 31.0, 32.0, 26.0, 31.0, 39.0, 35.0, 43.0, 41.0, 17.0, 38.0, 29.0, 31.0, 41.0, 33.0, 36.0, 37.0, 32.0, 33.0, 36.0, 34.0, 35.0, 23.0, 21.0, 17.0, 19.0, 19.0, 8.0, 12.0, 13.0, 5.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.03216552734375, -5.8221435546875, -5.61212158203125, -5.402099609375, -5.19207763671875, -4.9820556640625, -4.77203369140625, -4.56201171875, -4.35198974609375, -4.1419677734375, -3.93194580078125, -3.721923828125, -3.51190185546875, -3.3018798828125, -3.09185791015625, -2.8818359375, -2.67181396484375, -2.4617919921875, -2.25177001953125, -2.041748046875, -1.83172607421875, -1.6217041015625, -1.41168212890625, -1.20166015625, -0.99163818359375, -0.7816162109375, -0.57159423828125, -0.361572265625, -0.15155029296875, 0.0584716796875, 0.26849365234375, 0.478515625, 0.68853759765625, 0.8985595703125, 1.10858154296875, 1.318603515625, 1.52862548828125, 1.7386474609375, 1.94866943359375, 2.15869140625, 2.36871337890625, 2.5787353515625, 2.78875732421875, 2.998779296875, 3.20880126953125, 3.4188232421875, 3.62884521484375, 3.8388671875, 4.04888916015625, 4.2589111328125, 4.46893310546875, 4.678955078125, 4.88897705078125, 5.0989990234375, 5.30902099609375, 5.51904296875, 5.72906494140625, 5.9390869140625, 6.14910888671875, 6.359130859375, 6.56915283203125, 6.7791748046875, 6.98919677734375, 7.19921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 9.0, 9.0, 18.0, 26.0, 45.0, 57.0, 73.0, 87.0, 170.0, 240.0, 380.0, 642.0, 1067.0, 1837.0, 2952.0, 4847.0, 8115.0, 13315.0, 22845.0, 59805.0, 696082.0, 165768.0, 29010.0, 16271.0, 9862.0, 5986.0, 3491.0, 2091.0, 1266.0, 792.0, 479.0, 303.0, 182.0, 135.0, 76.0, 53.0, 47.0, 26.0, 20.0, 13.0, 16.0, 10.0, 6.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.538330078125, -8.24072265625, -7.943115234375, -7.6455078125, -7.347900390625, -7.05029296875, -6.752685546875, -6.455078125, -6.157470703125, -5.85986328125, -5.562255859375, -5.2646484375, -4.967041015625, -4.66943359375, -4.371826171875, -4.07421875, -3.776611328125, -3.47900390625, -3.181396484375, -2.8837890625, -2.586181640625, -2.28857421875, -1.990966796875, -1.693359375, -1.395751953125, -1.09814453125, -0.800537109375, -0.5029296875, -0.205322265625, 0.09228515625, 0.389892578125, 0.6875, 0.985107421875, 1.28271484375, 1.580322265625, 1.8779296875, 2.175537109375, 2.47314453125, 2.770751953125, 3.068359375, 3.365966796875, 3.66357421875, 3.961181640625, 4.2587890625, 4.556396484375, 4.85400390625, 5.151611328125, 5.44921875, 5.746826171875, 6.04443359375, 6.342041015625, 6.6396484375, 6.937255859375, 7.23486328125, 7.532470703125, 7.830078125, 8.127685546875, 8.42529296875, 8.722900390625, 9.0205078125, 9.318115234375, 9.61572265625, 9.913330078125, 10.2109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 3.0, 6.0, 7.0, 5.0, 7.0, 8.0, 4.0, 20.0, 14.0, 20.0, 21.0, 25.0, 20.0, 21.0, 36.0, 34.0, 36.0, 34.0, 32.0, 40.0, 37.0, 34.0, 29.0, 41.0, 35.0, 45.0, 26.0, 34.0, 28.0, 42.0, 31.0, 21.0, 25.0, 19.0, 27.0, 21.0, 24.0, 10.0, 10.0, 9.0, 14.0, 10.0, 8.0, 9.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.79296875, -7.55767822265625, -7.3223876953125, -7.08709716796875, -6.851806640625, -6.61651611328125, -6.3812255859375, -6.14593505859375, -5.91064453125, -5.67535400390625, -5.4400634765625, -5.20477294921875, -4.969482421875, -4.73419189453125, -4.4989013671875, -4.26361083984375, -4.0283203125, -3.79302978515625, -3.5577392578125, -3.32244873046875, -3.087158203125, -2.85186767578125, -2.6165771484375, -2.38128662109375, -2.14599609375, -1.91070556640625, -1.6754150390625, -1.44012451171875, -1.204833984375, -0.96954345703125, -0.7342529296875, -0.49896240234375, -0.263671875, -0.02838134765625, 0.2069091796875, 0.44219970703125, 0.677490234375, 0.91278076171875, 1.1480712890625, 1.38336181640625, 1.61865234375, 1.85394287109375, 2.0892333984375, 2.32452392578125, 2.559814453125, 2.79510498046875, 3.0303955078125, 3.26568603515625, 3.5009765625, 3.73626708984375, 3.9715576171875, 4.20684814453125, 4.442138671875, 4.67742919921875, 4.9127197265625, 5.14801025390625, 5.38330078125, 5.61859130859375, 5.8538818359375, 6.08917236328125, 6.324462890625, 6.55975341796875, 6.7950439453125, 7.03033447265625, 7.265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 10.0, 18.0, 25.0, 18.0, 34.0, 50.0, 61.0, 93.0, 150.0, 214.0, 300.0, 455.0, 693.0, 947.0, 1479.0, 2196.0, 3532.0, 5670.0, 9141.0, 15828.0, 31980.0, 161398.0, 652606.0, 98642.0, 26368.0, 14037.0, 8179.0, 4956.0, 3187.0, 2083.0, 1362.0, 851.0, 637.0, 434.0, 297.0, 182.0, 117.0, 94.0, 60.0, 46.0, 38.0, 29.0, 15.0, 11.0, 5.0, 14.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.53125, -1.480865478515625, -1.43048095703125, -1.380096435546875, -1.3297119140625, -1.279327392578125, -1.22894287109375, -1.178558349609375, -1.128173828125, -1.077789306640625, -1.02740478515625, -0.977020263671875, -0.9266357421875, -0.876251220703125, -0.82586669921875, -0.775482177734375, -0.72509765625, -0.674713134765625, -0.62432861328125, -0.573944091796875, -0.5235595703125, -0.473175048828125, -0.42279052734375, -0.372406005859375, -0.322021484375, -0.271636962890625, -0.22125244140625, -0.170867919921875, -0.1204833984375, -0.070098876953125, -0.01971435546875, 0.030670166015625, 0.0810546875, 0.131439208984375, 0.18182373046875, 0.232208251953125, 0.2825927734375, 0.332977294921875, 0.38336181640625, 0.433746337890625, 0.484130859375, 0.534515380859375, 0.58489990234375, 0.635284423828125, 0.6856689453125, 0.736053466796875, 0.78643798828125, 0.836822509765625, 0.88720703125, 0.937591552734375, 0.98797607421875, 1.038360595703125, 1.0887451171875, 1.139129638671875, 1.18951416015625, 1.239898681640625, 1.290283203125, 1.340667724609375, 1.39105224609375, 1.441436767578125, 1.4918212890625, 1.542205810546875, 1.59259033203125, 1.642974853515625, 1.693359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 16.0, 16.0, 27.0, 34.0, 46.0, 54.0, 59.0, 85.0, 79.0, 102.0, 93.0, 81.0, 66.0, 58.0, 33.0, 35.0, 22.0, 19.0, 10.0, 12.0, 9.0, 7.0, 3.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00103759765625, -0.0010055601596832275, -0.0009735226631164551, -0.0009414851665496826, -0.0009094476699829102, -0.0008774101734161377, -0.0008453726768493652, -0.0008133351802825928, -0.0007812976837158203, -0.0007492601871490479, -0.0007172226905822754, -0.0006851851940155029, -0.0006531476974487305, -0.000621110200881958, -0.0005890727043151855, -0.0005570352077484131, -0.0005249977111816406, -0.0004929602146148682, -0.0004609227180480957, -0.00042888522148132324, -0.0003968477249145508, -0.0003648102283477783, -0.00033277273178100586, -0.0003007352352142334, -0.00026869773864746094, -0.00023666024208068848, -0.00020462274551391602, -0.00017258524894714355, -0.0001405477523803711, -0.00010851025581359863, -7.647275924682617e-05, -4.443526268005371e-05, -1.239776611328125e-05, 1.963973045349121e-05, 5.167722702026367e-05, 8.371472358703613e-05, 0.0001157522201538086, 0.00014778971672058105, 0.00017982721328735352, 0.00021186470985412598, 0.00024390220642089844, 0.0002759397029876709, 0.00030797719955444336, 0.0003400146961212158, 0.0003720521926879883, 0.00040408968925476074, 0.0004361271858215332, 0.00046816468238830566, 0.0005002021789550781, 0.0005322396755218506, 0.000564277172088623, 0.0005963146686553955, 0.000628352165222168, 0.0006603896617889404, 0.0006924271583557129, 0.0007244646549224854, 0.0007565021514892578, 0.0007885396480560303, 0.0008205771446228027, 0.0008526146411895752, 0.0008846521377563477, 0.0009166896343231201, 0.0009487271308898926, 0.000980764627456665, 0.0010128021240234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 4.0, 7.0, 7.0, 10.0, 21.0, 23.0, 43.0, 61.0, 92.0, 148.0, 209.0, 279.0, 508.0, 795.0, 1424.0, 2519.0, 4710.0, 9746.0, 22608.0, 58002.0, 150728.0, 299153.0, 278194.0, 131525.0, 49784.0, 19592.0, 8577.0, 4163.0, 2223.0, 1222.0, 744.0, 472.0, 313.0, 199.0, 159.0, 89.0, 72.0, 38.0, 24.0, 18.0, 18.0, 12.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.30859375, -1.2688446044921875, -1.229095458984375, -1.1893463134765625, -1.14959716796875, -1.1098480224609375, -1.070098876953125, -1.0303497314453125, -0.9906005859375, -0.9508514404296875, -0.911102294921875, -0.8713531494140625, -0.83160400390625, -0.7918548583984375, -0.752105712890625, -0.7123565673828125, -0.672607421875, -0.6328582763671875, -0.593109130859375, -0.5533599853515625, -0.51361083984375, -0.4738616943359375, -0.434112548828125, -0.3943634033203125, -0.3546142578125, -0.3148651123046875, -0.275115966796875, -0.2353668212890625, -0.19561767578125, -0.1558685302734375, -0.116119384765625, -0.0763702392578125, -0.03662109375, 0.0031280517578125, 0.042877197265625, 0.0826263427734375, 0.12237548828125, 0.1621246337890625, 0.201873779296875, 0.2416229248046875, 0.2813720703125, 0.3211212158203125, 0.360870361328125, 0.4006195068359375, 0.44036865234375, 0.4801177978515625, 0.519866943359375, 0.5596160888671875, 0.599365234375, 0.6391143798828125, 0.678863525390625, 0.7186126708984375, 0.75836181640625, 0.7981109619140625, 0.837860107421875, 0.8776092529296875, 0.9173583984375, 0.9571075439453125, 0.996856689453125, 1.0366058349609375, 1.07635498046875, 1.1161041259765625, 1.155853271484375, 1.1956024169921875, 1.2353515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 7.0, 7.0, 16.0, 9.0, 21.0, 28.0, 27.0, 36.0, 54.0, 48.0, 56.0, 69.0, 81.0, 77.0, 66.0, 72.0, 57.0, 61.0, 45.0, 33.0, 23.0, 22.0, 19.0, 16.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.373779296875, -0.3635826110839844, -0.35338592529296875, -0.3431892395019531, -0.3329925537109375, -0.3227958679199219, -0.31259918212890625, -0.3024024963378906, -0.292205810546875, -0.2820091247558594, -0.27181243896484375, -0.2616157531738281, -0.2514190673828125, -0.24122238159179688, -0.23102569580078125, -0.22082901000976562, -0.21063232421875, -0.20043563842773438, -0.19023895263671875, -0.18004226684570312, -0.1698455810546875, -0.15964889526367188, -0.14945220947265625, -0.13925552368164062, -0.129058837890625, -0.11886215209960938, -0.10866546630859375, -0.09846878051757812, -0.0882720947265625, -0.07807540893554688, -0.06787872314453125, -0.057682037353515625, -0.0474853515625, -0.037288665771484375, -0.02709197998046875, -0.016895294189453125, -0.0066986083984375, 0.003498077392578125, 0.01369476318359375, 0.023891448974609375, 0.034088134765625, 0.044284820556640625, 0.05448150634765625, 0.06467819213867188, 0.0748748779296875, 0.08507156372070312, 0.09526824951171875, 0.10546493530273438, 0.11566162109375, 0.12585830688476562, 0.13605499267578125, 0.14625167846679688, 0.1564483642578125, 0.16664505004882812, 0.17684173583984375, 0.18703842163085938, 0.197235107421875, 0.20743179321289062, 0.21762847900390625, 0.22782516479492188, 0.2380218505859375, 0.24821853637695312, 0.25841522216796875, 0.2686119079589844, 0.27880859375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 9.0, 5.0, 16.0, 6.0, 16.0, 20.0, 22.0, 20.0, 22.0, 35.0, 29.0, 28.0, 33.0, 35.0, 41.0, 41.0, 39.0, 53.0, 41.0, 50.0, 49.0, 48.0, 42.0, 31.0, 35.0, 31.0, 35.0, 14.0, 20.0, 21.0, 10.0, 16.0, 15.0, 10.0, 8.0, 9.0, 5.0, 6.0, 2.0, 7.0, 7.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.698208808898926, -5.498865127563477, -5.299520969390869, -5.10017728805542, -4.900833606719971, -4.701489448547363, -4.502145767211914, -4.302802085876465, -4.103458404541016, -3.9041144847869873, -3.704770803451538, -3.5054268836975098, -3.3060832023620605, -3.1067392826080322, -2.907395362854004, -2.7080516815185547, -2.5087075233459473, -2.309363603591919, -2.1100199222564697, -1.9106760025024414, -1.7113322019577026, -1.5119884014129639, -1.3126444816589355, -1.1133006811141968, -0.913956880569458, -0.7146130800247192, -0.5152692198753357, -0.31592535972595215, -0.11658155918121338, 0.08276224136352539, 0.2821061611175537, 0.4814499616622925, 0.6807937622070312, 0.88013756275177, 1.0794813632965088, 1.278825283050537, 1.4781690835952759, 1.6775128841400146, 1.876856803894043, 2.076200485229492, 2.2755444049835205, 2.474888324737549, 2.674232006072998, 2.8735759258270264, 3.0729198455810547, 3.272263526916504, 3.4716074466705322, 3.6709513664245605, 3.8702950477600098, 4.069638729095459, 4.268982887268066, 4.468326568603516, 4.667670249938965, 4.867013931274414, 5.0663580894470215, 5.265701770782471, 5.465045928955078, 5.664389610290527, 5.863733768463135, 6.063077449798584, 6.262421131134033, 6.461765289306641, 6.66110897064209, 6.860452651977539, 7.059796333312988]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 9.0, 11.0, 13.0, 15.0, 11.0, 12.0, 12.0, 17.0, 19.0, 20.0, 27.0, 25.0, 23.0, 30.0, 41.0, 34.0, 26.0, 36.0, 38.0, 32.0, 39.0, 34.0, 46.0, 36.0, 35.0, 32.0, 30.0, 29.0, 24.0, 30.0, 34.0, 25.0, 21.0, 24.0, 18.0, 18.0, 15.0, 16.0, 7.0, 4.0, 5.0, 6.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.959095478057861, -5.7669830322265625, -5.5748701095581055, -5.382757663726807, -5.190645217895508, -4.998532772064209, -4.80642032623291, -4.614307403564453, -4.422194957733154, -4.2300825119018555, -4.037969589233398, -3.8458571434020996, -3.653744697570801, -3.461632251739502, -3.269519567489624, -3.077406883239746, -2.8852944374084473, -2.6931819915771484, -2.5010693073272705, -2.3089566230773926, -2.1168441772460938, -1.9247316122055054, -1.732619047164917, -1.5405064821243286, -1.3483939170837402, -1.1562813520431519, -0.9641687870025635, -0.7720562219619751, -0.5799436569213867, -0.38783109188079834, -0.19571852684020996, -0.003605961799621582, 0.1885061264038086, 0.380618691444397, 0.5727312564849854, 0.7648438215255737, 0.9569563865661621, 1.1490689516067505, 1.3411815166473389, 1.5332940816879272, 1.7254066467285156, 1.917519211769104, 2.1096317768096924, 2.3017444610595703, 2.493856906890869, 2.685969352722168, 2.878082036972046, 3.070194721221924, 3.2623071670532227, 3.4544196128845215, 3.6465322971343994, 3.8386449813842773, 4.030757427215576, 4.222869873046875, 4.414982795715332, 4.607095241546631, 4.79920768737793, 4.9913201332092285, 5.183432579040527, 5.375545501708984, 5.567657947540283, 5.759770393371582, 5.951883316040039, 6.143995761871338, 6.336108207702637]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 8.0, 9.0, 10.0, 18.0, 33.0, 57.0, 73.0, 118.0, 203.0, 305.0, 455.0, 743.0, 1148.0, 1803.0, 2923.0, 4634.0, 7396.0, 11439.0, 17620.0, 26824.0, 39235.0, 55530.0, 74814.0, 94403.0, 108605.0, 116831.0, 112502.0, 98986.0, 80572.0, 61371.0, 43932.0, 30148.0, 20017.0, 12978.0, 8423.0, 5286.0, 3326.0, 2163.0, 1339.0, 837.0, 511.0, 323.0, 205.0, 129.0, 104.0, 62.0, 38.0, 23.0, 17.0, 11.0, 12.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.96484375, -4.8079833984375, -4.651123046875, -4.4942626953125, -4.33740234375, -4.1805419921875, -4.023681640625, -3.8668212890625, -3.7099609375, -3.5531005859375, -3.396240234375, -3.2393798828125, -3.08251953125, -2.9256591796875, -2.768798828125, -2.6119384765625, -2.455078125, -2.2982177734375, -2.141357421875, -1.9844970703125, -1.82763671875, -1.6707763671875, -1.513916015625, -1.3570556640625, -1.2001953125, -1.0433349609375, -0.886474609375, -0.7296142578125, -0.57275390625, -0.4158935546875, -0.259033203125, -0.1021728515625, 0.0546875, 0.2115478515625, 0.368408203125, 0.5252685546875, 0.68212890625, 0.8389892578125, 0.995849609375, 1.1527099609375, 1.3095703125, 1.4664306640625, 1.623291015625, 1.7801513671875, 1.93701171875, 2.0938720703125, 2.250732421875, 2.4075927734375, 2.564453125, 2.7213134765625, 2.878173828125, 3.0350341796875, 3.19189453125, 3.3487548828125, 3.505615234375, 3.6624755859375, 3.8193359375, 3.9761962890625, 4.133056640625, 4.2899169921875, 4.44677734375, 4.6036376953125, 4.760498046875, 4.9173583984375, 5.07421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 9.0, 12.0, 13.0, 11.0, 10.0, 14.0, 16.0, 24.0, 20.0, 18.0, 29.0, 29.0, 29.0, 21.0, 39.0, 31.0, 30.0, 46.0, 25.0, 42.0, 42.0, 48.0, 44.0, 32.0, 18.0, 38.0, 37.0, 29.0, 19.0, 24.0, 24.0, 33.0, 25.0, 24.0, 22.0, 12.0, 15.0, 5.0, 8.0, 9.0, 5.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.71484375, -5.5220947265625, -5.329345703125, -5.1365966796875, -4.94384765625, -4.7510986328125, -4.558349609375, -4.3656005859375, -4.1728515625, -3.9801025390625, -3.787353515625, -3.5946044921875, -3.40185546875, -3.2091064453125, -3.016357421875, -2.8236083984375, -2.630859375, -2.4381103515625, -2.245361328125, -2.0526123046875, -1.85986328125, -1.6671142578125, -1.474365234375, -1.2816162109375, -1.0888671875, -0.8961181640625, -0.703369140625, -0.5106201171875, -0.31787109375, -0.1251220703125, 0.067626953125, 0.2603759765625, 0.453125, 0.6458740234375, 0.838623046875, 1.0313720703125, 1.22412109375, 1.4168701171875, 1.609619140625, 1.8023681640625, 1.9951171875, 2.1878662109375, 2.380615234375, 2.5733642578125, 2.76611328125, 2.9588623046875, 3.151611328125, 3.3443603515625, 3.537109375, 3.7298583984375, 3.922607421875, 4.1153564453125, 4.30810546875, 4.5008544921875, 4.693603515625, 4.8863525390625, 5.0791015625, 5.2718505859375, 5.464599609375, 5.6573486328125, 5.85009765625, 6.0428466796875, 6.235595703125, 6.4283447265625, 6.62109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 9.0, 12.0, 13.0, 22.0, 32.0, 46.0, 63.0, 108.0, 129.0, 211.0, 328.0, 494.0, 700.0, 1042.0, 1676.0, 2230.0, 3470.0, 5149.0, 7348.0, 10918.0, 15946.0, 22801.0, 31826.0, 43500.0, 57667.0, 73554.0, 87849.0, 98670.0, 102109.0, 99534.0, 89444.0, 75451.0, 60572.0, 45512.0, 33562.0, 23793.0, 16751.0, 11428.0, 7810.0, 5408.0, 3679.0, 2593.0, 1674.0, 1108.0, 733.0, 540.0, 355.0, 215.0, 177.0, 102.0, 71.0, 42.0, 37.0, 12.0, 18.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0], "bins": [-5.37109375, -5.20098876953125, -5.0308837890625, -4.86077880859375, -4.690673828125, -4.52056884765625, -4.3504638671875, -4.18035888671875, -4.01025390625, -3.84014892578125, -3.6700439453125, -3.49993896484375, -3.329833984375, -3.15972900390625, -2.9896240234375, -2.81951904296875, -2.6494140625, -2.47930908203125, -2.3092041015625, -2.13909912109375, -1.968994140625, -1.79888916015625, -1.6287841796875, -1.45867919921875, -1.28857421875, -1.11846923828125, -0.9483642578125, -0.77825927734375, -0.608154296875, -0.43804931640625, -0.2679443359375, -0.09783935546875, 0.072265625, 0.24237060546875, 0.4124755859375, 0.58258056640625, 0.752685546875, 0.92279052734375, 1.0928955078125, 1.26300048828125, 1.43310546875, 1.60321044921875, 1.7733154296875, 1.94342041015625, 2.113525390625, 2.28363037109375, 2.4537353515625, 2.62384033203125, 2.7939453125, 2.96405029296875, 3.1341552734375, 3.30426025390625, 3.474365234375, 3.64447021484375, 3.8145751953125, 3.98468017578125, 4.15478515625, 4.32489013671875, 4.4949951171875, 4.66510009765625, 4.835205078125, 5.00531005859375, 5.1754150390625, 5.34552001953125, 5.515625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 4.0, 9.0, 13.0, 11.0, 11.0, 14.0, 15.0, 18.0, 16.0, 16.0, 35.0, 35.0, 24.0, 37.0, 36.0, 45.0, 34.0, 43.0, 47.0, 33.0, 44.0, 58.0, 40.0, 49.0, 43.0, 35.0, 35.0, 29.0, 32.0, 33.0, 20.0, 19.0, 7.0, 10.0, 15.0, 7.0, 8.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.63671875, -4.493896484375, -4.35107421875, -4.208251953125, -4.0654296875, -3.922607421875, -3.77978515625, -3.636962890625, -3.494140625, -3.351318359375, -3.20849609375, -3.065673828125, -2.9228515625, -2.780029296875, -2.63720703125, -2.494384765625, -2.3515625, -2.208740234375, -2.06591796875, -1.923095703125, -1.7802734375, -1.637451171875, -1.49462890625, -1.351806640625, -1.208984375, -1.066162109375, -0.92333984375, -0.780517578125, -0.6376953125, -0.494873046875, -0.35205078125, -0.209228515625, -0.06640625, 0.076416015625, 0.21923828125, 0.362060546875, 0.5048828125, 0.647705078125, 0.79052734375, 0.933349609375, 1.076171875, 1.218994140625, 1.36181640625, 1.504638671875, 1.6474609375, 1.790283203125, 1.93310546875, 2.075927734375, 2.21875, 2.361572265625, 2.50439453125, 2.647216796875, 2.7900390625, 2.932861328125, 3.07568359375, 3.218505859375, 3.361328125, 3.504150390625, 3.64697265625, 3.789794921875, 3.9326171875, 4.075439453125, 4.21826171875, 4.361083984375, 4.50390625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 7.0, 16.0, 33.0, 27.0, 47.0, 59.0, 118.0, 150.0, 202.0, 348.0, 500.0, 790.0, 1271.0, 1799.0, 3080.0, 5291.0, 8601.0, 14460.0, 24457.0, 41004.0, 66415.0, 99241.0, 133659.0, 153839.0, 147605.0, 120802.0, 85771.0, 55449.0, 33498.0, 19978.0, 11807.0, 6983.0, 4101.0, 2629.0, 1515.0, 1015.0, 648.0, 446.0, 298.0, 212.0, 102.0, 95.0, 54.0, 43.0, 31.0, 18.0, 15.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.27734375, -2.207916259765625, -2.13848876953125, -2.069061279296875, -1.9996337890625, -1.930206298828125, -1.86077880859375, -1.791351318359375, -1.721923828125, -1.652496337890625, -1.58306884765625, -1.513641357421875, -1.4442138671875, -1.374786376953125, -1.30535888671875, -1.235931396484375, -1.16650390625, -1.097076416015625, -1.02764892578125, -0.958221435546875, -0.8887939453125, -0.819366455078125, -0.74993896484375, -0.680511474609375, -0.611083984375, -0.541656494140625, -0.47222900390625, -0.402801513671875, -0.3333740234375, -0.263946533203125, -0.19451904296875, -0.125091552734375, -0.0556640625, 0.013763427734375, 0.08319091796875, 0.152618408203125, 0.2220458984375, 0.291473388671875, 0.36090087890625, 0.430328369140625, 0.499755859375, 0.569183349609375, 0.63861083984375, 0.708038330078125, 0.7774658203125, 0.846893310546875, 0.91632080078125, 0.985748291015625, 1.05517578125, 1.124603271484375, 1.19403076171875, 1.263458251953125, 1.3328857421875, 1.402313232421875, 1.47174072265625, 1.541168212890625, 1.610595703125, 1.680023193359375, 1.74945068359375, 1.818878173828125, 1.8883056640625, 1.957733154296875, 2.02716064453125, 2.096588134765625, 2.166015625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 2.0, 3.0, 5.0, 9.0, 6.0, 12.0, 25.0, 16.0, 16.0, 20.0, 26.0, 40.0, 35.0, 40.0, 40.0, 39.0, 36.0, 42.0, 50.0, 35.0, 45.0, 50.0, 47.0, 53.0, 36.0, 26.0, 38.0, 32.0, 22.0, 20.0, 21.0, 12.0, 17.0, 17.0, 14.0, 5.0, 6.0, 6.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.00023603439331054688, -0.00022898614406585693, -0.000221937894821167, -0.00021488964557647705, -0.0002078413963317871, -0.00020079314708709717, -0.00019374489784240723, -0.00018669664859771729, -0.00017964839935302734, -0.0001726001501083374, -0.00016555190086364746, -0.00015850365161895752, -0.00015145540237426758, -0.00014440715312957764, -0.0001373589038848877, -0.00013031065464019775, -0.0001232624053955078, -0.00011621415615081787, -0.00010916590690612793, -0.00010211765766143799, -9.506940841674805e-05, -8.80211591720581e-05, -8.097290992736816e-05, -7.392466068267822e-05, -6.687641143798828e-05, -5.982816219329834e-05, -5.27799129486084e-05, -4.573166370391846e-05, -3.8683414459228516e-05, -3.1635165214538574e-05, -2.4586915969848633e-05, -1.753866672515869e-05, -1.049041748046875e-05, -3.4421682357788086e-06, 3.606081008911133e-06, 1.0654330253601074e-05, 1.7702579498291016e-05, 2.4750828742980957e-05, 3.17990779876709e-05, 3.884732723236084e-05, 4.589557647705078e-05, 5.294382572174072e-05, 5.9992074966430664e-05, 6.70403242111206e-05, 7.408857345581055e-05, 8.113682270050049e-05, 8.818507194519043e-05, 9.523332118988037e-05, 0.00010228157043457031, 0.00010932981967926025, 0.0001163780689239502, 0.00012342631816864014, 0.00013047456741333008, 0.00013752281665802002, 0.00014457106590270996, 0.0001516193151473999, 0.00015866756439208984, 0.00016571581363677979, 0.00017276406288146973, 0.00017981231212615967, 0.0001868605613708496, 0.00019390881061553955, 0.0002009570598602295, 0.00020800530910491943, 0.00021505355834960938]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 16.0, 10.0, 35.0, 28.0, 58.0, 69.0, 123.0, 191.0, 308.0, 549.0, 884.0, 1611.0, 2742.0, 4833.0, 8460.0, 15763.0, 27893.0, 47737.0, 77384.0, 114224.0, 146935.0, 159387.0, 144876.0, 111944.0, 75567.0, 45932.0, 26882.0, 14939.0, 8246.0, 4658.0, 2576.0, 1506.0, 864.0, 507.0, 290.0, 194.0, 121.0, 71.0, 51.0, 29.0, 24.0, 14.0, 9.0, 5.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.341796875, -2.271820068359375, -2.20184326171875, -2.131866455078125, -2.0618896484375, -1.991912841796875, -1.92193603515625, -1.851959228515625, -1.781982421875, -1.712005615234375, -1.64202880859375, -1.572052001953125, -1.5020751953125, -1.432098388671875, -1.36212158203125, -1.292144775390625, -1.22216796875, -1.152191162109375, -1.08221435546875, -1.012237548828125, -0.9422607421875, -0.872283935546875, -0.80230712890625, -0.732330322265625, -0.662353515625, -0.592376708984375, -0.52239990234375, -0.452423095703125, -0.3824462890625, -0.312469482421875, -0.24249267578125, -0.172515869140625, -0.1025390625, -0.032562255859375, 0.03741455078125, 0.107391357421875, 0.1773681640625, 0.247344970703125, 0.31732177734375, 0.387298583984375, 0.457275390625, 0.527252197265625, 0.59722900390625, 0.667205810546875, 0.7371826171875, 0.807159423828125, 0.87713623046875, 0.947113037109375, 1.01708984375, 1.087066650390625, 1.15704345703125, 1.227020263671875, 1.2969970703125, 1.366973876953125, 1.43695068359375, 1.506927490234375, 1.576904296875, 1.646881103515625, 1.71685791015625, 1.786834716796875, 1.8568115234375, 1.926788330078125, 1.99676513671875, 2.066741943359375, 2.13671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 8.0, 12.0, 23.0, 12.0, 14.0, 12.0, 28.0, 27.0, 34.0, 36.0, 59.0, 44.0, 41.0, 37.0, 64.0, 39.0, 60.0, 46.0, 40.0, 48.0, 37.0, 25.0, 43.0, 27.0, 36.0, 26.0, 18.0, 18.0, 16.0, 7.0, 12.0, 5.0, 4.0, 5.0, 4.0, 0.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.82568359375, -0.8009490966796875, -0.776214599609375, -0.7514801025390625, -0.72674560546875, -0.7020111083984375, -0.677276611328125, -0.6525421142578125, -0.6278076171875, -0.6030731201171875, -0.578338623046875, -0.5536041259765625, -0.52886962890625, -0.5041351318359375, -0.479400634765625, -0.4546661376953125, -0.429931640625, -0.4051971435546875, -0.380462646484375, -0.3557281494140625, -0.33099365234375, -0.3062591552734375, -0.281524658203125, -0.2567901611328125, -0.2320556640625, -0.2073211669921875, -0.182586669921875, -0.1578521728515625, -0.13311767578125, -0.1083831787109375, -0.083648681640625, -0.0589141845703125, -0.0341796875, -0.0094451904296875, 0.015289306640625, 0.0400238037109375, 0.06475830078125, 0.0894927978515625, 0.114227294921875, 0.1389617919921875, 0.1636962890625, 0.1884307861328125, 0.213165283203125, 0.2378997802734375, 0.26263427734375, 0.2873687744140625, 0.312103271484375, 0.3368377685546875, 0.361572265625, 0.3863067626953125, 0.411041259765625, 0.4357757568359375, 0.46051025390625, 0.4852447509765625, 0.509979248046875, 0.5347137451171875, 0.5594482421875, 0.5841827392578125, 0.608917236328125, 0.6336517333984375, 0.65838623046875, 0.6831207275390625, 0.707855224609375, 0.7325897216796875, 0.75732421875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 4.0, 6.0, 4.0, 4.0, 4.0, 9.0, 9.0, 11.0, 15.0, 16.0, 18.0, 23.0, 22.0, 31.0, 24.0, 32.0, 37.0, 33.0, 42.0, 50.0, 48.0, 50.0, 46.0, 32.0, 51.0, 31.0, 48.0, 39.0, 34.0, 30.0, 26.0, 28.0, 21.0, 24.0, 17.0, 11.0, 12.0, 13.0, 6.0, 6.0, 6.0, 13.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.7316789627075195, -5.538595676422119, -5.345512390136719, -5.152429103851318, -4.959345817565918, -4.766262531280518, -4.573179244995117, -4.380095958709717, -4.187012672424316, -3.993929386138916, -3.8008460998535156, -3.6077628135681152, -3.414679527282715, -3.2215962409973145, -3.028512954711914, -2.8354296684265137, -2.6423463821411133, -2.449263095855713, -2.2561798095703125, -2.063096523284912, -1.8700132369995117, -1.6769299507141113, -1.483846664428711, -1.2907633781433105, -1.0976800918579102, -0.9045968055725098, -0.7115135192871094, -0.518430233001709, -0.3253469467163086, -0.1322636604309082, 0.06081962585449219, 0.2539029121398926, 0.44698572158813477, 0.6400690078735352, 0.8331522941589355, 1.026235580444336, 1.2193188667297363, 1.4124021530151367, 1.605485439300537, 1.7985687255859375, 1.991652011871338, 2.1847352981567383, 2.3778185844421387, 2.570901870727539, 2.7639851570129395, 2.95706844329834, 3.1501517295837402, 3.3432350158691406, 3.536318302154541, 3.7294015884399414, 3.922484874725342, 4.115568161010742, 4.308651447296143, 4.501734733581543, 4.694818019866943, 4.887901306152344, 5.080984592437744, 5.2740678787231445, 5.467151165008545, 5.660234451293945, 5.853317737579346, 6.046401023864746, 6.2394843101501465, 6.432567596435547, 6.625650882720947]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 10.0, 8.0, 13.0, 13.0, 16.0, 10.0, 17.0, 19.0, 15.0, 24.0, 18.0, 19.0, 28.0, 30.0, 43.0, 36.0, 37.0, 41.0, 34.0, 26.0, 38.0, 42.0, 42.0, 26.0, 53.0, 32.0, 42.0, 29.0, 19.0, 27.0, 31.0, 24.0, 25.0, 25.0, 19.0, 6.0, 9.0, 10.0, 7.0, 6.0, 3.0, 5.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.826560974121094, -5.627845764160156, -5.4291300773620605, -5.230414867401123, -5.031699180603027, -4.83298397064209, -4.634268760681152, -4.435553073883057, -4.236837863922119, -4.038122653961182, -3.839406967163086, -3.6406917572021484, -3.441976308822632, -3.2432608604431152, -3.0445454120635986, -2.845829963684082, -2.6471145153045654, -2.448399066925049, -2.2496836185455322, -2.0509681701660156, -1.8522529602050781, -1.6535375118255615, -1.454822063446045, -1.2561067342758179, -1.0573912858963013, -0.8586758971214294, -0.6599605083465576, -0.461245059967041, -0.2625296711921692, -0.06381428241729736, 0.13490116596221924, 0.3336164951324463, 0.5323319435119629, 0.7310473322868347, 0.9297627210617065, 1.1284781694412231, 1.3271934986114502, 1.5259089469909668, 1.7246243953704834, 1.9233397245407104, 2.1220550537109375, 2.320770502090454, 2.5194859504699707, 2.718201160430908, 2.916916608810425, 3.1156320571899414, 3.314347505569458, 3.5130629539489746, 3.711778402328491, 3.910493850708008, 4.109209060668945, 4.307924747467041, 4.5066399574279785, 4.705355644226074, 4.904070854187012, 5.102786064147949, 5.301501750946045, 5.500216960906982, 5.698932647705078, 5.897647857666016, 6.096363544464111, 6.295078754425049, 6.4937944412231445, 6.692509651184082, 6.8912248611450195]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 2.0, 12.0, 9.0, 26.0, 33.0, 47.0, 89.0, 125.0, 209.0, 332.0, 550.0, 985.0, 1550.0, 2582.0, 4403.0, 7705.0, 13552.0, 24350.0, 43545.0, 79361.0, 144673.0, 259512.0, 435848.0, 634718.0, 741194.0, 669759.0, 476726.0, 287758.0, 161638.0, 88677.0, 48680.0, 27845.0, 15655.0, 8960.0, 5245.0, 3145.0, 1823.0, 1117.0, 656.0, 451.0, 251.0, 171.0, 118.0, 68.0, 56.0, 24.0, 23.0, 14.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.7421875, -5.5712890625, -5.400390625, -5.2294921875, -5.05859375, -4.8876953125, -4.716796875, -4.5458984375, -4.375, -4.2041015625, -4.033203125, -3.8623046875, -3.69140625, -3.5205078125, -3.349609375, -3.1787109375, -3.0078125, -2.8369140625, -2.666015625, -2.4951171875, -2.32421875, -2.1533203125, -1.982421875, -1.8115234375, -1.640625, -1.4697265625, -1.298828125, -1.1279296875, -0.95703125, -0.7861328125, -0.615234375, -0.4443359375, -0.2734375, -0.1025390625, 0.068359375, 0.2392578125, 0.41015625, 0.5810546875, 0.751953125, 0.9228515625, 1.09375, 1.2646484375, 1.435546875, 1.6064453125, 1.77734375, 1.9482421875, 2.119140625, 2.2900390625, 2.4609375, 2.6318359375, 2.802734375, 2.9736328125, 3.14453125, 3.3154296875, 3.486328125, 3.6572265625, 3.828125, 3.9990234375, 4.169921875, 4.3408203125, 4.51171875, 4.6826171875, 4.853515625, 5.0244140625, 5.1953125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 9.0, 12.0, 12.0, 6.0, 13.0, 9.0, 11.0, 18.0, 13.0, 17.0, 18.0, 17.0, 22.0, 21.0, 35.0, 30.0, 36.0, 31.0, 29.0, 37.0, 40.0, 36.0, 45.0, 34.0, 31.0, 31.0, 38.0, 32.0, 30.0, 34.0, 27.0, 32.0, 18.0, 25.0, 27.0, 21.0, 18.0, 11.0, 12.0, 13.0, 8.0, 8.0, 6.0, 4.0, 4.0, 1.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0], "bins": [-4.84375, -4.68548583984375, -4.5272216796875, -4.36895751953125, -4.210693359375, -4.05242919921875, -3.8941650390625, -3.73590087890625, -3.57763671875, -3.41937255859375, -3.2611083984375, -3.10284423828125, -2.944580078125, -2.78631591796875, -2.6280517578125, -2.46978759765625, -2.3115234375, -2.15325927734375, -1.9949951171875, -1.83673095703125, -1.678466796875, -1.52020263671875, -1.3619384765625, -1.20367431640625, -1.04541015625, -0.88714599609375, -0.7288818359375, -0.57061767578125, -0.412353515625, -0.25408935546875, -0.0958251953125, 0.06243896484375, 0.220703125, 0.37896728515625, 0.5372314453125, 0.69549560546875, 0.853759765625, 1.01202392578125, 1.1702880859375, 1.32855224609375, 1.48681640625, 1.64508056640625, 1.8033447265625, 1.96160888671875, 2.119873046875, 2.27813720703125, 2.4364013671875, 2.59466552734375, 2.7529296875, 2.91119384765625, 3.0694580078125, 3.22772216796875, 3.385986328125, 3.54425048828125, 3.7025146484375, 3.86077880859375, 4.01904296875, 4.17730712890625, 4.3355712890625, 4.49383544921875, 4.652099609375, 4.81036376953125, 4.9686279296875, 5.12689208984375, 5.28515625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 15.0, 15.0, 24.0, 40.0, 55.0, 82.0, 134.0, 220.0, 374.0, 571.0, 913.0, 1583.0, 2691.0, 4347.0, 7130.0, 12077.0, 20596.0, 34810.0, 58388.0, 97969.0, 161929.0, 258613.0, 392120.0, 538943.0, 636690.0, 607369.0, 481601.0, 332809.0, 213919.0, 132007.0, 79426.0, 47859.0, 27990.0, 16357.0, 9888.0, 5951.0, 3466.0, 2056.0, 1233.0, 745.0, 494.0, 274.0, 189.0, 119.0, 71.0, 55.0, 24.0, 17.0, 12.0, 9.0, 7.0, 10.0, 2.0, 3.0, 1.0, 1.0], "bins": [-5.72265625, -5.54815673828125, -5.3736572265625, -5.19915771484375, -5.024658203125, -4.85015869140625, -4.6756591796875, -4.50115966796875, -4.32666015625, -4.15216064453125, -3.9776611328125, -3.80316162109375, -3.628662109375, -3.45416259765625, -3.2796630859375, -3.10516357421875, -2.9306640625, -2.75616455078125, -2.5816650390625, -2.40716552734375, -2.232666015625, -2.05816650390625, -1.8836669921875, -1.70916748046875, -1.53466796875, -1.36016845703125, -1.1856689453125, -1.01116943359375, -0.836669921875, -0.66217041015625, -0.4876708984375, -0.31317138671875, -0.138671875, 0.03582763671875, 0.2103271484375, 0.38482666015625, 0.559326171875, 0.73382568359375, 0.9083251953125, 1.08282470703125, 1.25732421875, 1.43182373046875, 1.6063232421875, 1.78082275390625, 1.955322265625, 2.12982177734375, 2.3043212890625, 2.47882080078125, 2.6533203125, 2.82781982421875, 3.0023193359375, 3.17681884765625, 3.351318359375, 3.52581787109375, 3.7003173828125, 3.87481689453125, 4.04931640625, 4.22381591796875, 4.3983154296875, 4.57281494140625, 4.747314453125, 4.92181396484375, 5.0963134765625, 5.27081298828125, 5.4453125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 11.0, 10.0, 9.0, 18.0, 19.0, 20.0, 25.0, 37.0, 38.0, 44.0, 53.0, 71.0, 91.0, 115.0, 133.0, 127.0, 133.0, 171.0, 186.0, 185.0, 190.0, 192.0, 181.0, 213.0, 210.0, 178.0, 188.0, 174.0, 135.0, 144.0, 118.0, 106.0, 76.0, 84.0, 74.0, 54.0, 58.0, 46.0, 24.0, 29.0, 18.0, 14.0, 15.0, 10.0, 9.0, 9.0, 8.0, 2.0, 4.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-2.08203125, -2.01666259765625, -1.9512939453125, -1.88592529296875, -1.820556640625, -1.75518798828125, -1.6898193359375, -1.62445068359375, -1.55908203125, -1.49371337890625, -1.4283447265625, -1.36297607421875, -1.297607421875, -1.23223876953125, -1.1668701171875, -1.10150146484375, -1.0361328125, -0.97076416015625, -0.9053955078125, -0.84002685546875, -0.774658203125, -0.70928955078125, -0.6439208984375, -0.57855224609375, -0.51318359375, -0.44781494140625, -0.3824462890625, -0.31707763671875, -0.251708984375, -0.18634033203125, -0.1209716796875, -0.05560302734375, 0.009765625, 0.07513427734375, 0.1405029296875, 0.20587158203125, 0.271240234375, 0.33660888671875, 0.4019775390625, 0.46734619140625, 0.53271484375, 0.59808349609375, 0.6634521484375, 0.72882080078125, 0.794189453125, 0.85955810546875, 0.9249267578125, 0.99029541015625, 1.0556640625, 1.12103271484375, 1.1864013671875, 1.25177001953125, 1.317138671875, 1.38250732421875, 1.4478759765625, 1.51324462890625, 1.57861328125, 1.64398193359375, 1.7093505859375, 1.77471923828125, 1.840087890625, 1.90545654296875, 1.9708251953125, 2.03619384765625, 2.1015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 9.0, 10.0, 9.0, 8.0, 14.0, 22.0, 30.0, 20.0, 40.0, 33.0, 33.0, 18.0, 44.0, 51.0, 48.0, 34.0, 46.0, 47.0, 50.0, 42.0, 51.0, 44.0, 34.0, 29.0, 33.0, 31.0, 19.0, 10.0, 15.0, 25.0, 12.0, 13.0, 14.0, 16.0, 9.0, 2.0, 6.0, 2.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.817519187927246, -5.621379852294922, -5.425240516662598, -5.229101181030273, -5.032961845397949, -4.836822509765625, -4.640683174133301, -4.444543838500977, -4.248404502868652, -4.052265167236328, -3.856125831604004, -3.6599864959716797, -3.4638471603393555, -3.2677078247070312, -3.071568727493286, -2.875429391860962, -2.679290294647217, -2.4831509590148926, -2.2870116233825684, -2.090872287750244, -1.8947330713272095, -1.6985937356948853, -1.5024545192718506, -1.3063151836395264, -1.1101758480072021, -0.9140365123748779, -0.7178972363471985, -0.521757960319519, -0.3256186246871948, -0.1294792890548706, 0.06665992736816406, 0.2627992630004883, 0.4589385986328125, 0.6550779342651367, 0.8512172102928162, 1.0473564863204956, 1.2434958219528198, 1.439635157585144, 1.6357743740081787, 1.831913709640503, 2.028053045272827, 2.2241923809051514, 2.4203317165374756, 2.6164708137512207, 2.812610149383545, 3.008749485015869, 3.2048888206481934, 3.4010281562805176, 3.597167491912842, 3.793306827545166, 3.9894461631774902, 4.1855854988098145, 4.381724834442139, 4.577864170074463, 4.774003028869629, 4.970142364501953, 5.166281700134277, 5.362421035766602, 5.558560371398926, 5.75469970703125, 5.950839042663574, 6.146978378295898, 6.343117713928223, 6.539257049560547, 6.735396385192871]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 10.0, 6.0, 6.0, 2.0, 14.0, 11.0, 10.0, 23.0, 11.0, 15.0, 20.0, 22.0, 22.0, 29.0, 26.0, 28.0, 33.0, 29.0, 42.0, 31.0, 40.0, 39.0, 34.0, 37.0, 31.0, 20.0, 36.0, 37.0, 28.0, 26.0, 39.0, 42.0, 20.0, 30.0, 23.0, 21.0, 11.0, 21.0, 9.0, 9.0, 9.0, 9.0, 11.0, 3.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0], "bins": [-5.7941389083862305, -5.611611843109131, -5.429084300994873, -5.246557235717773, -5.064029693603516, -4.881502628326416, -4.698975563049316, -4.516448020935059, -4.333920955657959, -4.151393890380859, -3.9688663482666016, -3.786339282989502, -3.6038119792938232, -3.4212846755981445, -3.238757610321045, -3.056230306625366, -2.8737030029296875, -2.691175699234009, -2.50864839553833, -2.3261213302612305, -2.1435940265655518, -1.961066722869873, -1.7785395383834839, -1.5960123538970947, -1.413485050201416, -1.2309577465057373, -1.0484305620193481, -0.8659033179283142, -0.6833760738372803, -0.5008488297462463, -0.3183215856552124, -0.13579440116882324, 0.04673337936401367, 0.2292606234550476, 0.41178786754608154, 0.5943151116371155, 0.7768423557281494, 0.9593695998191833, 1.1418968439102173, 1.3244240283966064, 1.5069513320922852, 1.6894786357879639, 1.872005820274353, 2.054533004760742, 2.237060308456421, 2.4195876121520996, 2.602114677429199, 2.784641981124878, 2.9671692848205566, 3.1496965885162354, 3.332223892211914, 3.5147509574890137, 3.6972782611846924, 3.879805564880371, 4.062332630157471, 4.24485969543457, 4.427387237548828, 4.609914302825928, 4.7924418449401855, 4.974968910217285, 5.157496452331543, 5.340023517608643, 5.522550582885742, 5.705078125, 5.8876051902771]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 9.0, 25.0, 39.0, 50.0, 84.0, 132.0, 207.0, 321.0, 531.0, 851.0, 1305.0, 2114.0, 3238.0, 4994.0, 7761.0, 11247.0, 17023.0, 24292.0, 33886.0, 45620.0, 58960.0, 73895.0, 87051.0, 95564.0, 99577.0, 97255.0, 87665.0, 75040.0, 60654.0, 47423.0, 34754.0, 25215.0, 17227.0, 11884.0, 7997.0, 5228.0, 3455.0, 2203.0, 1408.0, 893.0, 525.0, 350.0, 214.0, 148.0, 80.0, 63.0, 44.0, 23.0, 15.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.408203125, -2.329376220703125, -2.25054931640625, -2.171722412109375, -2.0928955078125, -2.014068603515625, -1.93524169921875, -1.856414794921875, -1.777587890625, -1.698760986328125, -1.61993408203125, -1.541107177734375, -1.4622802734375, -1.383453369140625, -1.30462646484375, -1.225799560546875, -1.14697265625, -1.068145751953125, -0.98931884765625, -0.910491943359375, -0.8316650390625, -0.752838134765625, -0.67401123046875, -0.595184326171875, -0.516357421875, -0.437530517578125, -0.35870361328125, -0.279876708984375, -0.2010498046875, -0.122222900390625, -0.04339599609375, 0.035430908203125, 0.1142578125, 0.193084716796875, 0.27191162109375, 0.350738525390625, 0.4295654296875, 0.508392333984375, 0.58721923828125, 0.666046142578125, 0.744873046875, 0.823699951171875, 0.90252685546875, 0.981353759765625, 1.0601806640625, 1.139007568359375, 1.21783447265625, 1.296661376953125, 1.37548828125, 1.454315185546875, 1.53314208984375, 1.611968994140625, 1.6907958984375, 1.769622802734375, 1.84844970703125, 1.927276611328125, 2.006103515625, 2.084930419921875, 2.16375732421875, 2.242584228515625, 2.3214111328125, 2.400238037109375, 2.47906494140625, 2.557891845703125, 2.63671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 9.0, 9.0, 16.0, 10.0, 19.0, 17.0, 19.0, 23.0, 15.0, 26.0, 30.0, 36.0, 28.0, 26.0, 36.0, 42.0, 31.0, 37.0, 39.0, 37.0, 43.0, 40.0, 21.0, 42.0, 41.0, 32.0, 30.0, 41.0, 26.0, 31.0, 31.0, 13.0, 11.0, 18.0, 11.0, 5.0, 11.0, 9.0, 3.0, 4.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-5.8515625, -5.67071533203125, -5.4898681640625, -5.30902099609375, -5.128173828125, -4.94732666015625, -4.7664794921875, -4.58563232421875, -4.40478515625, -4.22393798828125, -4.0430908203125, -3.86224365234375, -3.681396484375, -3.50054931640625, -3.3197021484375, -3.13885498046875, -2.9580078125, -2.77716064453125, -2.5963134765625, -2.41546630859375, -2.234619140625, -2.05377197265625, -1.8729248046875, -1.69207763671875, -1.51123046875, -1.33038330078125, -1.1495361328125, -0.96868896484375, -0.787841796875, -0.60699462890625, -0.4261474609375, -0.24530029296875, -0.064453125, 0.11639404296875, 0.2972412109375, 0.47808837890625, 0.658935546875, 0.83978271484375, 1.0206298828125, 1.20147705078125, 1.38232421875, 1.56317138671875, 1.7440185546875, 1.92486572265625, 2.105712890625, 2.28656005859375, 2.4674072265625, 2.64825439453125, 2.8291015625, 3.00994873046875, 3.1907958984375, 3.37164306640625, 3.552490234375, 3.73333740234375, 3.9141845703125, 4.09503173828125, 4.27587890625, 4.45672607421875, 4.6375732421875, 4.81842041015625, 4.999267578125, 5.18011474609375, 5.3609619140625, 5.54180908203125, 5.72265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 2.0, 6.0, 11.0, 6.0, 11.0, 8.0, 18.0, 29.0, 36.0, 44.0, 75.0, 92.0, 113.0, 179.0, 293.0, 455.0, 753.0, 1263.0, 2348.0, 4129.0, 7273.0, 13111.0, 23282.0, 64055.0, 767606.0, 103197.0, 26521.0, 14557.0, 8053.0, 4635.0, 2590.0, 1463.0, 839.0, 467.0, 311.0, 199.0, 145.0, 108.0, 59.0, 59.0, 30.0, 31.0, 20.0, 11.0, 18.0, 5.0, 8.0, 6.0, 7.0, 6.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.46875, -10.1373291015625, -9.805908203125, -9.4744873046875, -9.14306640625, -8.8116455078125, -8.480224609375, -8.1488037109375, -7.8173828125, -7.4859619140625, -7.154541015625, -6.8231201171875, -6.49169921875, -6.1602783203125, -5.828857421875, -5.4974365234375, -5.166015625, -4.8345947265625, -4.503173828125, -4.1717529296875, -3.84033203125, -3.5089111328125, -3.177490234375, -2.8460693359375, -2.5146484375, -2.1832275390625, -1.851806640625, -1.5203857421875, -1.18896484375, -0.8575439453125, -0.526123046875, -0.1947021484375, 0.13671875, 0.4681396484375, 0.799560546875, 1.1309814453125, 1.46240234375, 1.7938232421875, 2.125244140625, 2.4566650390625, 2.7880859375, 3.1195068359375, 3.450927734375, 3.7823486328125, 4.11376953125, 4.4451904296875, 4.776611328125, 5.1080322265625, 5.439453125, 5.7708740234375, 6.102294921875, 6.4337158203125, 6.76513671875, 7.0965576171875, 7.427978515625, 7.7593994140625, 8.0908203125, 8.4222412109375, 8.753662109375, 9.0850830078125, 9.41650390625, 9.7479248046875, 10.079345703125, 10.4107666015625, 10.7421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 3.0, 6.0, 6.0, 4.0, 7.0, 7.0, 8.0, 15.0, 13.0, 19.0, 17.0, 22.0, 24.0, 29.0, 28.0, 37.0, 37.0, 34.0, 40.0, 37.0, 48.0, 36.0, 50.0, 43.0, 45.0, 47.0, 37.0, 36.0, 39.0, 36.0, 34.0, 22.0, 25.0, 23.0, 15.0, 14.0, 11.0, 12.0, 7.0, 10.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0], "bins": [-8.859375, -8.61773681640625, -8.3760986328125, -8.13446044921875, -7.892822265625, -7.65118408203125, -7.4095458984375, -7.16790771484375, -6.92626953125, -6.68463134765625, -6.4429931640625, -6.20135498046875, -5.959716796875, -5.71807861328125, -5.4764404296875, -5.23480224609375, -4.9931640625, -4.75152587890625, -4.5098876953125, -4.26824951171875, -4.026611328125, -3.78497314453125, -3.5433349609375, -3.30169677734375, -3.06005859375, -2.81842041015625, -2.5767822265625, -2.33514404296875, -2.093505859375, -1.85186767578125, -1.6102294921875, -1.36859130859375, -1.126953125, -0.88531494140625, -0.6436767578125, -0.40203857421875, -0.160400390625, 0.08123779296875, 0.3228759765625, 0.56451416015625, 0.80615234375, 1.04779052734375, 1.2894287109375, 1.53106689453125, 1.772705078125, 2.01434326171875, 2.2559814453125, 2.49761962890625, 2.7392578125, 2.98089599609375, 3.2225341796875, 3.46417236328125, 3.705810546875, 3.94744873046875, 4.1890869140625, 4.43072509765625, 4.67236328125, 4.91400146484375, 5.1556396484375, 5.39727783203125, 5.638916015625, 5.88055419921875, 6.1221923828125, 6.36383056640625, 6.60546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 8.0, 8.0, 13.0, 15.0, 22.0, 30.0, 40.0, 65.0, 74.0, 130.0, 162.0, 271.0, 353.0, 538.0, 768.0, 1228.0, 1860.0, 2964.0, 4775.0, 7600.0, 13111.0, 24461.0, 84887.0, 684552.0, 152668.0, 29915.0, 14909.0, 8509.0, 5233.0, 3284.0, 2088.0, 1333.0, 858.0, 593.0, 396.0, 261.0, 175.0, 96.0, 89.0, 57.0, 38.0, 35.0, 17.0, 13.0, 10.0, 13.0, 8.0, 6.0, 4.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.158203125, -2.092041015625, -2.02587890625, -1.959716796875, -1.8935546875, -1.827392578125, -1.76123046875, -1.695068359375, -1.62890625, -1.562744140625, -1.49658203125, -1.430419921875, -1.3642578125, -1.298095703125, -1.23193359375, -1.165771484375, -1.099609375, -1.033447265625, -0.96728515625, -0.901123046875, -0.8349609375, -0.768798828125, -0.70263671875, -0.636474609375, -0.5703125, -0.504150390625, -0.43798828125, -0.371826171875, -0.3056640625, -0.239501953125, -0.17333984375, -0.107177734375, -0.041015625, 0.025146484375, 0.09130859375, 0.157470703125, 0.2236328125, 0.289794921875, 0.35595703125, 0.422119140625, 0.48828125, 0.554443359375, 0.62060546875, 0.686767578125, 0.7529296875, 0.819091796875, 0.88525390625, 0.951416015625, 1.017578125, 1.083740234375, 1.14990234375, 1.216064453125, 1.2822265625, 1.348388671875, 1.41455078125, 1.480712890625, 1.546875, 1.613037109375, 1.67919921875, 1.745361328125, 1.8115234375, 1.877685546875, 1.94384765625, 2.010009765625, 2.076171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 12.0, 11.0, 6.0, 12.0, 18.0, 20.0, 31.0, 40.0, 36.0, 40.0, 51.0, 52.0, 59.0, 81.0, 76.0, 64.0, 59.0, 61.0, 64.0, 31.0, 39.0, 28.0, 26.0, 25.0, 11.0, 12.0, 14.0, 6.0, 7.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009007453918457031, -0.0008748695254325867, -0.0008489936590194702, -0.0008231177926063538, -0.0007972419261932373, -0.0007713660597801208, -0.0007454901933670044, -0.0007196143269538879, -0.0006937384605407715, -0.000667862594127655, -0.0006419867277145386, -0.0006161108613014221, -0.0005902349948883057, -0.0005643591284751892, -0.0005384832620620728, -0.0005126073956489563, -0.00048673152923583984, -0.0004608556628227234, -0.00043497979640960693, -0.0004091039299964905, -0.000383228063583374, -0.00035735219717025757, -0.0003314763307571411, -0.00030560046434402466, -0.0002797245979309082, -0.00025384873151779175, -0.0002279728651046753, -0.00020209699869155884, -0.00017622113227844238, -0.00015034526586532593, -0.00012446939945220947, -9.859353303909302e-05, -7.271766662597656e-05, -4.684180021286011e-05, -2.0965933799743652e-05, 4.909932613372803e-06, 3.078579902648926e-05, 5.666166543960571e-05, 8.253753185272217e-05, 0.00010841339826583862, 0.00013428926467895508, 0.00016016513109207153, 0.000186040997505188, 0.00021191686391830444, 0.0002377927303314209, 0.00026366859674453735, 0.0002895444631576538, 0.00031542032957077026, 0.0003412961959838867, 0.0003671720623970032, 0.00039304792881011963, 0.0004189237952232361, 0.00044479966163635254, 0.000470675528049469, 0.0004965513944625854, 0.0005224272608757019, 0.0005483031272888184, 0.0005741789937019348, 0.0006000548601150513, 0.0006259307265281677, 0.0006518065929412842, 0.0006776824593544006, 0.0007035583257675171, 0.0007294341921806335, 0.00075531005859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 8.0, 13.0, 17.0, 30.0, 30.0, 57.0, 96.0, 116.0, 170.0, 250.0, 334.0, 486.0, 675.0, 1000.0, 1544.0, 2236.0, 3363.0, 5232.0, 8053.0, 12926.0, 21165.0, 34913.0, 59114.0, 98263.0, 153537.0, 196313.0, 167180.0, 110732.0, 66578.0, 39755.0, 23602.0, 14528.0, 9061.0, 5781.0, 3603.0, 2536.0, 1735.0, 1120.0, 751.0, 518.0, 344.0, 234.0, 188.0, 122.0, 72.0, 53.0, 43.0, 26.0, 16.0, 18.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.828125, -0.8019332885742188, -0.7757415771484375, -0.7495498657226562, -0.723358154296875, -0.6971664428710938, -0.6709747314453125, -0.6447830200195312, -0.61859130859375, -0.5923995971679688, -0.5662078857421875, -0.5400161743164062, -0.513824462890625, -0.48763275146484375, -0.4614410400390625, -0.43524932861328125, -0.4090576171875, -0.38286590576171875, -0.3566741943359375, -0.33048248291015625, -0.304290771484375, -0.27809906005859375, -0.2519073486328125, -0.22571563720703125, -0.19952392578125, -0.17333221435546875, -0.1471405029296875, -0.12094879150390625, -0.094757080078125, -0.06856536865234375, -0.0423736572265625, -0.01618194580078125, 0.010009765625, 0.03620147705078125, 0.0623931884765625, 0.08858489990234375, 0.114776611328125, 0.14096832275390625, 0.1671600341796875, 0.19335174560546875, 0.21954345703125, 0.24573516845703125, 0.2719268798828125, 0.29811859130859375, 0.324310302734375, 0.35050201416015625, 0.3766937255859375, 0.40288543701171875, 0.4290771484375, 0.45526885986328125, 0.4814605712890625, 0.5076522827148438, 0.533843994140625, 0.5600357055664062, 0.5862274169921875, 0.6124191284179688, 0.63861083984375, 0.6648025512695312, 0.6909942626953125, 0.7171859741210938, 0.743377685546875, 0.7695693969726562, 0.7957611083984375, 0.8219528198242188, 0.84814453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 2.0, 3.0, 9.0, 10.0, 16.0, 15.0, 16.0, 20.0, 24.0, 25.0, 24.0, 34.0, 38.0, 53.0, 41.0, 46.0, 52.0, 56.0, 63.0, 59.0, 51.0, 40.0, 40.0, 41.0, 39.0, 25.0, 24.0, 16.0, 19.0, 16.0, 17.0, 12.0, 12.0, 8.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.279296875, -0.2698211669921875, -0.260345458984375, -0.2508697509765625, -0.24139404296875, -0.2319183349609375, -0.222442626953125, -0.2129669189453125, -0.2034912109375, -0.1940155029296875, -0.184539794921875, -0.1750640869140625, -0.16558837890625, -0.1561126708984375, -0.146636962890625, -0.1371612548828125, -0.127685546875, -0.1182098388671875, -0.108734130859375, -0.0992584228515625, -0.08978271484375, -0.0803070068359375, -0.070831298828125, -0.0613555908203125, -0.0518798828125, -0.0424041748046875, -0.032928466796875, -0.0234527587890625, -0.01397705078125, -0.0045013427734375, 0.004974365234375, 0.0144500732421875, 0.02392578125, 0.0334014892578125, 0.042877197265625, 0.0523529052734375, 0.06182861328125, 0.0713043212890625, 0.080780029296875, 0.0902557373046875, 0.0997314453125, 0.1092071533203125, 0.118682861328125, 0.1281585693359375, 0.13763427734375, 0.1471099853515625, 0.156585693359375, 0.1660614013671875, 0.175537109375, 0.1850128173828125, 0.194488525390625, 0.2039642333984375, 0.21343994140625, 0.2229156494140625, 0.232391357421875, 0.2418670654296875, 0.2513427734375, 0.2608184814453125, 0.270294189453125, 0.2797698974609375, 0.28924560546875, 0.2987213134765625, 0.308197021484375, 0.3176727294921875, 0.3271484375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 1.0, 6.0, 9.0, 8.0, 6.0, 14.0, 10.0, 18.0, 17.0, 23.0, 16.0, 22.0, 31.0, 35.0, 46.0, 28.0, 40.0, 50.0, 41.0, 49.0, 50.0, 34.0, 47.0, 42.0, 49.0, 38.0, 39.0, 25.0, 19.0, 28.0, 27.0, 21.0, 15.0, 11.0, 16.0, 19.0, 9.0, 11.0, 7.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.390498638153076, -5.211665630340576, -5.032832145690918, -4.853999137878418, -4.675166130065918, -4.496333122253418, -4.31749963760376, -4.13866662979126, -3.9598333835601807, -3.7810001373291016, -3.6021671295166016, -3.4233338832855225, -3.2445006370544434, -3.0656676292419434, -2.8868343830108643, -2.708001136779785, -2.529168128967285, -2.350334882736206, -2.171501874923706, -1.992668628692627, -1.8138355016708374, -1.6350023746490479, -1.4561691284179688, -1.2773360013961792, -1.0985028743743896, -0.9196697473526001, -0.7408365607261658, -0.5620033740997314, -0.3831702470779419, -0.20433712005615234, -0.025503873825073242, 0.1533292531967163, 0.33216285705566406, 0.5109959840774536, 0.6898291707038879, 0.8686623573303223, 1.0474954843521118, 1.2263286113739014, 1.4051618576049805, 1.58399498462677, 1.7628281116485596, 1.9416612386703491, 2.1204943656921387, 2.2993276119232178, 2.478160858154297, 2.656993865966797, 2.835827112197876, 3.014660358428955, 3.193493366241455, 3.372326612472534, 3.551159620285034, 3.7299928665161133, 3.9088258743286133, 4.087658882141113, 4.2664923667907715, 4.4453253746032715, 4.62415885925293, 4.80299186706543, 4.981825351715088, 5.160658359527588, 5.339491367340088, 5.518324851989746, 5.697157859802246, 5.875990867614746, 6.054823875427246]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 4.0, 11.0, 6.0, 9.0, 6.0, 18.0, 12.0, 13.0, 17.0, 15.0, 21.0, 19.0, 28.0, 29.0, 25.0, 27.0, 31.0, 32.0, 40.0, 49.0, 34.0, 32.0, 31.0, 49.0, 31.0, 37.0, 37.0, 39.0, 26.0, 36.0, 29.0, 24.0, 32.0, 26.0, 18.0, 13.0, 16.0, 12.0, 11.0, 11.0, 9.0, 7.0, 7.0, 3.0, 5.0, 4.0, 4.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-5.5370306968688965, -5.365978717803955, -5.194926738739014, -5.023874759674072, -4.852822780609131, -4.681770324707031, -4.51071834564209, -4.339666366577148, -4.168614387512207, -3.9975624084472656, -3.826510429382324, -3.655458450317383, -3.4844062328338623, -3.313354253768921, -3.1423022747039795, -2.971250057220459, -2.8001983165740967, -2.6291463375091553, -2.458094358444214, -2.2870421409606934, -2.115990161895752, -1.9449381828308105, -1.7738862037658691, -1.6028341054916382, -1.4317821264266968, -1.2607301473617554, -1.0896780490875244, -0.918626070022583, -0.7475740313529968, -0.5765219926834106, -0.40547001361846924, -0.23441791534423828, -0.06336593627929688, 0.10768608748912811, 0.2787381112575531, 0.4497901201248169, 0.6208421587944031, 0.7918941974639893, 0.9629461765289307, 1.1339982748031616, 1.305050253868103, 1.4761022329330444, 1.6471543312072754, 1.8182063102722168, 1.9892582893371582, 2.1603102684020996, 2.331362247467041, 2.5024144649505615, 2.673466444015503, 2.8445184230804443, 3.0155704021453857, 3.1866226196289062, 3.3576745986938477, 3.528726577758789, 3.6997785568237305, 3.870830535888672, 4.041882514953613, 4.212934494018555, 4.383986473083496, 4.5550384521484375, 4.726090431213379, 4.89714241027832, 5.068194389343262, 5.239246845245361, 5.410298824310303]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 4.0, 7.0, 13.0, 11.0, 32.0, 60.0, 74.0, 130.0, 192.0, 296.0, 500.0, 744.0, 1217.0, 1920.0, 2919.0, 4423.0, 6552.0, 9526.0, 14121.0, 20152.0, 28066.0, 38918.0, 51343.0, 66981.0, 81471.0, 93844.0, 100509.0, 101106.0, 93554.0, 81040.0, 66558.0, 51811.0, 38971.0, 28415.0, 20328.0, 13919.0, 9775.0, 6495.0, 4463.0, 2811.0, 1926.0, 1215.0, 757.0, 501.0, 311.0, 218.0, 139.0, 91.0, 54.0, 39.0, 21.0, 6.0, 8.0, 7.0, 0.0, 0.0, 2.0], "bins": [-3.75, -3.63970947265625, -3.5294189453125, -3.41912841796875, -3.308837890625, -3.19854736328125, -3.0882568359375, -2.97796630859375, -2.86767578125, -2.75738525390625, -2.6470947265625, -2.53680419921875, -2.426513671875, -2.31622314453125, -2.2059326171875, -2.09564208984375, -1.9853515625, -1.87506103515625, -1.7647705078125, -1.65447998046875, -1.544189453125, -1.43389892578125, -1.3236083984375, -1.21331787109375, -1.10302734375, -0.99273681640625, -0.8824462890625, -0.77215576171875, -0.661865234375, -0.55157470703125, -0.4412841796875, -0.33099365234375, -0.220703125, -0.11041259765625, -0.0001220703125, 0.11016845703125, 0.220458984375, 0.33074951171875, 0.4410400390625, 0.55133056640625, 0.66162109375, 0.77191162109375, 0.8822021484375, 0.99249267578125, 1.102783203125, 1.21307373046875, 1.3233642578125, 1.43365478515625, 1.5439453125, 1.65423583984375, 1.7645263671875, 1.87481689453125, 1.985107421875, 2.09539794921875, 2.2056884765625, 2.31597900390625, 2.42626953125, 2.53656005859375, 2.6468505859375, 2.75714111328125, 2.867431640625, 2.97772216796875, 3.0880126953125, 3.19830322265625, 3.30859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 10.0, 8.0, 10.0, 10.0, 12.0, 18.0, 16.0, 15.0, 21.0, 25.0, 24.0, 26.0, 24.0, 41.0, 50.0, 39.0, 39.0, 35.0, 40.0, 49.0, 47.0, 32.0, 39.0, 39.0, 36.0, 37.0, 37.0, 27.0, 29.0, 21.0, 22.0, 15.0, 19.0, 14.0, 14.0, 13.0, 7.0, 6.0, 10.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.02734375, -5.84814453125, -5.6689453125, -5.48974609375, -5.310546875, -5.13134765625, -4.9521484375, -4.77294921875, -4.59375, -4.41455078125, -4.2353515625, -4.05615234375, -3.876953125, -3.69775390625, -3.5185546875, -3.33935546875, -3.16015625, -2.98095703125, -2.8017578125, -2.62255859375, -2.443359375, -2.26416015625, -2.0849609375, -1.90576171875, -1.7265625, -1.54736328125, -1.3681640625, -1.18896484375, -1.009765625, -0.83056640625, -0.6513671875, -0.47216796875, -0.29296875, -0.11376953125, 0.0654296875, 0.24462890625, 0.423828125, 0.60302734375, 0.7822265625, 0.96142578125, 1.140625, 1.31982421875, 1.4990234375, 1.67822265625, 1.857421875, 2.03662109375, 2.2158203125, 2.39501953125, 2.57421875, 2.75341796875, 2.9326171875, 3.11181640625, 3.291015625, 3.47021484375, 3.6494140625, 3.82861328125, 4.0078125, 4.18701171875, 4.3662109375, 4.54541015625, 4.724609375, 4.90380859375, 5.0830078125, 5.26220703125, 5.44140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 5.0, 1.0, 4.0, 12.0, 18.0, 23.0, 32.0, 49.0, 84.0, 111.0, 184.0, 274.0, 409.0, 675.0, 1037.0, 1695.0, 2807.0, 4710.0, 7658.0, 12423.0, 20764.0, 34361.0, 53709.0, 80693.0, 112147.0, 136994.0, 145445.0, 131827.0, 103444.0, 72840.0, 47574.0, 30128.0, 18239.0, 10934.0, 6772.0, 3938.0, 2423.0, 1461.0, 965.0, 574.0, 402.0, 228.0, 181.0, 102.0, 76.0, 31.0, 33.0, 28.0, 11.0, 11.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33203125, -5.15045166015625, -4.9688720703125, -4.78729248046875, -4.605712890625, -4.42413330078125, -4.2425537109375, -4.06097412109375, -3.87939453125, -3.69781494140625, -3.5162353515625, -3.33465576171875, -3.153076171875, -2.97149658203125, -2.7899169921875, -2.60833740234375, -2.4267578125, -2.24517822265625, -2.0635986328125, -1.88201904296875, -1.700439453125, -1.51885986328125, -1.3372802734375, -1.15570068359375, -0.97412109375, -0.79254150390625, -0.6109619140625, -0.42938232421875, -0.247802734375, -0.06622314453125, 0.1153564453125, 0.29693603515625, 0.478515625, 0.66009521484375, 0.8416748046875, 1.02325439453125, 1.204833984375, 1.38641357421875, 1.5679931640625, 1.74957275390625, 1.93115234375, 2.11273193359375, 2.2943115234375, 2.47589111328125, 2.657470703125, 2.83905029296875, 3.0206298828125, 3.20220947265625, 3.3837890625, 3.56536865234375, 3.7469482421875, 3.92852783203125, 4.110107421875, 4.29168701171875, 4.4732666015625, 4.65484619140625, 4.83642578125, 5.01800537109375, 5.1995849609375, 5.38116455078125, 5.562744140625, 5.74432373046875, 5.9259033203125, 6.10748291015625, 6.2890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 10.0, 13.0, 8.0, 11.0, 15.0, 16.0, 19.0, 22.0, 24.0, 29.0, 19.0, 39.0, 41.0, 45.0, 61.0, 44.0, 34.0, 48.0, 44.0, 43.0, 33.0, 36.0, 42.0, 45.0, 34.0, 27.0, 25.0, 29.0, 27.0, 13.0, 21.0, 18.0, 18.0, 16.0, 7.0, 7.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.46484375, -4.338653564453125, -4.21246337890625, -4.086273193359375, -3.9600830078125, -3.833892822265625, -3.70770263671875, -3.581512451171875, -3.455322265625, -3.329132080078125, -3.20294189453125, -3.076751708984375, -2.9505615234375, -2.824371337890625, -2.69818115234375, -2.571990966796875, -2.44580078125, -2.319610595703125, -2.19342041015625, -2.067230224609375, -1.9410400390625, -1.814849853515625, -1.68865966796875, -1.562469482421875, -1.436279296875, -1.310089111328125, -1.18389892578125, -1.057708740234375, -0.9315185546875, -0.805328369140625, -0.67913818359375, -0.552947998046875, -0.4267578125, -0.300567626953125, -0.17437744140625, -0.048187255859375, 0.0780029296875, 0.204193115234375, 0.33038330078125, 0.456573486328125, 0.582763671875, 0.708953857421875, 0.83514404296875, 0.961334228515625, 1.0875244140625, 1.213714599609375, 1.33990478515625, 1.466094970703125, 1.59228515625, 1.718475341796875, 1.84466552734375, 1.970855712890625, 2.0970458984375, 2.223236083984375, 2.34942626953125, 2.475616455078125, 2.601806640625, 2.727996826171875, 2.85418701171875, 2.980377197265625, 3.1065673828125, 3.232757568359375, 3.35894775390625, 3.485137939453125, 3.611328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 3.0, 11.0, 19.0, 31.0, 51.0, 71.0, 113.0, 168.0, 279.0, 446.0, 730.0, 1047.0, 1837.0, 3040.0, 4757.0, 8083.0, 13437.0, 22389.0, 36240.0, 57717.0, 86163.0, 118968.0, 144552.0, 147993.0, 128976.0, 97175.0, 66253.0, 42205.0, 26038.0, 15783.0, 9225.0, 5620.0, 3495.0, 2142.0, 1250.0, 826.0, 517.0, 324.0, 218.0, 130.0, 90.0, 62.0, 27.0, 29.0, 12.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9423828125, -1.8838043212890625, -1.825225830078125, -1.7666473388671875, -1.70806884765625, -1.6494903564453125, -1.590911865234375, -1.5323333740234375, -1.4737548828125, -1.4151763916015625, -1.356597900390625, -1.2980194091796875, -1.23944091796875, -1.1808624267578125, -1.122283935546875, -1.0637054443359375, -1.005126953125, -0.9465484619140625, -0.887969970703125, -0.8293914794921875, -0.77081298828125, -0.7122344970703125, -0.653656005859375, -0.5950775146484375, -0.5364990234375, -0.4779205322265625, -0.419342041015625, -0.3607635498046875, -0.30218505859375, -0.2436065673828125, -0.185028076171875, -0.1264495849609375, -0.06787109375, -0.0092926025390625, 0.049285888671875, 0.1078643798828125, 0.16644287109375, 0.2250213623046875, 0.283599853515625, 0.3421783447265625, 0.4007568359375, 0.4593353271484375, 0.517913818359375, 0.5764923095703125, 0.63507080078125, 0.6936492919921875, 0.752227783203125, 0.8108062744140625, 0.869384765625, 0.9279632568359375, 0.986541748046875, 1.0451202392578125, 1.10369873046875, 1.1622772216796875, 1.220855712890625, 1.2794342041015625, 1.3380126953125, 1.3965911865234375, 1.455169677734375, 1.5137481689453125, 1.57232666015625, 1.6309051513671875, 1.689483642578125, 1.7480621337890625, 1.806640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 3.0, 9.0, 11.0, 19.0, 13.0, 22.0, 25.0, 34.0, 39.0, 49.0, 41.0, 48.0, 46.0, 55.0, 65.0, 57.0, 61.0, 57.0, 50.0, 40.0, 43.0, 35.0, 25.0, 29.0, 23.0, 13.0, 20.0, 8.0, 9.0, 8.0, 7.0, 10.0, 2.0, 4.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001964569091796875, -0.00018958933651447296, -0.00018272176384925842, -0.00017585419118404388, -0.00016898661851882935, -0.0001621190458536148, -0.00015525147318840027, -0.00014838390052318573, -0.0001415163278579712, -0.00013464875519275665, -0.00012778118252754211, -0.00012091360986232758, -0.00011404603719711304, -0.0001071784645318985, -0.00010031089186668396, -9.344331920146942e-05, -8.657574653625488e-05, -7.970817387104034e-05, -7.28406012058258e-05, -6.597302854061127e-05, -5.910545587539673e-05, -5.223788321018219e-05, -4.537031054496765e-05, -3.850273787975311e-05, -3.1635165214538574e-05, -2.4767592549324036e-05, -1.7900019884109497e-05, -1.1032447218894958e-05, -4.16487455368042e-06, 2.7026981115341187e-06, 9.570270776748657e-06, 1.6437843441963196e-05, 2.3305416107177734e-05, 3.0172988772392273e-05, 3.704056143760681e-05, 4.390813410282135e-05, 5.077570676803589e-05, 5.764327943325043e-05, 6.451085209846497e-05, 7.13784247636795e-05, 7.824599742889404e-05, 8.511357009410858e-05, 9.198114275932312e-05, 9.884871542453766e-05, 0.0001057162880897522, 0.00011258386075496674, 0.00011945143342018127, 0.0001263190060853958, 0.00013318657875061035, 0.0001400541514158249, 0.00014692172408103943, 0.00015378929674625397, 0.0001606568694114685, 0.00016752444207668304, 0.00017439201474189758, 0.00018125958740711212, 0.00018812716007232666, 0.0001949947327375412, 0.00020186230540275574, 0.00020872987806797028, 0.00021559745073318481, 0.00022246502339839935, 0.0002293325960636139, 0.00023620016872882843, 0.00024306774139404297]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 8.0, 13.0, 17.0, 23.0, 35.0, 57.0, 81.0, 133.0, 214.0, 303.0, 444.0, 698.0, 1068.0, 1599.0, 2406.0, 3748.0, 5741.0, 8943.0, 14520.0, 22805.0, 35788.0, 55179.0, 82086.0, 112170.0, 137042.0, 142251.0, 126782.0, 98637.0, 69270.0, 45920.0, 29611.0, 18457.0, 11516.0, 7360.0, 4682.0, 3018.0, 1971.0, 1366.0, 891.0, 548.0, 388.0, 282.0, 160.0, 105.0, 75.0, 56.0, 35.0, 24.0, 14.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.884765625, -1.8263702392578125, -1.767974853515625, -1.7095794677734375, -1.65118408203125, -1.5927886962890625, -1.534393310546875, -1.4759979248046875, -1.4176025390625, -1.3592071533203125, -1.300811767578125, -1.2424163818359375, -1.18402099609375, -1.1256256103515625, -1.067230224609375, -1.0088348388671875, -0.950439453125, -0.8920440673828125, -0.833648681640625, -0.7752532958984375, -0.71685791015625, -0.6584625244140625, -0.600067138671875, -0.5416717529296875, -0.4832763671875, -0.4248809814453125, -0.366485595703125, -0.3080902099609375, -0.24969482421875, -0.1912994384765625, -0.132904052734375, -0.0745086669921875, -0.01611328125, 0.0422821044921875, 0.100677490234375, 0.1590728759765625, 0.21746826171875, 0.2758636474609375, 0.334259033203125, 0.3926544189453125, 0.4510498046875, 0.5094451904296875, 0.567840576171875, 0.6262359619140625, 0.68463134765625, 0.7430267333984375, 0.801422119140625, 0.8598175048828125, 0.918212890625, 0.9766082763671875, 1.035003662109375, 1.0933990478515625, 1.15179443359375, 1.2101898193359375, 1.268585205078125, 1.3269805908203125, 1.3853759765625, 1.4437713623046875, 1.502166748046875, 1.5605621337890625, 1.61895751953125, 1.6773529052734375, 1.735748291015625, 1.7941436767578125, 1.8525390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 8.0, 3.0, 8.0, 10.0, 9.0, 13.0, 14.0, 14.0, 17.0, 23.0, 32.0, 28.0, 40.0, 46.0, 40.0, 52.0, 51.0, 63.0, 57.0, 56.0, 62.0, 56.0, 42.0, 35.0, 37.0, 40.0, 27.0, 18.0, 17.0, 18.0, 17.0, 9.0, 9.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7265625, -0.7033462524414062, -0.6801300048828125, -0.6569137573242188, -0.633697509765625, -0.6104812622070312, -0.5872650146484375, -0.5640487670898438, -0.54083251953125, -0.5176162719726562, -0.4944000244140625, -0.47118377685546875, -0.447967529296875, -0.42475128173828125, -0.4015350341796875, -0.37831878662109375, -0.3551025390625, -0.33188629150390625, -0.3086700439453125, -0.28545379638671875, -0.262237548828125, -0.23902130126953125, -0.2158050537109375, -0.19258880615234375, -0.16937255859375, -0.14615631103515625, -0.1229400634765625, -0.09972381591796875, -0.076507568359375, -0.05329132080078125, -0.0300750732421875, -0.00685882568359375, 0.016357421875, 0.03957366943359375, 0.0627899169921875, 0.08600616455078125, 0.109222412109375, 0.13243865966796875, 0.1556549072265625, 0.17887115478515625, 0.20208740234375, 0.22530364990234375, 0.2485198974609375, 0.27173614501953125, 0.294952392578125, 0.31816864013671875, 0.3413848876953125, 0.36460113525390625, 0.3878173828125, 0.41103363037109375, 0.4342498779296875, 0.45746612548828125, 0.480682373046875, 0.5038986206054688, 0.5271148681640625, 0.5503311157226562, 0.57354736328125, 0.5967636108398438, 0.6199798583984375, 0.6431961059570312, 0.666412353515625, 0.6896286010742188, 0.7128448486328125, 0.7360610961914062, 0.75927734375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 6.0, 5.0, 10.0, 12.0, 12.0, 12.0, 15.0, 14.0, 13.0, 33.0, 28.0, 25.0, 29.0, 25.0, 36.0, 25.0, 46.0, 35.0, 36.0, 51.0, 48.0, 52.0, 45.0, 35.0, 39.0, 42.0, 37.0, 34.0, 18.0, 30.0, 17.0, 19.0, 14.0, 16.0, 15.0, 10.0, 11.0, 11.0, 11.0, 5.0, 8.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.7879319190979, -4.626857280731201, -4.46578311920166, -4.304708480834961, -4.14363431930542, -3.9825596809387207, -3.8214852809906006, -3.6604108810424805, -3.4993364810943604, -3.3382620811462402, -3.17718768119812, -3.01611328125, -2.855038642883301, -2.6939644813537598, -2.5328898429870605, -2.3718154430389404, -2.2107410430908203, -2.0496666431427, -1.88859224319458, -1.7275177240371704, -1.5664433240890503, -1.4053689241409302, -1.2442944049835205, -1.0832200050354004, -0.9221456050872803, -0.7610712051391602, -0.5999967455863953, -0.43892231583595276, -0.27784788608551025, -0.11677348613739014, 0.044300973415374756, 0.20537543296813965, 0.36644935607910156, 0.5275237560272217, 0.6885982155799866, 0.8496726751327515, 1.0107470750808716, 1.1718214750289917, 1.3328959941864014, 1.4939703941345215, 1.6550447940826416, 1.8161191940307617, 1.9771935939788818, 2.138267993927002, 2.299342632293701, 2.460416793823242, 2.6214914321899414, 2.7825658321380615, 2.9436402320861816, 3.1047146320343018, 3.265789031982422, 3.426863431930542, 3.587937831878662, 3.7490124702453613, 3.9100868701934814, 4.071161270141602, 4.232235908508301, 4.393310546875, 4.554384708404541, 4.71545934677124, 4.876533508300781, 5.0376081466674805, 5.1986823081970215, 5.359756946563721, 5.520831108093262]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 14.0, 11.0, 18.0, 14.0, 17.0, 34.0, 24.0, 30.0, 29.0, 24.0, 34.0, 31.0, 47.0, 46.0, 30.0, 36.0, 43.0, 44.0, 26.0, 45.0, 43.0, 34.0, 36.0, 43.0, 35.0, 41.0, 30.0, 25.0, 11.0, 16.0, 16.0, 11.0, 14.0, 7.0, 5.0, 7.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.8438401222229, -5.6544904708862305, -5.465141296386719, -5.275791645050049, -5.086442470550537, -4.897092819213867, -4.7077436447143555, -4.5183939933776855, -4.329044342041016, -4.139694690704346, -3.950345516204834, -3.760995864868164, -3.5716466903686523, -3.3822970390319824, -3.1929476261138916, -3.003598213195801, -2.814249038696289, -2.6248996257781982, -2.4355502128601074, -2.2462005615234375, -2.056851387023926, -1.8675018548965454, -1.678152322769165, -1.4888029098510742, -1.2994534969329834, -1.1101040840148926, -0.920754611492157, -0.7314051389694214, -0.5420557260513306, -0.35270631313323975, -0.16335678100585938, 0.025992631912231445, 0.21534204483032227, 0.4046914875507355, 0.5940409302711487, 0.7833904027938843, 0.9727398157119751, 1.162089228630066, 1.3514387607574463, 1.540788173675537, 1.730137586593628, 1.9194869995117188, 2.1088364124298096, 2.2981858253479004, 2.4875354766845703, 2.676884651184082, 2.866234302520752, 3.0555837154388428, 3.2449331283569336, 3.4342825412750244, 3.6236319541931152, 3.812981605529785, 4.002330780029297, 4.191680431365967, 4.381030082702637, 4.570379257202148, 4.75972843170166, 4.94907808303833, 5.138427257537842, 5.327776908874512, 5.517126083374023, 5.706475734710693, 5.895825386047363, 6.085174560546875, 6.274524211883545]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 14.0, 26.0, 34.0, 51.0, 67.0, 131.0, 183.0, 337.0, 568.0, 925.0, 1535.0, 2626.0, 4342.0, 7468.0, 13289.0, 23485.0, 42756.0, 80043.0, 151001.0, 281569.0, 486587.0, 705262.0, 781723.0, 655575.0, 429659.0, 242629.0, 128408.0, 68034.0, 37196.0, 20566.0, 11639.0, 6656.0, 3846.0, 2347.0, 1356.0, 876.0, 542.0, 331.0, 221.0, 133.0, 73.0, 49.0, 35.0, 34.0, 23.0, 11.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.30859375, -4.16192626953125, -4.0152587890625, -3.86859130859375, -3.721923828125, -3.57525634765625, -3.4285888671875, -3.28192138671875, -3.13525390625, -2.98858642578125, -2.8419189453125, -2.69525146484375, -2.548583984375, -2.40191650390625, -2.2552490234375, -2.10858154296875, -1.9619140625, -1.81524658203125, -1.6685791015625, -1.52191162109375, -1.375244140625, -1.22857666015625, -1.0819091796875, -0.93524169921875, -0.78857421875, -0.64190673828125, -0.4952392578125, -0.34857177734375, -0.201904296875, -0.05523681640625, 0.0914306640625, 0.23809814453125, 0.384765625, 0.53143310546875, 0.6781005859375, 0.82476806640625, 0.971435546875, 1.11810302734375, 1.2647705078125, 1.41143798828125, 1.55810546875, 1.70477294921875, 1.8514404296875, 1.99810791015625, 2.144775390625, 2.29144287109375, 2.4381103515625, 2.58477783203125, 2.7314453125, 2.87811279296875, 3.0247802734375, 3.17144775390625, 3.318115234375, 3.46478271484375, 3.6114501953125, 3.75811767578125, 3.90478515625, 4.05145263671875, 4.1981201171875, 4.34478759765625, 4.491455078125, 4.63812255859375, 4.7847900390625, 4.93145751953125, 5.078125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 8.0, 7.0, 8.0, 6.0, 10.0, 10.0, 13.0, 18.0, 24.0, 15.0, 17.0, 23.0, 20.0, 37.0, 40.0, 33.0, 40.0, 37.0, 38.0, 31.0, 58.0, 37.0, 38.0, 49.0, 30.0, 32.0, 44.0, 30.0, 32.0, 34.0, 33.0, 26.0, 32.0, 18.0, 19.0, 15.0, 7.0, 13.0, 6.0, 5.0, 1.0, 3.0, 8.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.9140625, -4.75726318359375, -4.6004638671875, -4.44366455078125, -4.286865234375, -4.13006591796875, -3.9732666015625, -3.81646728515625, -3.65966796875, -3.50286865234375, -3.3460693359375, -3.18927001953125, -3.032470703125, -2.87567138671875, -2.7188720703125, -2.56207275390625, -2.4052734375, -2.24847412109375, -2.0916748046875, -1.93487548828125, -1.778076171875, -1.62127685546875, -1.4644775390625, -1.30767822265625, -1.15087890625, -0.99407958984375, -0.8372802734375, -0.68048095703125, -0.523681640625, -0.36688232421875, -0.2100830078125, -0.05328369140625, 0.103515625, 0.26031494140625, 0.4171142578125, 0.57391357421875, 0.730712890625, 0.88751220703125, 1.0443115234375, 1.20111083984375, 1.35791015625, 1.51470947265625, 1.6715087890625, 1.82830810546875, 1.985107421875, 2.14190673828125, 2.2987060546875, 2.45550537109375, 2.6123046875, 2.76910400390625, 2.9259033203125, 3.08270263671875, 3.239501953125, 3.39630126953125, 3.5531005859375, 3.70989990234375, 3.86669921875, 4.02349853515625, 4.1802978515625, 4.33709716796875, 4.493896484375, 4.65069580078125, 4.8074951171875, 4.96429443359375, 5.12109375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 13.0, 18.0, 29.0, 44.0, 53.0, 89.0, 152.0, 235.0, 353.0, 552.0, 822.0, 1309.0, 2103.0, 3234.0, 5405.0, 8745.0, 13665.0, 22329.0, 35826.0, 58640.0, 94754.0, 150004.0, 235979.0, 355966.0, 496973.0, 609059.0, 607752.0, 498346.0, 356508.0, 235708.0, 150861.0, 94362.0, 58876.0, 36201.0, 22205.0, 13857.0, 8702.0, 5307.0, 3411.0, 2159.0, 1337.0, 840.0, 531.0, 338.0, 228.0, 136.0, 93.0, 63.0, 47.0, 20.0, 17.0, 8.0, 10.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-4.30859375, -4.16961669921875, -4.0306396484375, -3.89166259765625, -3.752685546875, -3.61370849609375, -3.4747314453125, -3.33575439453125, -3.19677734375, -3.05780029296875, -2.9188232421875, -2.77984619140625, -2.640869140625, -2.50189208984375, -2.3629150390625, -2.22393798828125, -2.0849609375, -1.94598388671875, -1.8070068359375, -1.66802978515625, -1.529052734375, -1.39007568359375, -1.2510986328125, -1.11212158203125, -0.97314453125, -0.83416748046875, -0.6951904296875, -0.55621337890625, -0.417236328125, -0.27825927734375, -0.1392822265625, -0.00030517578125, 0.138671875, 0.27764892578125, 0.4166259765625, 0.55560302734375, 0.694580078125, 0.83355712890625, 0.9725341796875, 1.11151123046875, 1.25048828125, 1.38946533203125, 1.5284423828125, 1.66741943359375, 1.806396484375, 1.94537353515625, 2.0843505859375, 2.22332763671875, 2.3623046875, 2.50128173828125, 2.6402587890625, 2.77923583984375, 2.918212890625, 3.05718994140625, 3.1961669921875, 3.33514404296875, 3.47412109375, 3.61309814453125, 3.7520751953125, 3.89105224609375, 4.030029296875, 4.16900634765625, 4.3079833984375, 4.44696044921875, 4.5859375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 7.0, 19.0, 14.0, 17.0, 26.0, 28.0, 36.0, 34.0, 73.0, 73.0, 81.0, 114.0, 112.0, 166.0, 175.0, 189.0, 205.0, 230.0, 244.0, 251.0, 235.0, 217.0, 236.0, 232.0, 156.0, 162.0, 139.0, 103.0, 110.0, 79.0, 55.0, 55.0, 48.0, 40.0, 35.0, 15.0, 18.0, 12.0, 7.0, 7.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.984527587890625, -1.92022705078125, -1.855926513671875, -1.7916259765625, -1.727325439453125, -1.66302490234375, -1.598724365234375, -1.534423828125, -1.470123291015625, -1.40582275390625, -1.341522216796875, -1.2772216796875, -1.212921142578125, -1.14862060546875, -1.084320068359375, -1.02001953125, -0.955718994140625, -0.89141845703125, -0.827117919921875, -0.7628173828125, -0.698516845703125, -0.63421630859375, -0.569915771484375, -0.505615234375, -0.441314697265625, -0.37701416015625, -0.312713623046875, -0.2484130859375, -0.184112548828125, -0.11981201171875, -0.055511474609375, 0.0087890625, 0.073089599609375, 0.13739013671875, 0.201690673828125, 0.2659912109375, 0.330291748046875, 0.39459228515625, 0.458892822265625, 0.523193359375, 0.587493896484375, 0.65179443359375, 0.716094970703125, 0.7803955078125, 0.844696044921875, 0.90899658203125, 0.973297119140625, 1.03759765625, 1.101898193359375, 1.16619873046875, 1.230499267578125, 1.2947998046875, 1.359100341796875, 1.42340087890625, 1.487701416015625, 1.552001953125, 1.616302490234375, 1.68060302734375, 1.744903564453125, 1.8092041015625, 1.873504638671875, 1.93780517578125, 2.002105712890625, 2.06640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 8.0, 1.0, 11.0, 3.0, 10.0, 10.0, 10.0, 10.0, 10.0, 19.0, 21.0, 29.0, 28.0, 21.0, 29.0, 28.0, 34.0, 35.0, 43.0, 34.0, 46.0, 45.0, 35.0, 45.0, 41.0, 34.0, 39.0, 39.0, 34.0, 30.0, 37.0, 11.0, 24.0, 19.0, 21.0, 18.0, 17.0, 19.0, 14.0, 9.0, 3.0, 7.0, 8.0, 5.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.133327484130859, -3.9779529571533203, -3.8225784301757812, -3.6672041416168213, -3.5118296146392822, -3.356455087661743, -3.201080799102783, -3.045706272125244, -2.890331745147705, -2.734957218170166, -2.579582691192627, -2.424208402633667, -2.268833875656128, -2.113459348678589, -1.9580849409103394, -1.8027105331420898, -1.6473360061645508, -1.4919614791870117, -1.3365870714187622, -1.1812126636505127, -1.0258381366729736, -0.8704636693000793, -0.7150892019271851, -0.5597147941589355, -0.4043402671813965, -0.2489657998085022, -0.09359133243560791, 0.06178313493728638, 0.21715760231018066, 0.37253206968307495, 0.5279065370559692, 0.6832809448242188, 0.838655948638916, 0.9940304160118103, 1.1494048833847046, 1.304779291152954, 1.4601538181304932, 1.6155283451080322, 1.7709027528762817, 1.9262771606445312, 2.0816516876220703, 2.2370262145996094, 2.3924007415771484, 2.5477750301361084, 2.7031495571136475, 2.8585240840911865, 3.0138983726501465, 3.1692728996276855, 3.3246474266052246, 3.4800219535827637, 3.6353964805603027, 3.7907707691192627, 3.9461452960968018, 4.101519584655762, 4.256894111633301, 4.41226863861084, 4.567643165588379, 4.723017692565918, 4.878392219543457, 5.033766746520996, 5.189141273498535, 5.344515323638916, 5.499889850616455, 5.655264377593994, 5.810638904571533]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 4.0, 6.0, 7.0, 9.0, 11.0, 14.0, 25.0, 23.0, 21.0, 21.0, 25.0, 20.0, 31.0, 37.0, 35.0, 37.0, 38.0, 45.0, 38.0, 42.0, 32.0, 45.0, 44.0, 33.0, 49.0, 36.0, 36.0, 39.0, 20.0, 24.0, 24.0, 29.0, 22.0, 15.0, 15.0, 10.0, 11.0, 6.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.650145053863525, -5.472300052642822, -5.294454574584961, -5.116609573364258, -4.938764572143555, -4.760919094085693, -4.58307409286499, -4.405228614807129, -4.227383613586426, -4.049538612365723, -3.8716933727264404, -3.693848133087158, -3.516002893447876, -3.3381576538085938, -3.1603126525878906, -2.9824674129486084, -2.8046224117279053, -2.626777172088623, -2.44893217086792, -2.2710869312286377, -2.0932416915893555, -1.9153965711593628, -1.7375514507293701, -1.559706211090088, -1.3818610906600952, -1.2040159702301025, -1.0261707305908203, -0.8483256101608276, -0.6704804301261902, -0.49263525009155273, -0.31479012966156006, -0.13694489002227783, 0.040900230407714844, 0.2187453955411911, 0.39659056067466736, 0.5744357109069824, 0.7522808909416199, 0.9301260709762573, 1.10797119140625, 1.2858164310455322, 1.463661551475525, 1.6415066719055176, 1.8193519115447998, 1.9971970319747925, 2.175042152404785, 2.3528873920440674, 2.5307326316833496, 2.7085776329040527, 2.886422872543335, 3.064268112182617, 3.2421131134033203, 3.4199583530426025, 3.5978035926818848, 3.775648593902588, 3.95349383354187, 4.131339073181152, 4.3091840744018555, 4.487029075622559, 4.66487455368042, 4.842719554901123, 5.020564556121826, 5.1984100341796875, 5.376255035400391, 5.554100036621094, 5.731945514678955]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 9.0, 8.0, 9.0, 22.0, 34.0, 58.0, 84.0, 115.0, 170.0, 280.0, 478.0, 702.0, 1240.0, 1833.0, 3245.0, 5249.0, 8775.0, 14096.0, 22746.0, 36092.0, 55541.0, 80123.0, 108893.0, 131123.0, 138361.0, 127075.0, 101837.0, 74359.0, 50316.0, 32533.0, 20683.0, 12669.0, 7776.0, 4710.0, 2736.0, 1675.0, 1057.0, 641.0, 420.0, 261.0, 190.0, 108.0, 73.0, 55.0, 37.0, 20.0, 10.0, 10.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.9609375, -2.8695068359375, -2.778076171875, -2.6866455078125, -2.59521484375, -2.5037841796875, -2.412353515625, -2.3209228515625, -2.2294921875, -2.1380615234375, -2.046630859375, -1.9552001953125, -1.86376953125, -1.7723388671875, -1.680908203125, -1.5894775390625, -1.498046875, -1.4066162109375, -1.315185546875, -1.2237548828125, -1.13232421875, -1.0408935546875, -0.949462890625, -0.8580322265625, -0.7666015625, -0.6751708984375, -0.583740234375, -0.4923095703125, -0.40087890625, -0.3094482421875, -0.218017578125, -0.1265869140625, -0.03515625, 0.0562744140625, 0.147705078125, 0.2391357421875, 0.33056640625, 0.4219970703125, 0.513427734375, 0.6048583984375, 0.6962890625, 0.7877197265625, 0.879150390625, 0.9705810546875, 1.06201171875, 1.1534423828125, 1.244873046875, 1.3363037109375, 1.427734375, 1.5191650390625, 1.610595703125, 1.7020263671875, 1.79345703125, 1.8848876953125, 1.976318359375, 2.0677490234375, 2.1591796875, 2.2506103515625, 2.342041015625, 2.4334716796875, 2.52490234375, 2.6163330078125, 2.707763671875, 2.7991943359375, 2.890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 8.0, 7.0, 9.0, 18.0, 18.0, 19.0, 27.0, 13.0, 21.0, 34.0, 28.0, 33.0, 31.0, 40.0, 40.0, 27.0, 39.0, 42.0, 48.0, 37.0, 50.0, 43.0, 32.0, 33.0, 38.0, 32.0, 32.0, 27.0, 22.0, 21.0, 37.0, 17.0, 19.0, 7.0, 11.0, 13.0, 3.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.73828125, -5.560791015625, -5.38330078125, -5.205810546875, -5.0283203125, -4.850830078125, -4.67333984375, -4.495849609375, -4.318359375, -4.140869140625, -3.96337890625, -3.785888671875, -3.6083984375, -3.430908203125, -3.25341796875, -3.075927734375, -2.8984375, -2.720947265625, -2.54345703125, -2.365966796875, -2.1884765625, -2.010986328125, -1.83349609375, -1.656005859375, -1.478515625, -1.301025390625, -1.12353515625, -0.946044921875, -0.7685546875, -0.591064453125, -0.41357421875, -0.236083984375, -0.05859375, 0.118896484375, 0.29638671875, 0.473876953125, 0.6513671875, 0.828857421875, 1.00634765625, 1.183837890625, 1.361328125, 1.538818359375, 1.71630859375, 1.893798828125, 2.0712890625, 2.248779296875, 2.42626953125, 2.603759765625, 2.78125, 2.958740234375, 3.13623046875, 3.313720703125, 3.4912109375, 3.668701171875, 3.84619140625, 4.023681640625, 4.201171875, 4.378662109375, 4.55615234375, 4.733642578125, 4.9111328125, 5.088623046875, 5.26611328125, 5.443603515625, 5.62109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 16.0, 15.0, 14.0, 17.0, 24.0, 47.0, 80.0, 116.0, 200.0, 260.0, 514.0, 974.0, 1809.0, 3382.0, 6494.0, 12685.0, 24323.0, 78934.0, 799668.0, 69327.0, 23868.0, 12207.0, 6252.0, 3337.0, 1670.0, 919.0, 512.0, 317.0, 196.0, 119.0, 66.0, 47.0, 33.0, 23.0, 23.0, 13.0, 11.0, 14.0, 9.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.203125, -6.958740234375, -6.71435546875, -6.469970703125, -6.2255859375, -5.981201171875, -5.73681640625, -5.492431640625, -5.248046875, -5.003662109375, -4.75927734375, -4.514892578125, -4.2705078125, -4.026123046875, -3.78173828125, -3.537353515625, -3.29296875, -3.048583984375, -2.80419921875, -2.559814453125, -2.3154296875, -2.071044921875, -1.82666015625, -1.582275390625, -1.337890625, -1.093505859375, -0.84912109375, -0.604736328125, -0.3603515625, -0.115966796875, 0.12841796875, 0.372802734375, 0.6171875, 0.861572265625, 1.10595703125, 1.350341796875, 1.5947265625, 1.839111328125, 2.08349609375, 2.327880859375, 2.572265625, 2.816650390625, 3.06103515625, 3.305419921875, 3.5498046875, 3.794189453125, 4.03857421875, 4.282958984375, 4.52734375, 4.771728515625, 5.01611328125, 5.260498046875, 5.5048828125, 5.749267578125, 5.99365234375, 6.238037109375, 6.482421875, 6.726806640625, 6.97119140625, 7.215576171875, 7.4599609375, 7.704345703125, 7.94873046875, 8.193115234375, 8.4375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 11.0, 15.0, 7.0, 13.0, 17.0, 17.0, 19.0, 19.0, 22.0, 20.0, 26.0, 35.0, 38.0, 36.0, 37.0, 45.0, 35.0, 34.0, 33.0, 40.0, 43.0, 44.0, 32.0, 33.0, 33.0, 31.0, 31.0, 30.0, 28.0, 22.0, 15.0, 14.0, 13.0, 21.0, 26.0, 11.0, 10.0, 8.0, 2.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.05078125, -4.89508056640625, -4.7393798828125, -4.58367919921875, -4.427978515625, -4.27227783203125, -4.1165771484375, -3.96087646484375, -3.80517578125, -3.64947509765625, -3.4937744140625, -3.33807373046875, -3.182373046875, -3.02667236328125, -2.8709716796875, -2.71527099609375, -2.5595703125, -2.40386962890625, -2.2481689453125, -2.09246826171875, -1.936767578125, -1.78106689453125, -1.6253662109375, -1.46966552734375, -1.31396484375, -1.15826416015625, -1.0025634765625, -0.84686279296875, -0.691162109375, -0.53546142578125, -0.3797607421875, -0.22406005859375, -0.068359375, 0.08734130859375, 0.2430419921875, 0.39874267578125, 0.554443359375, 0.71014404296875, 0.8658447265625, 1.02154541015625, 1.17724609375, 1.33294677734375, 1.4886474609375, 1.64434814453125, 1.800048828125, 1.95574951171875, 2.1114501953125, 2.26715087890625, 2.4228515625, 2.57855224609375, 2.7342529296875, 2.88995361328125, 3.045654296875, 3.20135498046875, 3.3570556640625, 3.51275634765625, 3.66845703125, 3.82415771484375, 3.9798583984375, 4.13555908203125, 4.291259765625, 4.44696044921875, 4.6026611328125, 4.75836181640625, 4.9140625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 21.0, 10.0, 12.0, 27.0, 37.0, 44.0, 49.0, 81.0, 116.0, 194.0, 231.0, 389.0, 578.0, 850.0, 1304.0, 2073.0, 3585.0, 6161.0, 11485.0, 23504.0, 92927.0, 749995.0, 101592.0, 25051.0, 11848.0, 6360.0, 3816.0, 2185.0, 1364.0, 904.0, 536.0, 351.0, 266.0, 178.0, 126.0, 85.0, 54.0, 47.0, 22.0, 25.0, 29.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88623046875, -0.8540267944335938, -0.8218231201171875, -0.7896194458007812, -0.757415771484375, -0.7252120971679688, -0.6930084228515625, -0.6608047485351562, -0.62860107421875, -0.5963973999023438, -0.5641937255859375, -0.5319900512695312, -0.499786376953125, -0.46758270263671875, -0.4353790283203125, -0.40317535400390625, -0.3709716796875, -0.33876800537109375, -0.3065643310546875, -0.27436065673828125, -0.242156982421875, -0.20995330810546875, -0.1777496337890625, -0.14554595947265625, -0.11334228515625, -0.08113861083984375, -0.0489349365234375, -0.01673126220703125, 0.015472412109375, 0.04767608642578125, 0.0798797607421875, 0.11208343505859375, 0.144287109375, 0.17649078369140625, 0.2086944580078125, 0.24089813232421875, 0.273101806640625, 0.30530548095703125, 0.3375091552734375, 0.36971282958984375, 0.40191650390625, 0.43412017822265625, 0.4663238525390625, 0.49852752685546875, 0.530731201171875, 0.5629348754882812, 0.5951385498046875, 0.6273422241210938, 0.6595458984375, 0.6917495727539062, 0.7239532470703125, 0.7561569213867188, 0.788360595703125, 0.8205642700195312, 0.8527679443359375, 0.8849716186523438, 0.91717529296875, 0.9493789672851562, 0.9815826416015625, 1.0137863159179688, 1.045989990234375, 1.0781936645507812, 1.1103973388671875, 1.1426010131835938, 1.1748046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 3.0, 3.0, 3.0, 5.0, 6.0, 7.0, 10.0, 9.0, 18.0, 15.0, 23.0, 34.0, 42.0, 53.0, 61.0, 67.0, 80.0, 96.0, 77.0, 82.0, 67.0, 57.0, 35.0, 32.0, 22.0, 21.0, 19.0, 11.0, 7.0, 7.0, 0.0, 3.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003871917724609375, -0.00037439167499542236, -0.0003615915775299072, -0.0003487914800643921, -0.00033599138259887695, -0.0003231912851333618, -0.0003103911876678467, -0.00029759109020233154, -0.0002847909927368164, -0.00027199089527130127, -0.00025919079780578613, -0.000246390700340271, -0.00023359060287475586, -0.00022079050540924072, -0.00020799040794372559, -0.00019519031047821045, -0.0001823902130126953, -0.00016959011554718018, -0.00015679001808166504, -0.0001439899206161499, -0.00013118982315063477, -0.00011838972568511963, -0.00010558962821960449, -9.278953075408936e-05, -7.998943328857422e-05, -6.718933582305908e-05, -5.4389238357543945e-05, -4.158914089202881e-05, -2.8789043426513672e-05, -1.5988945960998535e-05, -3.1888484954833984e-06, 9.611248970031738e-06, 2.2411346435546875e-05, 3.521144390106201e-05, 4.801154136657715e-05, 6.0811638832092285e-05, 7.361173629760742e-05, 8.641183376312256e-05, 9.92119312286377e-05, 0.00011201202869415283, 0.00012481212615966797, 0.0001376122236251831, 0.00015041232109069824, 0.00016321241855621338, 0.00017601251602172852, 0.00018881261348724365, 0.0002016127109527588, 0.00021441280841827393, 0.00022721290588378906, 0.0002400130033493042, 0.00025281310081481934, 0.00026561319828033447, 0.0002784132957458496, 0.00029121339321136475, 0.0003040134906768799, 0.000316813588142395, 0.00032961368560791016, 0.0003424137830734253, 0.00035521388053894043, 0.00036801397800445557, 0.0003808140754699707, 0.00039361417293548584, 0.000406414270401001, 0.0004192143678665161, 0.00043201446533203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 11.0, 5.0, 19.0, 34.0, 46.0, 52.0, 92.0, 130.0, 194.0, 250.0, 408.0, 565.0, 861.0, 1309.0, 2033.0, 3011.0, 4779.0, 7294.0, 11581.0, 18948.0, 30534.0, 50608.0, 82711.0, 130418.0, 180051.0, 179611.0, 129308.0, 81842.0, 49995.0, 30351.0, 18915.0, 11720.0, 7320.0, 4706.0, 2950.0, 1995.0, 1267.0, 836.0, 582.0, 413.0, 247.0, 189.0, 117.0, 75.0, 61.0, 32.0, 24.0, 17.0, 14.0, 6.0, 6.0, 6.0, 3.0, 0.0, 4.0, 1.0, 1.0], "bins": [-0.456787109375, -0.4425086975097656, -0.42823028564453125, -0.4139518737792969, -0.3996734619140625, -0.3853950500488281, -0.37111663818359375, -0.3568382263183594, -0.342559814453125, -0.3282814025878906, -0.31400299072265625, -0.2997245788574219, -0.2854461669921875, -0.2711677551269531, -0.25688934326171875, -0.24261093139648438, -0.22833251953125, -0.21405410766601562, -0.19977569580078125, -0.18549728393554688, -0.1712188720703125, -0.15694046020507812, -0.14266204833984375, -0.12838363647460938, -0.114105224609375, -0.09982681274414062, -0.08554840087890625, -0.07126998901367188, -0.0569915771484375, -0.042713165283203125, -0.02843475341796875, -0.014156341552734375, 0.0001220703125, 0.014400482177734375, 0.02867889404296875, 0.042957305908203125, 0.0572357177734375, 0.07151412963867188, 0.08579254150390625, 0.10007095336914062, 0.114349365234375, 0.12862777709960938, 0.14290618896484375, 0.15718460083007812, 0.1714630126953125, 0.18574142456054688, 0.20001983642578125, 0.21429824829101562, 0.22857666015625, 0.24285507202148438, 0.25713348388671875, 0.2714118957519531, 0.2856903076171875, 0.2999687194824219, 0.31424713134765625, 0.3285255432128906, 0.342803955078125, 0.3570823669433594, 0.37136077880859375, 0.3856391906738281, 0.3999176025390625, 0.4141960144042969, 0.42847442626953125, 0.4427528381347656, 0.45703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 8.0, 8.0, 11.0, 15.0, 14.0, 17.0, 15.0, 24.0, 35.0, 22.0, 28.0, 32.0, 44.0, 34.0, 42.0, 56.0, 66.0, 54.0, 75.0, 44.0, 40.0, 38.0, 45.0, 35.0, 28.0, 26.0, 27.0, 21.0, 23.0, 13.0, 16.0, 10.0, 12.0, 10.0, 1.0, 5.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.157958984375, -0.15225982666015625, -0.1465606689453125, -0.14086151123046875, -0.135162353515625, -0.12946319580078125, -0.1237640380859375, -0.11806488037109375, -0.11236572265625, -0.10666656494140625, -0.1009674072265625, -0.09526824951171875, -0.089569091796875, -0.08386993408203125, -0.0781707763671875, -0.07247161865234375, -0.0667724609375, -0.06107330322265625, -0.0553741455078125, -0.04967498779296875, -0.043975830078125, -0.03827667236328125, -0.0325775146484375, -0.02687835693359375, -0.02117919921875, -0.01548004150390625, -0.0097808837890625, -0.00408172607421875, 0.001617431640625, 0.00731658935546875, 0.0130157470703125, 0.01871490478515625, 0.0244140625, 0.03011322021484375, 0.0358123779296875, 0.04151153564453125, 0.047210693359375, 0.05290985107421875, 0.0586090087890625, 0.06430816650390625, 0.07000732421875, 0.07570648193359375, 0.0814056396484375, 0.08710479736328125, 0.092803955078125, 0.09850311279296875, 0.1042022705078125, 0.10990142822265625, 0.1156005859375, 0.12129974365234375, 0.1269989013671875, 0.13269805908203125, 0.138397216796875, 0.14409637451171875, 0.1497955322265625, 0.15549468994140625, 0.16119384765625, 0.16689300537109375, 0.1725921630859375, 0.17829132080078125, 0.183990478515625, 0.18968963623046875, 0.1953887939453125, 0.20108795166015625, 0.206787109375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 10.0, 1.0, 6.0, 8.0, 12.0, 8.0, 10.0, 12.0, 15.0, 23.0, 21.0, 30.0, 36.0, 28.0, 31.0, 50.0, 40.0, 32.0, 46.0, 38.0, 45.0, 51.0, 40.0, 40.0, 29.0, 44.0, 40.0, 32.0, 29.0, 32.0, 21.0, 24.0, 27.0, 23.0, 14.0, 14.0, 10.0, 6.0, 6.0, 7.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.384288787841797, -4.223207950592041, -4.062127113342285, -3.9010465145111084, -3.7399659156799316, -3.578885078430176, -3.41780424118042, -3.256723403930664, -3.0956428050994873, -2.9345619678497314, -2.7734813690185547, -2.612400531768799, -2.451319694519043, -2.290239095687866, -2.1291582584381104, -1.968077540397644, -1.8069968223571777, -1.6459161043167114, -1.4848353862762451, -1.3237545490264893, -1.162673830986023, -1.0015931129455566, -0.8405123353004456, -0.6794315576553345, -0.5183508396148682, -0.35727009177207947, -0.19618934392929077, -0.035108596086502075, 0.12597215175628662, 0.28705286979675293, 0.448133647441864, 0.6092144250869751, 0.7702946662902832, 0.9313753843307495, 1.0924561023712158, 1.2535369396209717, 1.414617657661438, 1.5756983757019043, 1.7367792129516602, 1.8978599309921265, 2.0589406490325928, 2.2200214862823486, 2.3811020851135254, 2.5421829223632812, 2.703263759613037, 2.864344358444214, 3.0254251956939697, 3.1865057945251465, 3.3475866317749023, 3.508667469024658, 3.669748067855835, 3.830828905105591, 3.9919095039367676, 4.152990341186523, 4.314071178436279, 4.475152015686035, 4.636232376098633, 4.797313213348389, 4.9583940505981445, 5.119474411010742, 5.280555248260498, 5.441636085510254, 5.60271692276001, 5.763797760009766, 5.9248785972595215]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 7.0, 5.0, 10.0, 9.0, 14.0, 19.0, 26.0, 24.0, 16.0, 23.0, 27.0, 28.0, 31.0, 27.0, 42.0, 44.0, 51.0, 36.0, 40.0, 43.0, 45.0, 42.0, 38.0, 44.0, 36.0, 43.0, 33.0, 21.0, 29.0, 33.0, 19.0, 19.0, 18.0, 12.0, 15.0, 6.0, 8.0, 3.0, 2.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.684797286987305, -5.507685661315918, -5.330574035644531, -5.1534624099731445, -4.976350784301758, -4.799239158630371, -4.622127532958984, -4.445015907287598, -4.267904281616211, -4.090792655944824, -3.9136810302734375, -3.736569404602051, -3.559457778930664, -3.3823461532592773, -3.2052342891693115, -3.028122663497925, -2.851010799407959, -2.6738991737365723, -2.4967875480651855, -2.319675922393799, -2.142564296722412, -1.9654525518417358, -1.7883408069610596, -1.6112291812896729, -1.4341175556182861, -1.2570059299468994, -1.0798943042755127, -0.9027825593948364, -0.7256709337234497, -0.548559308052063, -0.3714475631713867, -0.1943359375, -0.017224788665771484, 0.15988686680793762, 0.33699852228164673, 0.5141102075576782, 0.6912218332290649, 0.8683334589004517, 1.045445203781128, 1.2225568294525146, 1.3996684551239014, 1.576780080795288, 1.7538917064666748, 1.931003451347351, 2.1081151962280273, 2.285226821899414, 2.462338447570801, 2.6394500732421875, 2.816561698913574, 2.993673324584961, 3.1707849502563477, 3.3478965759277344, 3.525008201599121, 3.702119827270508, 3.8792316913604736, 4.056343078613281, 4.233454704284668, 4.410566329956055, 4.587677955627441, 4.764789581298828, 4.941901206970215, 5.119012832641602, 5.296124458312988, 5.473236083984375, 5.65034818649292]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 8.0, 13.0, 16.0, 33.0, 53.0, 82.0, 162.0, 218.0, 320.0, 525.0, 809.0, 1157.0, 1769.0, 2807.0, 4002.0, 6297.0, 9117.0, 13409.0, 19363.0, 27265.0, 38132.0, 51075.0, 65631.0, 81007.0, 93698.0, 101823.0, 102425.0, 95017.0, 83074.0, 67819.0, 52141.0, 38964.0, 28219.0, 20027.0, 13955.0, 9340.0, 6369.0, 4305.0, 2796.0, 1854.0, 1157.0, 845.0, 520.0, 356.0, 210.0, 145.0, 101.0, 56.0, 32.0, 19.0, 11.0, 6.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.126953125, -3.02288818359375, -2.9188232421875, -2.81475830078125, -2.710693359375, -2.60662841796875, -2.5025634765625, -2.39849853515625, -2.29443359375, -2.19036865234375, -2.0863037109375, -1.98223876953125, -1.878173828125, -1.77410888671875, -1.6700439453125, -1.56597900390625, -1.4619140625, -1.35784912109375, -1.2537841796875, -1.14971923828125, -1.045654296875, -0.94158935546875, -0.8375244140625, -0.73345947265625, -0.62939453125, -0.52532958984375, -0.4212646484375, -0.31719970703125, -0.213134765625, -0.10906982421875, -0.0050048828125, 0.09906005859375, 0.203125, 0.30718994140625, 0.4112548828125, 0.51531982421875, 0.619384765625, 0.72344970703125, 0.8275146484375, 0.93157958984375, 1.03564453125, 1.13970947265625, 1.2437744140625, 1.34783935546875, 1.451904296875, 1.55596923828125, 1.6600341796875, 1.76409912109375, 1.8681640625, 1.97222900390625, 2.0762939453125, 2.18035888671875, 2.284423828125, 2.38848876953125, 2.4925537109375, 2.59661865234375, 2.70068359375, 2.80474853515625, 2.9088134765625, 3.01287841796875, 3.116943359375, 3.22100830078125, 3.3250732421875, 3.42913818359375, 3.533203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 8.0, 9.0, 8.0, 18.0, 16.0, 22.0, 22.0, 26.0, 15.0, 26.0, 31.0, 38.0, 25.0, 27.0, 34.0, 41.0, 38.0, 42.0, 50.0, 34.0, 56.0, 29.0, 45.0, 41.0, 41.0, 37.0, 26.0, 26.0, 18.0, 28.0, 18.0, 21.0, 22.0, 16.0, 15.0, 5.0, 3.0, 4.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.70703125, -5.537353515625, -5.36767578125, -5.197998046875, -5.0283203125, -4.858642578125, -4.68896484375, -4.519287109375, -4.349609375, -4.179931640625, -4.01025390625, -3.840576171875, -3.6708984375, -3.501220703125, -3.33154296875, -3.161865234375, -2.9921875, -2.822509765625, -2.65283203125, -2.483154296875, -2.3134765625, -2.143798828125, -1.97412109375, -1.804443359375, -1.634765625, -1.465087890625, -1.29541015625, -1.125732421875, -0.9560546875, -0.786376953125, -0.61669921875, -0.447021484375, -0.27734375, -0.107666015625, 0.06201171875, 0.231689453125, 0.4013671875, 0.571044921875, 0.74072265625, 0.910400390625, 1.080078125, 1.249755859375, 1.41943359375, 1.589111328125, 1.7587890625, 1.928466796875, 2.09814453125, 2.267822265625, 2.4375, 2.607177734375, 2.77685546875, 2.946533203125, 3.1162109375, 3.285888671875, 3.45556640625, 3.625244140625, 3.794921875, 3.964599609375, 4.13427734375, 4.303955078125, 4.4736328125, 4.643310546875, 4.81298828125, 4.982666015625, 5.15234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 16.0, 24.0, 31.0, 57.0, 94.0, 147.0, 248.0, 389.0, 621.0, 1020.0, 1667.0, 2949.0, 4961.0, 8569.0, 14606.0, 24058.0, 39260.0, 61194.0, 89774.0, 119250.0, 141037.0, 143504.0, 124499.0, 95609.0, 66706.0, 42815.0, 26507.0, 15863.0, 9475.0, 5518.0, 3286.0, 1870.0, 1104.0, 708.0, 456.0, 252.0, 160.0, 94.0, 48.0, 41.0, 21.0, 21.0, 11.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.10546875, -4.9412841796875, -4.777099609375, -4.6129150390625, -4.44873046875, -4.2845458984375, -4.120361328125, -3.9561767578125, -3.7919921875, -3.6278076171875, -3.463623046875, -3.2994384765625, -3.13525390625, -2.9710693359375, -2.806884765625, -2.6427001953125, -2.478515625, -2.3143310546875, -2.150146484375, -1.9859619140625, -1.82177734375, -1.6575927734375, -1.493408203125, -1.3292236328125, -1.1650390625, -1.0008544921875, -0.836669921875, -0.6724853515625, -0.50830078125, -0.3441162109375, -0.179931640625, -0.0157470703125, 0.1484375, 0.3126220703125, 0.476806640625, 0.6409912109375, 0.80517578125, 0.9693603515625, 1.133544921875, 1.2977294921875, 1.4619140625, 1.6260986328125, 1.790283203125, 1.9544677734375, 2.11865234375, 2.2828369140625, 2.447021484375, 2.6112060546875, 2.775390625, 2.9395751953125, 3.103759765625, 3.2679443359375, 3.43212890625, 3.5963134765625, 3.760498046875, 3.9246826171875, 4.0888671875, 4.2530517578125, 4.417236328125, 4.5814208984375, 4.74560546875, 4.9097900390625, 5.073974609375, 5.2381591796875, 5.40234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 12.0, 8.0, 8.0, 12.0, 10.0, 8.0, 32.0, 17.0, 20.0, 24.0, 32.0, 32.0, 41.0, 35.0, 42.0, 41.0, 30.0, 38.0, 39.0, 34.0, 49.0, 38.0, 51.0, 29.0, 36.0, 38.0, 32.0, 30.0, 27.0, 22.0, 23.0, 17.0, 15.0, 11.0, 6.0, 11.0, 13.0, 6.0, 12.0, 5.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-4.12890625, -4.013214111328125, -3.89752197265625, -3.781829833984375, -3.6661376953125, -3.550445556640625, -3.43475341796875, -3.319061279296875, -3.203369140625, -3.087677001953125, -2.97198486328125, -2.856292724609375, -2.7406005859375, -2.624908447265625, -2.50921630859375, -2.393524169921875, -2.27783203125, -2.162139892578125, -2.04644775390625, -1.930755615234375, -1.8150634765625, -1.699371337890625, -1.58367919921875, -1.467987060546875, -1.352294921875, -1.236602783203125, -1.12091064453125, -1.005218505859375, -0.8895263671875, -0.773834228515625, -0.65814208984375, -0.542449951171875, -0.4267578125, -0.311065673828125, -0.19537353515625, -0.079681396484375, 0.0360107421875, 0.151702880859375, 0.26739501953125, 0.383087158203125, 0.498779296875, 0.614471435546875, 0.73016357421875, 0.845855712890625, 0.9615478515625, 1.077239990234375, 1.19293212890625, 1.308624267578125, 1.42431640625, 1.540008544921875, 1.65570068359375, 1.771392822265625, 1.8870849609375, 2.002777099609375, 2.11846923828125, 2.234161376953125, 2.349853515625, 2.465545654296875, 2.58123779296875, 2.696929931640625, 2.8126220703125, 2.928314208984375, 3.04400634765625, 3.159698486328125, 3.275390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 10.0, 17.0, 16.0, 28.0, 44.0, 73.0, 106.0, 179.0, 281.0, 479.0, 826.0, 1326.0, 2302.0, 4109.0, 7635.0, 13678.0, 26065.0, 50000.0, 93840.0, 158348.0, 210552.0, 194712.0, 129166.0, 72148.0, 37995.0, 20166.0, 10647.0, 5810.0, 3256.0, 1928.0, 1098.0, 641.0, 376.0, 254.0, 146.0, 108.0, 56.0, 43.0, 29.0, 10.0, 11.0, 10.0, 10.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.11328125, -3.015350341796875, -2.91741943359375, -2.819488525390625, -2.7215576171875, -2.623626708984375, -2.52569580078125, -2.427764892578125, -2.329833984375, -2.231903076171875, -2.13397216796875, -2.036041259765625, -1.9381103515625, -1.840179443359375, -1.74224853515625, -1.644317626953125, -1.54638671875, -1.448455810546875, -1.35052490234375, -1.252593994140625, -1.1546630859375, -1.056732177734375, -0.95880126953125, -0.860870361328125, -0.762939453125, -0.665008544921875, -0.56707763671875, -0.469146728515625, -0.3712158203125, -0.273284912109375, -0.17535400390625, -0.077423095703125, 0.0205078125, 0.118438720703125, 0.21636962890625, 0.314300537109375, 0.4122314453125, 0.510162353515625, 0.60809326171875, 0.706024169921875, 0.803955078125, 0.901885986328125, 0.99981689453125, 1.097747802734375, 1.1956787109375, 1.293609619140625, 1.39154052734375, 1.489471435546875, 1.58740234375, 1.685333251953125, 1.78326416015625, 1.881195068359375, 1.9791259765625, 2.077056884765625, 2.17498779296875, 2.272918701171875, 2.370849609375, 2.468780517578125, 2.56671142578125, 2.664642333984375, 2.7625732421875, 2.860504150390625, 2.95843505859375, 3.056365966796875, 3.154296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 11.0, 7.0, 20.0, 10.0, 16.0, 21.0, 27.0, 28.0, 44.0, 59.0, 59.0, 71.0, 79.0, 92.0, 76.0, 79.0, 61.0, 55.0, 40.0, 35.0, 30.0, 24.0, 11.0, 10.0, 13.0, 7.0, 4.0, 5.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004169940948486328, -0.00040593743324279785, -0.0003948807716369629, -0.00038382411003112793, -0.00037276744842529297, -0.000361710786819458, -0.00035065412521362305, -0.0003395974636077881, -0.0003285408020019531, -0.00031748414039611816, -0.0003064274787902832, -0.00029537081718444824, -0.0002843141555786133, -0.0002732574939727783, -0.00026220083236694336, -0.0002511441707611084, -0.00024008750915527344, -0.00022903084754943848, -0.00021797418594360352, -0.00020691752433776855, -0.0001958608627319336, -0.00018480420112609863, -0.00017374753952026367, -0.0001626908779144287, -0.00015163421630859375, -0.0001405775547027588, -0.00012952089309692383, -0.00011846423149108887, -0.0001074075698852539, -9.635090827941895e-05, -8.529424667358398e-05, -7.423758506774902e-05, -6.318092346191406e-05, -5.21242618560791e-05, -4.106760025024414e-05, -3.001093864440918e-05, -1.895427703857422e-05, -7.897615432739258e-06, 3.159046173095703e-06, 1.4215707778930664e-05, 2.5272369384765625e-05, 3.6329030990600586e-05, 4.738569259643555e-05, 5.844235420227051e-05, 6.949901580810547e-05, 8.055567741394043e-05, 9.161233901977539e-05, 0.00010266900062561035, 0.00011372566223144531, 0.00012478232383728027, 0.00013583898544311523, 0.0001468956470489502, 0.00015795230865478516, 0.00016900897026062012, 0.00018006563186645508, 0.00019112229347229004, 0.000202178955078125, 0.00021323561668395996, 0.00022429227828979492, 0.00023534893989562988, 0.00024640560150146484, 0.0002574622631072998, 0.00026851892471313477, 0.0002795755863189697, 0.0002906322479248047]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 4.0, 6.0, 15.0, 19.0, 41.0, 54.0, 69.0, 120.0, 200.0, 275.0, 508.0, 802.0, 1207.0, 1930.0, 3126.0, 5141.0, 8532.0, 13799.0, 23073.0, 37252.0, 59884.0, 90616.0, 125884.0, 151810.0, 152311.0, 125282.0, 90299.0, 59825.0, 37403.0, 23065.0, 13910.0, 8519.0, 5140.0, 3097.0, 1963.0, 1233.0, 785.0, 493.0, 306.0, 187.0, 127.0, 93.0, 54.0, 39.0, 25.0, 13.0, 11.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.263671875, -2.19293212890625, -2.1221923828125, -2.05145263671875, -1.980712890625, -1.90997314453125, -1.8392333984375, -1.76849365234375, -1.69775390625, -1.62701416015625, -1.5562744140625, -1.48553466796875, -1.414794921875, -1.34405517578125, -1.2733154296875, -1.20257568359375, -1.1318359375, -1.06109619140625, -0.9903564453125, -0.91961669921875, -0.848876953125, -0.77813720703125, -0.7073974609375, -0.63665771484375, -0.56591796875, -0.49517822265625, -0.4244384765625, -0.35369873046875, -0.282958984375, -0.21221923828125, -0.1414794921875, -0.07073974609375, 0.0, 0.07073974609375, 0.1414794921875, 0.21221923828125, 0.282958984375, 0.35369873046875, 0.4244384765625, 0.49517822265625, 0.56591796875, 0.63665771484375, 0.7073974609375, 0.77813720703125, 0.848876953125, 0.91961669921875, 0.9903564453125, 1.06109619140625, 1.1318359375, 1.20257568359375, 1.2733154296875, 1.34405517578125, 1.414794921875, 1.48553466796875, 1.5562744140625, 1.62701416015625, 1.69775390625, 1.76849365234375, 1.8392333984375, 1.90997314453125, 1.980712890625, 2.05145263671875, 2.1221923828125, 2.19293212890625, 2.263671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 6.0, 10.0, 12.0, 14.0, 7.0, 12.0, 22.0, 27.0, 19.0, 27.0, 36.0, 29.0, 48.0, 28.0, 39.0, 48.0, 49.0, 48.0, 46.0, 41.0, 43.0, 45.0, 33.0, 43.0, 44.0, 34.0, 31.0, 25.0, 17.0, 20.0, 22.0, 10.0, 10.0, 8.0, 5.0, 3.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0], "bins": [-0.9306640625, -0.9060134887695312, -0.8813629150390625, -0.8567123413085938, -0.832061767578125, -0.8074111938476562, -0.7827606201171875, -0.7581100463867188, -0.73345947265625, -0.7088088989257812, -0.6841583251953125, -0.6595077514648438, -0.634857177734375, -0.6102066040039062, -0.5855560302734375, -0.5609054565429688, -0.5362548828125, -0.5116043090820312, -0.4869537353515625, -0.46230316162109375, -0.437652587890625, -0.41300201416015625, -0.3883514404296875, -0.36370086669921875, -0.33905029296875, -0.31439971923828125, -0.2897491455078125, -0.26509857177734375, -0.240447998046875, -0.21579742431640625, -0.1911468505859375, -0.16649627685546875, -0.141845703125, -0.11719512939453125, -0.0925445556640625, -0.06789398193359375, -0.043243408203125, -0.01859283447265625, 0.0060577392578125, 0.03070831298828125, 0.05535888671875, 0.08000946044921875, 0.1046600341796875, 0.12931060791015625, 0.153961181640625, 0.17861175537109375, 0.2032623291015625, 0.22791290283203125, 0.2525634765625, 0.27721405029296875, 0.3018646240234375, 0.32651519775390625, 0.351165771484375, 0.37581634521484375, 0.4004669189453125, 0.42511749267578125, 0.44976806640625, 0.47441864013671875, 0.4990692138671875, 0.5237197875976562, 0.548370361328125, 0.5730209350585938, 0.5976715087890625, 0.6223220825195312, 0.64697265625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 7.0, 4.0, 5.0, 20.0, 20.0, 18.0, 25.0, 19.0, 32.0, 28.0, 26.0, 31.0, 23.0, 40.0, 34.0, 49.0, 44.0, 42.0, 31.0, 38.0, 33.0, 30.0, 38.0, 32.0, 36.0, 33.0, 27.0, 31.0, 27.0, 20.0, 22.0, 24.0, 19.0, 21.0, 9.0, 18.0, 7.0, 4.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.420706748962402, -4.278234958648682, -4.135763168334961, -3.9932916164398193, -3.8508200645446777, -3.708348274230957, -3.5658764839172363, -3.4234046936035156, -3.280933141708374, -3.1384613513946533, -2.9959897994995117, -2.853518009185791, -2.7110462188720703, -2.5685746669769287, -2.426102876663208, -2.2836313247680664, -2.1411595344543457, -1.9986878633499146, -1.8562161922454834, -1.7137444019317627, -1.5712727308273315, -1.4288010597229004, -1.2863292694091797, -1.1438575983047485, -1.0013859272003174, -0.8589142560958862, -0.7164425253868103, -0.5739707946777344, -0.4314991235733032, -0.28902745246887207, -0.14655572175979614, -0.004083991050720215, 0.13838815689086914, 0.2808598577976227, 0.4233315587043762, 0.5658032894134521, 0.7082749605178833, 0.8507466316223145, 0.9932183623313904, 1.1356900930404663, 1.2781617641448975, 1.4206334352493286, 1.5631051063537598, 1.7055768966674805, 1.8480485677719116, 1.9905202388763428, 2.1329920291900635, 2.275463581085205, 2.417935371398926, 2.5604071617126465, 2.702878713607788, 2.845350503921509, 2.9878220558166504, 3.130293846130371, 3.272765636444092, 3.4152374267578125, 3.557708978652954, 3.700180768966675, 3.8426523208618164, 3.985124111175537, 4.127595901489258, 4.27006721496582, 4.412539005279541, 4.555010795593262, 4.697482585906982]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 8.0, 8.0, 8.0, 10.0, 12.0, 13.0, 14.0, 14.0, 17.0, 15.0, 34.0, 27.0, 38.0, 29.0, 42.0, 30.0, 32.0, 55.0, 34.0, 42.0, 36.0, 50.0, 49.0, 38.0, 38.0, 37.0, 40.0, 28.0, 28.0, 32.0, 23.0, 28.0, 19.0, 17.0, 18.0, 10.0, 9.0, 9.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.793173313140869, -5.607846736907959, -5.422519683837891, -5.2371931076049805, -5.05186653137207, -4.86653995513916, -4.681212902069092, -4.495886325836182, -4.310559272766113, -4.125232696533203, -3.939905881881714, -3.7545790672302246, -3.5692524909973145, -3.383925676345825, -3.198598861694336, -3.013272285461426, -2.8279457092285156, -2.6426188945770264, -2.457292318344116, -2.271965503692627, -2.086638927459717, -1.9013121128082275, -1.7159852981567383, -1.5306586027145386, -1.3453319072723389, -1.1600052118301392, -0.9746784567832947, -0.7893517017364502, -0.6040250062942505, -0.4186983108520508, -0.23337149620056152, -0.048044800758361816, 0.1372814178466797, 0.3226081430912018, 0.5079348683357239, 0.6932616233825684, 0.8785883188247681, 1.0639150142669678, 1.249241828918457, 1.4345685243606567, 1.6198952198028564, 1.8052219152450562, 1.9905486106872559, 2.175875425338745, 2.3612022399902344, 2.5465288162231445, 2.731855630874634, 2.917182445526123, 3.102509021759033, 3.2878358364105225, 3.4731624126434326, 3.658489227294922, 3.843815803527832, 4.029142379760742, 4.2144694328308105, 4.399796009063721, 4.585123062133789, 4.770449638366699, 4.955776691436768, 5.141103267669678, 5.326429843902588, 5.511756896972656, 5.697083473205566, 5.882410049438477, 6.067736625671387]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [3.0, 5.0, 6.0, 7.0, 10.0, 10.0, 16.0, 33.0, 57.0, 102.0, 123.0, 218.0, 318.0, 506.0, 740.0, 1159.0, 1816.0, 2774.0, 4289.0, 6821.0, 10770.0, 16739.0, 27673.0, 45953.0, 77805.0, 133598.0, 229748.0, 369853.0, 533693.0, 647814.0, 643457.0, 524590.0, 365140.0, 224577.0, 130984.0, 76177.0, 44357.0, 26680.0, 16566.0, 10406.0, 6602.0, 4120.0, 2690.0, 1775.0, 1184.0, 810.0, 514.0, 337.0, 214.0, 158.0, 104.0, 63.0, 44.0, 29.0, 18.0, 16.0, 9.0, 11.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0], "bins": [-3.35546875, -3.2435302734375, -3.131591796875, -3.0196533203125, -2.90771484375, -2.7957763671875, -2.683837890625, -2.5718994140625, -2.4599609375, -2.3480224609375, -2.236083984375, -2.1241455078125, -2.01220703125, -1.9002685546875, -1.788330078125, -1.6763916015625, -1.564453125, -1.4525146484375, -1.340576171875, -1.2286376953125, -1.11669921875, -1.0047607421875, -0.892822265625, -0.7808837890625, -0.6689453125, -0.5570068359375, -0.445068359375, -0.3331298828125, -0.22119140625, -0.1092529296875, 0.002685546875, 0.1146240234375, 0.2265625, 0.3385009765625, 0.450439453125, 0.5623779296875, 0.67431640625, 0.7862548828125, 0.898193359375, 1.0101318359375, 1.1220703125, 1.2340087890625, 1.345947265625, 1.4578857421875, 1.56982421875, 1.6817626953125, 1.793701171875, 1.9056396484375, 2.017578125, 2.1295166015625, 2.241455078125, 2.3533935546875, 2.46533203125, 2.5772705078125, 2.689208984375, 2.8011474609375, 2.9130859375, 3.0250244140625, 3.136962890625, 3.2489013671875, 3.36083984375, 3.4727783203125, 3.584716796875, 3.6966552734375, 3.80859375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 4.0, 11.0, 11.0, 12.0, 15.0, 13.0, 24.0, 20.0, 23.0, 21.0, 25.0, 41.0, 38.0, 28.0, 38.0, 46.0, 47.0, 50.0, 50.0, 51.0, 45.0, 56.0, 32.0, 27.0, 46.0, 31.0, 35.0, 25.0, 23.0, 26.0, 19.0, 18.0, 15.0, 16.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.9232177734375, -4.756591796875, -4.5899658203125, -4.42333984375, -4.2567138671875, -4.090087890625, -3.9234619140625, -3.7568359375, -3.5902099609375, -3.423583984375, -3.2569580078125, -3.09033203125, -2.9237060546875, -2.757080078125, -2.5904541015625, -2.423828125, -2.2572021484375, -2.090576171875, -1.9239501953125, -1.75732421875, -1.5906982421875, -1.424072265625, -1.2574462890625, -1.0908203125, -0.9241943359375, -0.757568359375, -0.5909423828125, -0.42431640625, -0.2576904296875, -0.091064453125, 0.0755615234375, 0.2421875, 0.4088134765625, 0.575439453125, 0.7420654296875, 0.90869140625, 1.0753173828125, 1.241943359375, 1.4085693359375, 1.5751953125, 1.7418212890625, 1.908447265625, 2.0750732421875, 2.24169921875, 2.4083251953125, 2.574951171875, 2.7415771484375, 2.908203125, 3.0748291015625, 3.241455078125, 3.4080810546875, 3.57470703125, 3.7413330078125, 3.907958984375, 4.0745849609375, 4.2412109375, 4.4078369140625, 4.574462890625, 4.7410888671875, 4.90771484375, 5.0743408203125, 5.240966796875, 5.4075927734375, 5.57421875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 7.0, 5.0, 3.0, 8.0, 16.0, 17.0, 42.0, 56.0, 82.0, 121.0, 188.0, 310.0, 502.0, 738.0, 1131.0, 1839.0, 2949.0, 4747.0, 7923.0, 12723.0, 20775.0, 34438.0, 56592.0, 93930.0, 153092.0, 245171.0, 375783.0, 532903.0, 648360.0, 624646.0, 487462.0, 334557.0, 213264.0, 133324.0, 80668.0, 48990.0, 29744.0, 18135.0, 11133.0, 6719.0, 4149.0, 2652.0, 1598.0, 1023.0, 635.0, 398.0, 257.0, 169.0, 104.0, 83.0, 44.0, 27.0, 20.0, 13.0, 7.0, 14.0, 5.0, 3.0, 0.0, 2.0, 1.0], "bins": [-4.23828125, -4.105224609375, -3.97216796875, -3.839111328125, -3.7060546875, -3.572998046875, -3.43994140625, -3.306884765625, -3.173828125, -3.040771484375, -2.90771484375, -2.774658203125, -2.6416015625, -2.508544921875, -2.37548828125, -2.242431640625, -2.109375, -1.976318359375, -1.84326171875, -1.710205078125, -1.5771484375, -1.444091796875, -1.31103515625, -1.177978515625, -1.044921875, -0.911865234375, -0.77880859375, -0.645751953125, -0.5126953125, -0.379638671875, -0.24658203125, -0.113525390625, 0.01953125, 0.152587890625, 0.28564453125, 0.418701171875, 0.5517578125, 0.684814453125, 0.81787109375, 0.950927734375, 1.083984375, 1.217041015625, 1.35009765625, 1.483154296875, 1.6162109375, 1.749267578125, 1.88232421875, 2.015380859375, 2.1484375, 2.281494140625, 2.41455078125, 2.547607421875, 2.6806640625, 2.813720703125, 2.94677734375, 3.079833984375, 3.212890625, 3.345947265625, 3.47900390625, 3.612060546875, 3.7451171875, 3.878173828125, 4.01123046875, 4.144287109375, 4.27734375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 9.0, 6.0, 18.0, 12.0, 33.0, 23.0, 27.0, 49.0, 74.0, 75.0, 77.0, 122.0, 147.0, 163.0, 193.0, 233.0, 233.0, 245.0, 274.0, 245.0, 287.0, 246.0, 211.0, 203.0, 169.0, 140.0, 122.0, 96.0, 81.0, 64.0, 57.0, 42.0, 28.0, 12.0, 15.0, 13.0, 4.0, 9.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.203125, -2.1358642578125, -2.068603515625, -2.0013427734375, -1.93408203125, -1.8668212890625, -1.799560546875, -1.7322998046875, -1.6650390625, -1.5977783203125, -1.530517578125, -1.4632568359375, -1.39599609375, -1.3287353515625, -1.261474609375, -1.1942138671875, -1.126953125, -1.0596923828125, -0.992431640625, -0.9251708984375, -0.85791015625, -0.7906494140625, -0.723388671875, -0.6561279296875, -0.5888671875, -0.5216064453125, -0.454345703125, -0.3870849609375, -0.31982421875, -0.2525634765625, -0.185302734375, -0.1180419921875, -0.05078125, 0.0164794921875, 0.083740234375, 0.1510009765625, 0.21826171875, 0.2855224609375, 0.352783203125, 0.4200439453125, 0.4873046875, 0.5545654296875, 0.621826171875, 0.6890869140625, 0.75634765625, 0.8236083984375, 0.890869140625, 0.9581298828125, 1.025390625, 1.0926513671875, 1.159912109375, 1.2271728515625, 1.29443359375, 1.3616943359375, 1.428955078125, 1.4962158203125, 1.5634765625, 1.6307373046875, 1.697998046875, 1.7652587890625, 1.83251953125, 1.8997802734375, 1.967041015625, 2.0343017578125, 2.1015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 9.0, 13.0, 11.0, 21.0, 21.0, 25.0, 28.0, 30.0, 22.0, 38.0, 41.0, 31.0, 26.0, 35.0, 46.0, 46.0, 38.0, 37.0, 40.0, 36.0, 35.0, 38.0, 43.0, 23.0, 28.0, 24.0, 18.0, 35.0, 24.0, 18.0, 19.0, 17.0, 18.0, 12.0, 9.0, 9.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.319413185119629, -4.176229476928711, -4.033046245574951, -3.889862537384033, -3.7466788291931152, -3.6034953594207764, -3.4603118896484375, -3.3171281814575195, -3.1739444732666016, -3.0307610034942627, -2.8875772953033447, -2.744393825531006, -2.601210117340088, -2.458026647567749, -2.31484317779541, -2.171659469604492, -2.0284759998321533, -1.885292410850525, -1.7421088218688965, -1.5989253520965576, -1.4557416439056396, -1.3125581741333008, -1.1693745851516724, -1.026190996170044, -0.8830074071884155, -0.7398238182067871, -0.5966402292251587, -0.45345669984817505, -0.31027311086654663, -0.1670895218849182, -0.02390599250793457, 0.11927759647369385, 0.26246118545532227, 0.4056447744369507, 0.5488283634185791, 0.6920118927955627, 0.8351954817771912, 0.9783790707588196, 1.1215626001358032, 1.2647461891174316, 1.40792977809906, 1.5511133670806885, 1.694296956062317, 1.8374805450439453, 1.9806640148162842, 2.123847723007202, 2.267031192779541, 2.410214900970459, 2.553398370742798, 2.6965818405151367, 2.8397655487060547, 2.9829490184783936, 3.1261327266693115, 3.2693161964416504, 3.4124999046325684, 3.5556833744049072, 3.698866844177246, 3.842050313949585, 3.985234022140503, 4.128417491912842, 4.27160120010376, 4.414784908294678, 4.5579681396484375, 4.7011518478393555, 4.844335556030273]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 3.0, 5.0, 7.0, 12.0, 15.0, 17.0, 16.0, 8.0, 22.0, 19.0, 21.0, 31.0, 29.0, 32.0, 27.0, 32.0, 36.0, 37.0, 37.0, 41.0, 50.0, 43.0, 42.0, 39.0, 49.0, 32.0, 42.0, 23.0, 37.0, 27.0, 35.0, 20.0, 16.0, 15.0, 9.0, 19.0, 13.0, 14.0, 9.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.253361225128174, -5.088160037994385, -4.9229583740234375, -4.757757186889648, -4.592555999755859, -4.42735481262207, -4.262153148651123, -4.096951961517334, -3.931750535964966, -3.7665491104125977, -3.6013479232788086, -3.4361464977264404, -3.2709450721740723, -3.105743885040283, -2.940542459487915, -2.775341033935547, -2.610139846801758, -2.4449384212493896, -2.2797372341156006, -2.1145358085632324, -1.9493345022201538, -1.7841331958770752, -1.618931770324707, -1.4537304639816284, -1.2885291576385498, -1.1233278512954712, -0.9581264853477478, -0.7929251194000244, -0.6277238130569458, -0.4625225067138672, -0.2973211407661438, -0.1321197748184204, 0.0330815315246582, 0.1982828676700592, 0.3634842038154602, 0.5286855697631836, 0.6938868761062622, 0.8590881824493408, 1.024289608001709, 1.1894909143447876, 1.3546922206878662, 1.5198935270309448, 1.6850948333740234, 1.8502962589263916, 2.0154976844787598, 2.180698871612549, 2.345900297164917, 2.511101722717285, 2.676302909851074, 2.8415043354034424, 3.0067055225372314, 3.1719069480895996, 3.3371081352233887, 3.502309560775757, 3.667510986328125, 3.832712173461914, 3.9979135990142822, 4.16311502456665, 4.3283162117004395, 4.4935173988342285, 4.658719062805176, 4.823920249938965, 4.989121437072754, 5.154323101043701, 5.31952428817749]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 10.0, 15.0, 12.0, 38.0, 53.0, 71.0, 140.0, 189.0, 304.0, 552.0, 894.0, 1507.0, 2538.0, 4391.0, 7563.0, 13283.0, 23442.0, 41434.0, 70158.0, 111205.0, 156790.0, 178301.0, 157153.0, 111768.0, 69951.0, 41194.0, 23611.0, 13508.0, 7656.0, 4378.0, 2531.0, 1529.0, 954.0, 558.0, 345.0, 212.0, 119.0, 72.0, 41.0, 41.0, 24.0, 14.0, 8.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.572265625, -2.482025146484375, -2.39178466796875, -2.301544189453125, -2.2113037109375, -2.121063232421875, -2.03082275390625, -1.940582275390625, -1.850341796875, -1.760101318359375, -1.66986083984375, -1.579620361328125, -1.4893798828125, -1.399139404296875, -1.30889892578125, -1.218658447265625, -1.12841796875, -1.038177490234375, -0.94793701171875, -0.857696533203125, -0.7674560546875, -0.677215576171875, -0.58697509765625, -0.496734619140625, -0.406494140625, -0.316253662109375, -0.22601318359375, -0.135772705078125, -0.0455322265625, 0.044708251953125, 0.13494873046875, 0.225189208984375, 0.3154296875, 0.405670166015625, 0.49591064453125, 0.586151123046875, 0.6763916015625, 0.766632080078125, 0.85687255859375, 0.947113037109375, 1.037353515625, 1.127593994140625, 1.21783447265625, 1.308074951171875, 1.3983154296875, 1.488555908203125, 1.57879638671875, 1.669036865234375, 1.75927734375, 1.849517822265625, 1.93975830078125, 2.029998779296875, 2.1202392578125, 2.210479736328125, 2.30072021484375, 2.390960693359375, 2.481201171875, 2.571441650390625, 2.66168212890625, 2.751922607421875, 2.8421630859375, 2.932403564453125, 3.02264404296875, 3.112884521484375, 3.203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 4.0, 5.0, 5.0, 8.0, 14.0, 12.0, 7.0, 16.0, 19.0, 19.0, 18.0, 27.0, 37.0, 28.0, 31.0, 32.0, 35.0, 43.0, 33.0, 38.0, 35.0, 40.0, 38.0, 46.0, 45.0, 34.0, 40.0, 31.0, 37.0, 31.0, 29.0, 24.0, 18.0, 17.0, 21.0, 10.0, 15.0, 12.0, 11.0, 12.0, 7.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.4921875, -5.32794189453125, -5.1636962890625, -4.99945068359375, -4.835205078125, -4.67095947265625, -4.5067138671875, -4.34246826171875, -4.17822265625, -4.01397705078125, -3.8497314453125, -3.68548583984375, -3.521240234375, -3.35699462890625, -3.1927490234375, -3.02850341796875, -2.8642578125, -2.70001220703125, -2.5357666015625, -2.37152099609375, -2.207275390625, -2.04302978515625, -1.8787841796875, -1.71453857421875, -1.55029296875, -1.38604736328125, -1.2218017578125, -1.05755615234375, -0.893310546875, -0.72906494140625, -0.5648193359375, -0.40057373046875, -0.236328125, -0.07208251953125, 0.0921630859375, 0.25640869140625, 0.420654296875, 0.58489990234375, 0.7491455078125, 0.91339111328125, 1.07763671875, 1.24188232421875, 1.4061279296875, 1.57037353515625, 1.734619140625, 1.89886474609375, 2.0631103515625, 2.22735595703125, 2.3916015625, 2.55584716796875, 2.7200927734375, 2.88433837890625, 3.048583984375, 3.21282958984375, 3.3770751953125, 3.54132080078125, 3.70556640625, 3.86981201171875, 4.0340576171875, 4.19830322265625, 4.362548828125, 4.52679443359375, 4.6910400390625, 4.85528564453125, 5.01953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 7.0, 16.0, 17.0, 21.0, 21.0, 38.0, 39.0, 64.0, 85.0, 119.0, 251.0, 470.0, 884.0, 1994.0, 4550.0, 10588.0, 25605.0, 111171.0, 817091.0, 44128.0, 17788.0, 7466.0, 3196.0, 1402.0, 660.0, 324.0, 187.0, 118.0, 77.0, 55.0, 30.0, 26.0, 14.0, 18.0, 6.0, 9.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.69140625, -7.44561767578125, -7.1998291015625, -6.95404052734375, -6.708251953125, -6.46246337890625, -6.2166748046875, -5.97088623046875, -5.72509765625, -5.47930908203125, -5.2335205078125, -4.98773193359375, -4.741943359375, -4.49615478515625, -4.2503662109375, -4.00457763671875, -3.7587890625, -3.51300048828125, -3.2672119140625, -3.02142333984375, -2.775634765625, -2.52984619140625, -2.2840576171875, -2.03826904296875, -1.79248046875, -1.54669189453125, -1.3009033203125, -1.05511474609375, -0.809326171875, -0.56353759765625, -0.3177490234375, -0.07196044921875, 0.173828125, 0.41961669921875, 0.6654052734375, 0.91119384765625, 1.156982421875, 1.40277099609375, 1.6485595703125, 1.89434814453125, 2.14013671875, 2.38592529296875, 2.6317138671875, 2.87750244140625, 3.123291015625, 3.36907958984375, 3.6148681640625, 3.86065673828125, 4.1064453125, 4.35223388671875, 4.5980224609375, 4.84381103515625, 5.089599609375, 5.33538818359375, 5.5811767578125, 5.82696533203125, 6.07275390625, 6.31854248046875, 6.5643310546875, 6.81011962890625, 7.055908203125, 7.30169677734375, 7.5474853515625, 7.79327392578125, 8.0390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 9.0, 5.0, 6.0, 9.0, 11.0, 12.0, 17.0, 21.0, 14.0, 20.0, 26.0, 25.0, 31.0, 31.0, 29.0, 35.0, 26.0, 38.0, 40.0, 32.0, 40.0, 49.0, 42.0, 47.0, 36.0, 38.0, 42.0, 36.0, 32.0, 38.0, 31.0, 25.0, 22.0, 19.0, 19.0, 9.0, 9.0, 5.0, 11.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.31640625, -4.17205810546875, -4.0277099609375, -3.88336181640625, -3.739013671875, -3.59466552734375, -3.4503173828125, -3.30596923828125, -3.16162109375, -3.01727294921875, -2.8729248046875, -2.72857666015625, -2.584228515625, -2.43988037109375, -2.2955322265625, -2.15118408203125, -2.0068359375, -1.86248779296875, -1.7181396484375, -1.57379150390625, -1.429443359375, -1.28509521484375, -1.1407470703125, -0.99639892578125, -0.85205078125, -0.70770263671875, -0.5633544921875, -0.41900634765625, -0.274658203125, -0.13031005859375, 0.0140380859375, 0.15838623046875, 0.302734375, 0.44708251953125, 0.5914306640625, 0.73577880859375, 0.880126953125, 1.02447509765625, 1.1688232421875, 1.31317138671875, 1.45751953125, 1.60186767578125, 1.7462158203125, 1.89056396484375, 2.034912109375, 2.17926025390625, 2.3236083984375, 2.46795654296875, 2.6123046875, 2.75665283203125, 2.9010009765625, 3.04534912109375, 3.189697265625, 3.33404541015625, 3.4783935546875, 3.62274169921875, 3.76708984375, 3.91143798828125, 4.0557861328125, 4.20013427734375, 4.344482421875, 4.48883056640625, 4.6331787109375, 4.77752685546875, 4.921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 10.0, 19.0, 24.0, 51.0, 71.0, 167.0, 326.0, 634.0, 1331.0, 2960.0, 6976.0, 17756.0, 62424.0, 859696.0, 65170.0, 18111.0, 7043.0, 2979.0, 1418.0, 658.0, 345.0, 163.0, 106.0, 52.0, 30.0, 13.0, 12.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.359375, -1.3231353759765625, -1.286895751953125, -1.2506561279296875, -1.21441650390625, -1.1781768798828125, -1.141937255859375, -1.1056976318359375, -1.0694580078125, -1.0332183837890625, -0.996978759765625, -0.9607391357421875, -0.92449951171875, -0.8882598876953125, -0.852020263671875, -0.8157806396484375, -0.779541015625, -0.7433013916015625, -0.707061767578125, -0.6708221435546875, -0.63458251953125, -0.5983428955078125, -0.562103271484375, -0.5258636474609375, -0.4896240234375, -0.4533843994140625, -0.417144775390625, -0.3809051513671875, -0.34466552734375, -0.3084259033203125, -0.272186279296875, -0.2359466552734375, -0.19970703125, -0.1634674072265625, -0.127227783203125, -0.0909881591796875, -0.05474853515625, -0.0185089111328125, 0.017730712890625, 0.0539703369140625, 0.0902099609375, 0.1264495849609375, 0.162689208984375, 0.1989288330078125, 0.23516845703125, 0.2714080810546875, 0.307647705078125, 0.3438873291015625, 0.380126953125, 0.4163665771484375, 0.452606201171875, 0.4888458251953125, 0.52508544921875, 0.5613250732421875, 0.597564697265625, 0.6338043212890625, 0.6700439453125, 0.7062835693359375, 0.742523193359375, 0.7787628173828125, 0.81500244140625, 0.8512420654296875, 0.887481689453125, 0.9237213134765625, 0.9599609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 5.0, 7.0, 8.0, 15.0, 20.0, 18.0, 32.0, 33.0, 53.0, 75.0, 71.0, 99.0, 118.0, 107.0, 83.0, 54.0, 46.0, 30.0, 20.0, 21.0, 19.0, 13.0, 8.0, 7.0, 7.0, 5.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023353099822998047, -0.00022614933550357819, -0.0002187676727771759, -0.00021138601005077362, -0.00020400434732437134, -0.00019662268459796906, -0.00018924102187156677, -0.0001818593591451645, -0.0001744776964187622, -0.00016709603369235992, -0.00015971437096595764, -0.00015233270823955536, -0.00014495104551315308, -0.0001375693827867508, -0.0001301877200603485, -0.00012280605733394623, -0.00011542439460754395, -0.00010804273188114166, -0.00010066106915473938, -9.32794064283371e-05, -8.589774370193481e-05, -7.851608097553253e-05, -7.113441824913025e-05, -6.375275552272797e-05, -5.6371092796325684e-05, -4.89894300699234e-05, -4.160776734352112e-05, -3.4226104617118835e-05, -2.6844441890716553e-05, -1.946277916431427e-05, -1.2081116437911987e-05, -4.699453711509705e-06, 2.682209014892578e-06, 1.006387174129486e-05, 1.7445534467697144e-05, 2.4827197194099426e-05, 3.220885992050171e-05, 3.959052264690399e-05, 4.6972185373306274e-05, 5.435384809970856e-05, 6.173551082611084e-05, 6.911717355251312e-05, 7.64988362789154e-05, 8.388049900531769e-05, 9.126216173171997e-05, 9.864382445812225e-05, 0.00010602548718452454, 0.00011340714991092682, 0.0001207888126373291, 0.00012817047536373138, 0.00013555213809013367, 0.00014293380081653595, 0.00015031546354293823, 0.00015769712626934052, 0.0001650787889957428, 0.00017246045172214508, 0.00017984211444854736, 0.00018722377717494965, 0.00019460543990135193, 0.0002019871026277542, 0.0002093687653541565, 0.00021675042808055878, 0.00022413209080696106, 0.00023151375353336334, 0.00023889541625976562]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 7.0, 6.0, 8.0, 16.0, 19.0, 20.0, 40.0, 48.0, 87.0, 148.0, 180.0, 281.0, 411.0, 582.0, 894.0, 1275.0, 1896.0, 2899.0, 4441.0, 7207.0, 11968.0, 19858.0, 34527.0, 59740.0, 99101.0, 147095.0, 180573.0, 167695.0, 120707.0, 75797.0, 44782.0, 25767.0, 15026.0, 9276.0, 5616.0, 3505.0, 2220.0, 1562.0, 1084.0, 661.0, 450.0, 363.0, 236.0, 163.0, 104.0, 78.0, 53.0, 37.0, 16.0, 11.0, 13.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.42041015625, -0.40673065185546875, -0.3930511474609375, -0.37937164306640625, -0.365692138671875, -0.35201263427734375, -0.3383331298828125, -0.32465362548828125, -0.31097412109375, -0.29729461669921875, -0.2836151123046875, -0.26993560791015625, -0.256256103515625, -0.24257659912109375, -0.2288970947265625, -0.21521759033203125, -0.2015380859375, -0.18785858154296875, -0.1741790771484375, -0.16049957275390625, -0.146820068359375, -0.13314056396484375, -0.1194610595703125, -0.10578155517578125, -0.09210205078125, -0.07842254638671875, -0.0647430419921875, -0.05106353759765625, -0.037384033203125, -0.02370452880859375, -0.0100250244140625, 0.00365447998046875, 0.017333984375, 0.03101348876953125, 0.0446929931640625, 0.05837249755859375, 0.072052001953125, 0.08573150634765625, 0.0994110107421875, 0.11309051513671875, 0.12677001953125, 0.14044952392578125, 0.1541290283203125, 0.16780853271484375, 0.181488037109375, 0.19516754150390625, 0.2088470458984375, 0.22252655029296875, 0.2362060546875, 0.24988555908203125, 0.2635650634765625, 0.27724456787109375, 0.290924072265625, 0.30460357666015625, 0.3182830810546875, 0.33196258544921875, 0.34564208984375, 0.35932159423828125, 0.3730010986328125, 0.38668060302734375, 0.400360107421875, 0.41403961181640625, 0.4277191162109375, 0.44139862060546875, 0.455078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 2.0, 5.0, 6.0, 2.0, 3.0, 6.0, 7.0, 8.0, 23.0, 18.0, 18.0, 25.0, 29.0, 40.0, 50.0, 47.0, 48.0, 54.0, 53.0, 76.0, 56.0, 54.0, 54.0, 44.0, 55.0, 48.0, 33.0, 33.0, 26.0, 22.0, 18.0, 16.0, 4.0, 9.0, 8.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20654296875, -0.20059967041015625, -0.1946563720703125, -0.18871307373046875, -0.182769775390625, -0.17682647705078125, -0.1708831787109375, -0.16493988037109375, -0.15899658203125, -0.15305328369140625, -0.1471099853515625, -0.14116668701171875, -0.135223388671875, -0.12928009033203125, -0.1233367919921875, -0.11739349365234375, -0.1114501953125, -0.10550689697265625, -0.0995635986328125, -0.09362030029296875, -0.087677001953125, -0.08173370361328125, -0.0757904052734375, -0.06984710693359375, -0.06390380859375, -0.05796051025390625, -0.0520172119140625, -0.04607391357421875, -0.040130615234375, -0.03418731689453125, -0.0282440185546875, -0.02230072021484375, -0.016357421875, -0.01041412353515625, -0.0044708251953125, 0.00147247314453125, 0.007415771484375, 0.01335906982421875, 0.0193023681640625, 0.02524566650390625, 0.03118896484375, 0.03713226318359375, 0.0430755615234375, 0.04901885986328125, 0.054962158203125, 0.06090545654296875, 0.0668487548828125, 0.07279205322265625, 0.0787353515625, 0.08467864990234375, 0.0906219482421875, 0.09656524658203125, 0.102508544921875, 0.10845184326171875, 0.1143951416015625, 0.12033843994140625, 0.12628173828125, 0.13222503662109375, 0.1381683349609375, 0.14411163330078125, 0.150054931640625, 0.15599822998046875, 0.1619415283203125, 0.16788482666015625, 0.173828125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 7.0, 7.0, 5.0, 5.0, 13.0, 13.0, 17.0, 18.0, 23.0, 28.0, 37.0, 34.0, 26.0, 36.0, 37.0, 36.0, 35.0, 42.0, 36.0, 37.0, 48.0, 44.0, 27.0, 31.0, 34.0, 37.0, 46.0, 31.0, 23.0, 21.0, 24.0, 29.0, 18.0, 21.0, 15.0, 11.0, 8.0, 13.0, 12.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.329329013824463, -4.190308094024658, -4.051287651062012, -3.912266731262207, -3.7732460498809814, -3.634225368499756, -3.4952046871185303, -3.3561840057373047, -3.2171630859375, -3.0781424045562744, -2.939121723175049, -2.800100803375244, -2.6610801219940186, -2.522059440612793, -2.3830387592315674, -2.244018077850342, -2.104997396469116, -1.9659767150878906, -1.8269559144973755, -1.68793523311615, -1.5489144325256348, -1.4098937511444092, -1.2708730697631836, -1.131852388381958, -0.9928315877914429, -0.8538108468055725, -0.7147901058197021, -0.5757694244384766, -0.4367486834526062, -0.29772794246673584, -0.15870726108551025, -0.019686520099639893, 0.11933422088623047, 0.25835496187210083, 0.3973756730556488, 0.5363963842391968, 0.6754171252250671, 0.8144378662109375, 0.9534585475921631, 1.0924792289733887, 1.2315000295639038, 1.3705207109451294, 1.5095415115356445, 1.6485621929168701, 1.7875828742980957, 1.9266036748886108, 2.065624237060547, 2.2046451568603516, 2.343665838241577, 2.4826865196228027, 2.6217072010040283, 2.760727882385254, 2.8997488021850586, 3.038769483566284, 3.1777901649475098, 3.3168108463287354, 3.455831527709961, 3.5948522090911865, 3.733872890472412, 3.872893810272217, 4.011914253234863, 4.150935173034668, 4.289956092834473, 4.428976535797119, 4.567997455596924]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 5.0, 5.0, 7.0, 12.0, 15.0, 19.0, 12.0, 6.0, 15.0, 21.0, 25.0, 26.0, 27.0, 28.0, 31.0, 21.0, 37.0, 41.0, 39.0, 36.0, 39.0, 48.0, 43.0, 45.0, 36.0, 43.0, 33.0, 34.0, 31.0, 34.0, 16.0, 37.0, 21.0, 15.0, 16.0, 15.0, 16.0, 13.0, 11.0, 9.0, 7.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.071536540985107, -4.91472864151001, -4.75792121887207, -4.601113319396973, -4.444305419921875, -4.287497520446777, -4.130690097808838, -3.9738821983337402, -3.8170745372772217, -3.660266876220703, -3.5034589767456055, -3.346651315689087, -3.1898436546325684, -3.0330357551574707, -2.876228094100952, -2.7194204330444336, -2.562612533569336, -2.4058048725128174, -2.2489969730377197, -2.092189311981201, -1.935381531715393, -1.778573751449585, -1.6217660903930664, -1.4649583101272583, -1.3081505298614502, -1.151342749595642, -0.9945350289344788, -0.8377273082733154, -0.6809195280075073, -0.5241117477416992, -0.3673040270805359, -0.21049630641937256, -0.053689002990722656, 0.10311874747276306, 0.2599264979362488, 0.4167342483997345, 0.5735419988632202, 0.7303497791290283, 0.8871574997901917, 1.043965220451355, 1.200773000717163, 1.3575807809829712, 1.5143885612487793, 1.6711962223052979, 1.828004002571106, 1.984811782836914, 2.1416194438934326, 2.298427104949951, 2.455235004425049, 2.6120426654815674, 2.768850564956665, 2.9256582260131836, 3.0824661254882812, 3.2392737865448, 3.3960814476013184, 3.552889347076416, 3.7096970081329346, 3.866504669189453, 4.023312568664551, 4.180120468139648, 4.336927890777588, 4.4937357902526855, 4.650543689727783, 4.807351112365723, 4.96415901184082]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 14.0, 14.0, 25.0, 40.0, 64.0, 101.0, 160.0, 271.0, 385.0, 584.0, 889.0, 1396.0, 2175.0, 3283.0, 4952.0, 7689.0, 11082.0, 16528.0, 23483.0, 33227.0, 46042.0, 60955.0, 76401.0, 90765.0, 100496.0, 104190.0, 99262.0, 88664.0, 73814.0, 58198.0, 43574.0, 31476.0, 22209.0, 15148.0, 10465.0, 7082.0, 4669.0, 3077.0, 2020.0, 1274.0, 869.0, 522.0, 326.0, 256.0, 147.0, 110.0, 58.0, 42.0, 27.0, 17.0, 11.0, 12.0, 10.0, 2.0, 4.0], "bins": [-3.23046875, -3.1365966796875, -3.042724609375, -2.9488525390625, -2.85498046875, -2.7611083984375, -2.667236328125, -2.5733642578125, -2.4794921875, -2.3856201171875, -2.291748046875, -2.1978759765625, -2.10400390625, -2.0101318359375, -1.916259765625, -1.8223876953125, -1.728515625, -1.6346435546875, -1.540771484375, -1.4468994140625, -1.35302734375, -1.2591552734375, -1.165283203125, -1.0714111328125, -0.9775390625, -0.8836669921875, -0.789794921875, -0.6959228515625, -0.60205078125, -0.5081787109375, -0.414306640625, -0.3204345703125, -0.2265625, -0.1326904296875, -0.038818359375, 0.0550537109375, 0.14892578125, 0.2427978515625, 0.336669921875, 0.4305419921875, 0.5244140625, 0.6182861328125, 0.712158203125, 0.8060302734375, 0.89990234375, 0.9937744140625, 1.087646484375, 1.1815185546875, 1.275390625, 1.3692626953125, 1.463134765625, 1.5570068359375, 1.65087890625, 1.7447509765625, 1.838623046875, 1.9324951171875, 2.0263671875, 2.1202392578125, 2.214111328125, 2.3079833984375, 2.40185546875, 2.4957275390625, 2.589599609375, 2.6834716796875, 2.77734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 6.0, 11.0, 7.0, 9.0, 14.0, 10.0, 16.0, 19.0, 18.0, 23.0, 22.0, 24.0, 18.0, 28.0, 42.0, 31.0, 47.0, 34.0, 39.0, 38.0, 45.0, 49.0, 42.0, 48.0, 34.0, 36.0, 31.0, 35.0, 39.0, 23.0, 21.0, 21.0, 22.0, 11.0, 17.0, 10.0, 19.0, 10.0, 5.0, 9.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.453125, -5.29541015625, -5.1376953125, -4.97998046875, -4.822265625, -4.66455078125, -4.5068359375, -4.34912109375, -4.19140625, -4.03369140625, -3.8759765625, -3.71826171875, -3.560546875, -3.40283203125, -3.2451171875, -3.08740234375, -2.9296875, -2.77197265625, -2.6142578125, -2.45654296875, -2.298828125, -2.14111328125, -1.9833984375, -1.82568359375, -1.66796875, -1.51025390625, -1.3525390625, -1.19482421875, -1.037109375, -0.87939453125, -0.7216796875, -0.56396484375, -0.40625, -0.24853515625, -0.0908203125, 0.06689453125, 0.224609375, 0.38232421875, 0.5400390625, 0.69775390625, 0.85546875, 1.01318359375, 1.1708984375, 1.32861328125, 1.486328125, 1.64404296875, 1.8017578125, 1.95947265625, 2.1171875, 2.27490234375, 2.4326171875, 2.59033203125, 2.748046875, 2.90576171875, 3.0634765625, 3.22119140625, 3.37890625, 3.53662109375, 3.6943359375, 3.85205078125, 4.009765625, 4.16748046875, 4.3251953125, 4.48291015625, 4.640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 7.0, 10.0, 18.0, 32.0, 43.0, 71.0, 110.0, 238.0, 413.0, 743.0, 1428.0, 2517.0, 4549.0, 8658.0, 15984.0, 28460.0, 49812.0, 80808.0, 119232.0, 152931.0, 164275.0, 144112.0, 108329.0, 70025.0, 42576.0, 23955.0, 13429.0, 7305.0, 3805.0, 2028.0, 1166.0, 665.0, 353.0, 191.0, 107.0, 68.0, 37.0, 24.0, 21.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.84765625, -5.67742919921875, -5.5072021484375, -5.33697509765625, -5.166748046875, -4.99652099609375, -4.8262939453125, -4.65606689453125, -4.48583984375, -4.31561279296875, -4.1453857421875, -3.97515869140625, -3.804931640625, -3.63470458984375, -3.4644775390625, -3.29425048828125, -3.1240234375, -2.95379638671875, -2.7835693359375, -2.61334228515625, -2.443115234375, -2.27288818359375, -2.1026611328125, -1.93243408203125, -1.76220703125, -1.59197998046875, -1.4217529296875, -1.25152587890625, -1.081298828125, -0.91107177734375, -0.7408447265625, -0.57061767578125, -0.400390625, -0.23016357421875, -0.0599365234375, 0.11029052734375, 0.280517578125, 0.45074462890625, 0.6209716796875, 0.79119873046875, 0.96142578125, 1.13165283203125, 1.3018798828125, 1.47210693359375, 1.642333984375, 1.81256103515625, 1.9827880859375, 2.15301513671875, 2.3232421875, 2.49346923828125, 2.6636962890625, 2.83392333984375, 3.004150390625, 3.17437744140625, 3.3446044921875, 3.51483154296875, 3.68505859375, 3.85528564453125, 4.0255126953125, 4.19573974609375, 4.365966796875, 4.53619384765625, 4.7064208984375, 4.87664794921875, 5.046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 8.0, 6.0, 12.0, 25.0, 18.0, 13.0, 15.0, 26.0, 18.0, 28.0, 27.0, 20.0, 33.0, 26.0, 49.0, 53.0, 36.0, 39.0, 41.0, 53.0, 43.0, 40.0, 36.0, 35.0, 36.0, 34.0, 30.0, 33.0, 25.0, 19.0, 14.0, 17.0, 10.0, 15.0, 15.0, 13.0, 5.0, 6.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.787109375, -2.68609619140625, -2.5850830078125, -2.48406982421875, -2.383056640625, -2.28204345703125, -2.1810302734375, -2.08001708984375, -1.97900390625, -1.87799072265625, -1.7769775390625, -1.67596435546875, -1.574951171875, -1.47393798828125, -1.3729248046875, -1.27191162109375, -1.1708984375, -1.06988525390625, -0.9688720703125, -0.86785888671875, -0.766845703125, -0.66583251953125, -0.5648193359375, -0.46380615234375, -0.36279296875, -0.26177978515625, -0.1607666015625, -0.05975341796875, 0.041259765625, 0.14227294921875, 0.2432861328125, 0.34429931640625, 0.4453125, 0.54632568359375, 0.6473388671875, 0.74835205078125, 0.849365234375, 0.95037841796875, 1.0513916015625, 1.15240478515625, 1.25341796875, 1.35443115234375, 1.4554443359375, 1.55645751953125, 1.657470703125, 1.75848388671875, 1.8594970703125, 1.96051025390625, 2.0615234375, 2.16253662109375, 2.2635498046875, 2.36456298828125, 2.465576171875, 2.56658935546875, 2.6676025390625, 2.76861572265625, 2.86962890625, 2.97064208984375, 3.0716552734375, 3.17266845703125, 3.273681640625, 3.37469482421875, 3.4757080078125, 3.57672119140625, 3.677734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 11.0, 8.0, 16.0, 29.0, 25.0, 50.0, 65.0, 94.0, 127.0, 175.0, 286.0, 437.0, 589.0, 989.0, 1500.0, 2258.0, 3621.0, 5744.0, 9749.0, 16536.0, 28011.0, 47789.0, 79447.0, 121055.0, 159037.0, 168160.0, 143355.0, 101522.0, 64130.0, 37857.0, 22247.0, 12746.0, 7845.0, 4584.0, 2887.0, 1901.0, 1170.0, 775.0, 557.0, 361.0, 265.0, 168.0, 114.0, 72.0, 57.0, 36.0, 28.0, 26.0, 13.0, 14.0, 9.0, 4.0, 3.0, 2.0, 1.0], "bins": [-2.30859375, -2.241241455078125, -2.17388916015625, -2.106536865234375, -2.0391845703125, -1.971832275390625, -1.90447998046875, -1.837127685546875, -1.769775390625, -1.702423095703125, -1.63507080078125, -1.567718505859375, -1.5003662109375, -1.433013916015625, -1.36566162109375, -1.298309326171875, -1.23095703125, -1.163604736328125, -1.09625244140625, -1.028900146484375, -0.9615478515625, -0.894195556640625, -0.82684326171875, -0.759490966796875, -0.692138671875, -0.624786376953125, -0.55743408203125, -0.490081787109375, -0.4227294921875, -0.355377197265625, -0.28802490234375, -0.220672607421875, -0.1533203125, -0.085968017578125, -0.01861572265625, 0.048736572265625, 0.1160888671875, 0.183441162109375, 0.25079345703125, 0.318145751953125, 0.385498046875, 0.452850341796875, 0.52020263671875, 0.587554931640625, 0.6549072265625, 0.722259521484375, 0.78961181640625, 0.856964111328125, 0.92431640625, 0.991668701171875, 1.05902099609375, 1.126373291015625, 1.1937255859375, 1.261077880859375, 1.32843017578125, 1.395782470703125, 1.463134765625, 1.530487060546875, 1.59783935546875, 1.665191650390625, 1.7325439453125, 1.799896240234375, 1.86724853515625, 1.934600830078125, 2.001953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 3.0, 3.0, 10.0, 9.0, 18.0, 13.0, 22.0, 21.0, 43.0, 35.0, 49.0, 66.0, 89.0, 73.0, 85.0, 72.0, 70.0, 63.0, 59.0, 49.0, 35.0, 36.0, 24.0, 13.0, 11.0, 5.0, 12.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00032401084899902344, -0.00031407177448272705, -0.00030413269996643066, -0.0002941936254501343, -0.0002842545509338379, -0.0002743154764175415, -0.0002643764019012451, -0.00025443732738494873, -0.00024449825286865234, -0.00023455917835235596, -0.00022462010383605957, -0.00021468102931976318, -0.0002047419548034668, -0.0001948028802871704, -0.00018486380577087402, -0.00017492473125457764, -0.00016498565673828125, -0.00015504658222198486, -0.00014510750770568848, -0.0001351684331893921, -0.0001252293586730957, -0.00011529028415679932, -0.00010535120964050293, -9.541213512420654e-05, -8.547306060791016e-05, -7.553398609161377e-05, -6.559491157531738e-05, -5.5655837059020996e-05, -4.571676254272461e-05, -3.577768802642822e-05, -2.5838613510131836e-05, -1.589953899383545e-05, -5.9604644775390625e-06, 3.978610038757324e-06, 1.3917684555053711e-05, 2.3856759071350098e-05, 3.3795833587646484e-05, 4.373490810394287e-05, 5.367398262023926e-05, 6.361305713653564e-05, 7.355213165283203e-05, 8.349120616912842e-05, 9.34302806854248e-05, 0.00010336935520172119, 0.00011330842971801758, 0.00012324750423431396, 0.00013318657875061035, 0.00014312565326690674, 0.00015306472778320312, 0.0001630038022994995, 0.0001729428768157959, 0.00018288195133209229, 0.00019282102584838867, 0.00020276010036468506, 0.00021269917488098145, 0.00022263824939727783, 0.00023257732391357422, 0.0002425163984298706, 0.000252455472946167, 0.0002623945474624634, 0.00027233362197875977, 0.00028227269649505615, 0.00029221177101135254, 0.0003021508455276489, 0.0003120899200439453]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 6.0, 6.0, 6.0, 13.0, 18.0, 15.0, 32.0, 52.0, 62.0, 95.0, 123.0, 206.0, 267.0, 419.0, 659.0, 997.0, 1602.0, 2638.0, 4617.0, 8223.0, 14411.0, 26333.0, 45775.0, 76813.0, 117285.0, 156156.0, 170816.0, 149523.0, 108347.0, 68659.0, 40636.0, 23094.0, 12898.0, 7214.0, 4073.0, 2375.0, 1460.0, 903.0, 539.0, 356.0, 246.0, 156.0, 130.0, 90.0, 66.0, 44.0, 33.0, 25.0, 20.0, 11.0, 13.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.947265625, -1.881011962890625, -1.81475830078125, -1.748504638671875, -1.6822509765625, -1.615997314453125, -1.54974365234375, -1.483489990234375, -1.417236328125, -1.350982666015625, -1.28472900390625, -1.218475341796875, -1.1522216796875, -1.085968017578125, -1.01971435546875, -0.953460693359375, -0.88720703125, -0.820953369140625, -0.75469970703125, -0.688446044921875, -0.6221923828125, -0.555938720703125, -0.48968505859375, -0.423431396484375, -0.357177734375, -0.290924072265625, -0.22467041015625, -0.158416748046875, -0.0921630859375, -0.025909423828125, 0.04034423828125, 0.106597900390625, 0.1728515625, 0.239105224609375, 0.30535888671875, 0.371612548828125, 0.4378662109375, 0.504119873046875, 0.57037353515625, 0.636627197265625, 0.702880859375, 0.769134521484375, 0.83538818359375, 0.901641845703125, 0.9678955078125, 1.034149169921875, 1.10040283203125, 1.166656494140625, 1.23291015625, 1.299163818359375, 1.36541748046875, 1.431671142578125, 1.4979248046875, 1.564178466796875, 1.63043212890625, 1.696685791015625, 1.762939453125, 1.829193115234375, 1.89544677734375, 1.961700439453125, 2.0279541015625, 2.094207763671875, 2.16046142578125, 2.226715087890625, 2.29296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 4.0, 1.0, 2.0, 6.0, 11.0, 8.0, 13.0, 23.0, 11.0, 16.0, 23.0, 36.0, 34.0, 47.0, 45.0, 49.0, 63.0, 57.0, 61.0, 58.0, 62.0, 64.0, 52.0, 40.0, 26.0, 29.0, 38.0, 24.0, 28.0, 12.0, 11.0, 8.0, 8.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88525390625, -0.8594512939453125, -0.833648681640625, -0.8078460693359375, -0.78204345703125, -0.7562408447265625, -0.730438232421875, -0.7046356201171875, -0.6788330078125, -0.6530303955078125, -0.627227783203125, -0.6014251708984375, -0.57562255859375, -0.5498199462890625, -0.524017333984375, -0.4982147216796875, -0.472412109375, -0.4466094970703125, -0.420806884765625, -0.3950042724609375, -0.36920166015625, -0.3433990478515625, -0.317596435546875, -0.2917938232421875, -0.2659912109375, -0.2401885986328125, -0.214385986328125, -0.1885833740234375, -0.16278076171875, -0.1369781494140625, -0.111175537109375, -0.0853729248046875, -0.0595703125, -0.0337677001953125, -0.007965087890625, 0.0178375244140625, 0.04364013671875, 0.0694427490234375, 0.095245361328125, 0.1210479736328125, 0.1468505859375, 0.1726531982421875, 0.198455810546875, 0.2242584228515625, 0.25006103515625, 0.2758636474609375, 0.301666259765625, 0.3274688720703125, 0.353271484375, 0.3790740966796875, 0.404876708984375, 0.4306793212890625, 0.45648193359375, 0.4822845458984375, 0.508087158203125, 0.5338897705078125, 0.5596923828125, 0.5854949951171875, 0.611297607421875, 0.6371002197265625, 0.66290283203125, 0.6887054443359375, 0.714508056640625, 0.7403106689453125, 0.76611328125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 0.0, 2.0, 3.0, 6.0, 9.0, 13.0, 3.0, 12.0, 18.0, 24.0, 20.0, 16.0, 19.0, 21.0, 27.0, 27.0, 29.0, 38.0, 27.0, 34.0, 48.0, 41.0, 41.0, 40.0, 33.0, 41.0, 46.0, 37.0, 21.0, 33.0, 29.0, 23.0, 25.0, 27.0, 24.0, 21.0, 20.0, 19.0, 10.0, 15.0, 13.0, 10.0, 6.0, 6.0, 9.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.133406162261963, -4.004630088806152, -3.875854015350342, -3.7470779418945312, -3.6183018684387207, -3.48952579498291, -3.3607499599456787, -3.231973886489868, -3.1031978130340576, -2.974421739578247, -2.8456456661224365, -2.716869592666626, -2.5880937576293945, -2.459317684173584, -2.3305416107177734, -2.201765537261963, -2.0729894638061523, -1.9442133903503418, -1.8154373168945312, -1.6866613626480103, -1.5578852891921997, -1.4291092157363892, -1.3003332614898682, -1.1715571880340576, -1.042781114578247, -0.9140050411224365, -0.7852290272712708, -0.656453013420105, -0.5276769399642944, -0.3989008665084839, -0.2701248526573181, -0.14134883880615234, -0.012572765350341797, 0.11620327830314636, 0.24497932195663452, 0.3737553656101227, 0.5025314092636108, 0.6313074827194214, 0.7600834965705872, 0.8888595104217529, 1.0176355838775635, 1.146411657333374, 1.2751877307891846, 1.4039636850357056, 1.5327397584915161, 1.6615158319473267, 1.7902917861938477, 1.9190678596496582, 2.0478439331054688, 2.1766200065612793, 2.30539608001709, 2.4341721534729004, 2.562948226928711, 2.6917243003845215, 2.820500135421753, 2.9492762088775635, 3.078052282333374, 3.2068283557891846, 3.335604429244995, 3.4643805027008057, 3.593156337738037, 3.7219324111938477, 3.850708484649658, 3.9794845581054688, 4.108260631561279]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 7.0, 6.0, 6.0, 10.0, 10.0, 16.0, 12.0, 10.0, 17.0, 22.0, 23.0, 28.0, 23.0, 33.0, 23.0, 37.0, 30.0, 32.0, 37.0, 38.0, 32.0, 30.0, 38.0, 36.0, 37.0, 43.0, 36.0, 32.0, 30.0, 30.0, 26.0, 21.0, 24.0, 21.0, 15.0, 22.0, 21.0, 9.0, 16.0, 8.0, 10.0, 8.0, 3.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 4.0], "bins": [-4.821759223937988, -4.674951076507568, -4.528142929077148, -4.3813347816467285, -4.234526634216309, -4.087718486785889, -3.9409101009368896, -3.7941019535064697, -3.64729380607605, -3.50048565864563, -3.35367751121521, -3.20686936378479, -3.060060977935791, -2.913252830505371, -2.766444683074951, -2.6196365356445312, -2.4728283882141113, -2.3260202407836914, -2.1792120933532715, -2.0324039459228516, -1.885595679283142, -1.7387875318527222, -1.5919792652130127, -1.4451711177825928, -1.2983629703521729, -1.151554822921753, -1.004746675491333, -0.8579384088516235, -0.7111302614212036, -0.5643221139907837, -0.417513906955719, -0.2707056999206543, -0.12389755249023438, 0.022910624742507935, 0.16971880197525024, 0.31652697920799255, 0.46333515644073486, 0.6101433038711548, 0.7569515109062195, 0.9037597179412842, 1.050567865371704, 1.197376012802124, 1.344184160232544, 1.4909924268722534, 1.6378005743026733, 1.7846087217330933, 1.9314169883728027, 2.0782251358032227, 2.2250332832336426, 2.3718414306640625, 2.5186495780944824, 2.6654577255249023, 2.8122658729553223, 2.959074020385742, 3.105882406234741, 3.252690553665161, 3.399498701095581, 3.546306848526001, 3.693114995956421, 3.839923143386841, 3.98673152923584, 4.13353967666626, 4.28034782409668, 4.4271559715271, 4.5739641189575195]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 7.0, 7.0, 19.0, 43.0, 53.0, 100.0, 119.0, 159.0, 272.0, 428.0, 694.0, 1047.0, 1612.0, 2567.0, 4298.0, 6764.0, 11132.0, 18240.0, 31405.0, 54899.0, 97671.0, 178175.0, 314540.0, 507264.0, 684330.0, 725669.0, 602702.0, 404598.0, 237935.0, 131620.0, 73386.0, 41311.0, 24095.0, 14197.0, 8679.0, 5288.0, 3245.0, 2119.0, 1287.0, 783.0, 553.0, 354.0, 218.0, 140.0, 98.0, 64.0, 39.0, 24.0, 17.0, 7.0, 9.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.447265625, -3.329376220703125, -3.21148681640625, -3.093597412109375, -2.9757080078125, -2.857818603515625, -2.73992919921875, -2.622039794921875, -2.504150390625, -2.386260986328125, -2.26837158203125, -2.150482177734375, -2.0325927734375, -1.914703369140625, -1.79681396484375, -1.678924560546875, -1.56103515625, -1.443145751953125, -1.32525634765625, -1.207366943359375, -1.0894775390625, -0.971588134765625, -0.85369873046875, -0.735809326171875, -0.617919921875, -0.500030517578125, -0.38214111328125, -0.264251708984375, -0.1463623046875, -0.028472900390625, 0.08941650390625, 0.207305908203125, 0.3251953125, 0.443084716796875, 0.56097412109375, 0.678863525390625, 0.7967529296875, 0.914642333984375, 1.03253173828125, 1.150421142578125, 1.268310546875, 1.386199951171875, 1.50408935546875, 1.621978759765625, 1.7398681640625, 1.857757568359375, 1.97564697265625, 2.093536376953125, 2.21142578125, 2.329315185546875, 2.44720458984375, 2.565093994140625, 2.6829833984375, 2.800872802734375, 2.91876220703125, 3.036651611328125, 3.154541015625, 3.272430419921875, 3.39031982421875, 3.508209228515625, 3.6260986328125, 3.743988037109375, 3.86187744140625, 3.979766845703125, 4.09765625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 5.0, 6.0, 8.0, 10.0, 5.0, 14.0, 11.0, 6.0, 18.0, 17.0, 16.0, 23.0, 21.0, 33.0, 33.0, 30.0, 35.0, 37.0, 46.0, 24.0, 38.0, 49.0, 31.0, 38.0, 36.0, 44.0, 38.0, 40.0, 37.0, 32.0, 33.0, 20.0, 21.0, 18.0, 19.0, 17.0, 23.0, 9.0, 16.0, 8.0, 9.0, 6.0, 5.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.9891357421875, -3.857177734375, -3.7252197265625, -3.59326171875, -3.4613037109375, -3.329345703125, -3.1973876953125, -3.0654296875, -2.9334716796875, -2.801513671875, -2.6695556640625, -2.53759765625, -2.4056396484375, -2.273681640625, -2.1417236328125, -2.009765625, -1.8778076171875, -1.745849609375, -1.6138916015625, -1.48193359375, -1.3499755859375, -1.218017578125, -1.0860595703125, -0.9541015625, -0.8221435546875, -0.690185546875, -0.5582275390625, -0.42626953125, -0.2943115234375, -0.162353515625, -0.0303955078125, 0.1015625, 0.2335205078125, 0.365478515625, 0.4974365234375, 0.62939453125, 0.7613525390625, 0.893310546875, 1.0252685546875, 1.1572265625, 1.2891845703125, 1.421142578125, 1.5531005859375, 1.68505859375, 1.8170166015625, 1.948974609375, 2.0809326171875, 2.212890625, 2.3448486328125, 2.476806640625, 2.6087646484375, 2.74072265625, 2.8726806640625, 3.004638671875, 3.1365966796875, 3.2685546875, 3.4005126953125, 3.532470703125, 3.6644287109375, 3.79638671875, 3.9283447265625, 4.060302734375, 4.1922607421875, 4.32421875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 12.0, 8.0, 11.0, 15.0, 37.0, 51.0, 68.0, 117.0, 177.0, 297.0, 463.0, 781.0, 1211.0, 1955.0, 3538.0, 5804.0, 9800.0, 16867.0, 29719.0, 52328.0, 91802.0, 162679.0, 277707.0, 453301.0, 657289.0, 749844.0, 633987.0, 429502.0, 262253.0, 151518.0, 86410.0, 48677.0, 27418.0, 16002.0, 9163.0, 5425.0, 3119.0, 1906.0, 1152.0, 689.0, 424.0, 276.0, 188.0, 100.0, 65.0, 39.0, 30.0, 26.0, 10.0, 6.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-4.61328125, -4.4710693359375, -4.328857421875, -4.1866455078125, -4.04443359375, -3.9022216796875, -3.760009765625, -3.6177978515625, -3.4755859375, -3.3333740234375, -3.191162109375, -3.0489501953125, -2.90673828125, -2.7645263671875, -2.622314453125, -2.4801025390625, -2.337890625, -2.1956787109375, -2.053466796875, -1.9112548828125, -1.76904296875, -1.6268310546875, -1.484619140625, -1.3424072265625, -1.2001953125, -1.0579833984375, -0.915771484375, -0.7735595703125, -0.63134765625, -0.4891357421875, -0.346923828125, -0.2047119140625, -0.0625, 0.0797119140625, 0.221923828125, 0.3641357421875, 0.50634765625, 0.6485595703125, 0.790771484375, 0.9329833984375, 1.0751953125, 1.2174072265625, 1.359619140625, 1.5018310546875, 1.64404296875, 1.7862548828125, 1.928466796875, 2.0706787109375, 2.212890625, 2.3551025390625, 2.497314453125, 2.6395263671875, 2.78173828125, 2.9239501953125, 3.066162109375, 3.2083740234375, 3.3505859375, 3.4927978515625, 3.635009765625, 3.7772216796875, 3.91943359375, 4.0616455078125, 4.203857421875, 4.3460693359375, 4.48828125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 6.0, 4.0, 2.0, 6.0, 8.0, 14.0, 24.0, 28.0, 45.0, 45.0, 68.0, 83.0, 87.0, 130.0, 113.0, 201.0, 228.0, 259.0, 288.0, 300.0, 263.0, 258.0, 290.0, 255.0, 230.0, 181.0, 175.0, 126.0, 81.0, 61.0, 65.0, 30.0, 31.0, 24.0, 18.0, 15.0, 10.0, 13.0, 5.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.14825439453125, -2.0797119140625, -2.01116943359375, -1.942626953125, -1.87408447265625, -1.8055419921875, -1.73699951171875, -1.66845703125, -1.59991455078125, -1.5313720703125, -1.46282958984375, -1.394287109375, -1.32574462890625, -1.2572021484375, -1.18865966796875, -1.1201171875, -1.05157470703125, -0.9830322265625, -0.91448974609375, -0.845947265625, -0.77740478515625, -0.7088623046875, -0.64031982421875, -0.57177734375, -0.50323486328125, -0.4346923828125, -0.36614990234375, -0.297607421875, -0.22906494140625, -0.1605224609375, -0.09197998046875, -0.0234375, 0.04510498046875, 0.1136474609375, 0.18218994140625, 0.250732421875, 0.31927490234375, 0.3878173828125, 0.45635986328125, 0.52490234375, 0.59344482421875, 0.6619873046875, 0.73052978515625, 0.799072265625, 0.86761474609375, 0.9361572265625, 1.00469970703125, 1.0732421875, 1.14178466796875, 1.2103271484375, 1.27886962890625, 1.347412109375, 1.41595458984375, 1.4844970703125, 1.55303955078125, 1.62158203125, 1.69012451171875, 1.7586669921875, 1.82720947265625, 1.895751953125, 1.96429443359375, 2.0328369140625, 2.10137939453125, 2.169921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 12.0, 12.0, 10.0, 14.0, 19.0, 21.0, 15.0, 16.0, 25.0, 25.0, 34.0, 29.0, 38.0, 38.0, 40.0, 40.0, 44.0, 44.0, 36.0, 51.0, 37.0, 41.0, 27.0, 39.0, 43.0, 26.0, 17.0, 26.0, 25.0, 21.0, 24.0, 20.0, 18.0, 11.0, 8.0, 11.0, 12.0, 8.0, 3.0, 3.0, 2.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.944974184036255, -3.8122129440307617, -3.6794514656066895, -3.5466902256011963, -3.413928985595703, -3.28116774559021, -3.148406505584717, -3.0156450271606445, -2.8828837871551514, -2.750122547149658, -2.617361068725586, -2.4845998287200928, -2.3518385887145996, -2.2190773487091064, -2.0863161087036133, -1.953554630279541, -1.8207933902740479, -1.6880321502685547, -1.555270791053772, -1.4225094318389893, -1.289748191833496, -1.156986951828003, -1.0242255926132202, -0.8914642930030823, -0.7587029933929443, -0.6259416937828064, -0.49318039417266846, -0.3604190945625305, -0.22765779495239258, -0.09489649534225464, 0.0378648042678833, 0.17062610387802124, 0.3033871650695801, 0.436148464679718, 0.568909764289856, 0.7016710638999939, 0.8344323635101318, 0.9671936631202698, 1.0999549627304077, 1.2327163219451904, 1.3654775619506836, 1.4982388019561768, 1.6310001611709595, 1.7637615203857422, 1.8965227603912354, 2.0292840003967285, 2.162045478820801, 2.294806718826294, 2.427567958831787, 2.5603291988372803, 2.6930904388427734, 2.8258519172668457, 2.958613157272339, 3.091374397277832, 3.2241358757019043, 3.3568971157073975, 3.4896583557128906, 3.622419595718384, 3.755180835723877, 3.887942314147949, 4.020703315734863, 4.1534647941589355, 4.286226272583008, 4.418987274169922, 4.551748752593994]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 4.0, 11.0, 12.0, 11.0, 8.0, 14.0, 13.0, 21.0, 18.0, 27.0, 20.0, 24.0, 26.0, 40.0, 51.0, 30.0, 40.0, 25.0, 30.0, 48.0, 40.0, 38.0, 52.0, 38.0, 24.0, 31.0, 36.0, 25.0, 26.0, 19.0, 23.0, 17.0, 23.0, 15.0, 14.0, 16.0, 20.0, 8.0, 8.0, 8.0, 5.0, 14.0, 2.0, 8.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.738590240478516, -4.594986915588379, -4.451383590698242, -4.3077802658081055, -4.164176940917969, -4.02057409286499, -3.8769707679748535, -3.733367443084717, -3.58976411819458, -3.4461607933044434, -3.3025574684143066, -3.158954381942749, -3.0153510570526123, -2.8717477321624756, -2.728144645690918, -2.5845413208007812, -2.4409379959106445, -2.297334671020508, -2.153731346130371, -2.0101282596588135, -1.8665249347686768, -1.72292160987854, -1.5793184041976929, -1.4357151985168457, -1.292111873626709, -1.1485085487365723, -1.004905343055725, -0.8613020777702332, -0.7176988124847412, -0.5740955471992493, -0.4304922819137573, -0.28688907623291016, -0.14328527450561523, 0.000317990779876709, 0.14392125606536865, 0.2875245213508606, 0.43112778663635254, 0.5747310519218445, 0.7183343172073364, 0.8619375228881836, 1.0055408477783203, 1.149144172668457, 1.2927473783493042, 1.4363505840301514, 1.579953908920288, 1.7235572338104248, 1.867160439491272, 2.010763645172119, 2.154366970062256, 2.2979702949523926, 2.4415736198425293, 2.585176706314087, 2.7287800312042236, 2.8723833560943604, 3.015986442565918, 3.1595897674560547, 3.3031930923461914, 3.446796417236328, 3.590399742126465, 3.7340028285980225, 3.877606153488159, 4.021209239959717, 4.1648125648498535, 4.30841588973999, 4.452019214630127]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 10.0, 6.0, 13.0, 15.0, 30.0, 51.0, 59.0, 103.0, 141.0, 206.0, 287.0, 452.0, 674.0, 1021.0, 1396.0, 2336.0, 3561.0, 5588.0, 8840.0, 14381.0, 22951.0, 35899.0, 55008.0, 82509.0, 113326.0, 138775.0, 144294.0, 126923.0, 97697.0, 68810.0, 45092.0, 28905.0, 18106.0, 11089.0, 7073.0, 4536.0, 2855.0, 1860.0, 1239.0, 832.0, 508.0, 364.0, 239.0, 160.0, 112.0, 70.0, 58.0, 29.0, 15.0, 25.0, 16.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.513671875, -1.465240478515625, -1.41680908203125, -1.368377685546875, -1.3199462890625, -1.271514892578125, -1.22308349609375, -1.174652099609375, -1.126220703125, -1.077789306640625, -1.02935791015625, -0.980926513671875, -0.9324951171875, -0.884063720703125, -0.83563232421875, -0.787200927734375, -0.73876953125, -0.690338134765625, -0.64190673828125, -0.593475341796875, -0.5450439453125, -0.496612548828125, -0.44818115234375, -0.399749755859375, -0.351318359375, -0.302886962890625, -0.25445556640625, -0.206024169921875, -0.1575927734375, -0.109161376953125, -0.06072998046875, -0.012298583984375, 0.0361328125, 0.084564208984375, 0.13299560546875, 0.181427001953125, 0.2298583984375, 0.278289794921875, 0.32672119140625, 0.375152587890625, 0.423583984375, 0.472015380859375, 0.52044677734375, 0.568878173828125, 0.6173095703125, 0.665740966796875, 0.71417236328125, 0.762603759765625, 0.81103515625, 0.859466552734375, 0.90789794921875, 0.956329345703125, 1.0047607421875, 1.053192138671875, 1.10162353515625, 1.150054931640625, 1.198486328125, 1.246917724609375, 1.29534912109375, 1.343780517578125, 1.3922119140625, 1.440643310546875, 1.48907470703125, 1.537506103515625, 1.5859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 7.0, 3.0, 7.0, 8.0, 8.0, 16.0, 7.0, 16.0, 15.0, 23.0, 17.0, 30.0, 29.0, 36.0, 32.0, 41.0, 43.0, 32.0, 37.0, 45.0, 52.0, 41.0, 43.0, 32.0, 34.0, 39.0, 39.0, 24.0, 23.0, 23.0, 23.0, 19.0, 17.0, 26.0, 20.0, 19.0, 16.0, 11.0, 8.0, 12.0, 5.0, 9.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.26171875, -5.106201171875, -4.95068359375, -4.795166015625, -4.6396484375, -4.484130859375, -4.32861328125, -4.173095703125, -4.017578125, -3.862060546875, -3.70654296875, -3.551025390625, -3.3955078125, -3.239990234375, -3.08447265625, -2.928955078125, -2.7734375, -2.617919921875, -2.46240234375, -2.306884765625, -2.1513671875, -1.995849609375, -1.84033203125, -1.684814453125, -1.529296875, -1.373779296875, -1.21826171875, -1.062744140625, -0.9072265625, -0.751708984375, -0.59619140625, -0.440673828125, -0.28515625, -0.129638671875, 0.02587890625, 0.181396484375, 0.3369140625, 0.492431640625, 0.64794921875, 0.803466796875, 0.958984375, 1.114501953125, 1.27001953125, 1.425537109375, 1.5810546875, 1.736572265625, 1.89208984375, 2.047607421875, 2.203125, 2.358642578125, 2.51416015625, 2.669677734375, 2.8251953125, 2.980712890625, 3.13623046875, 3.291748046875, 3.447265625, 3.602783203125, 3.75830078125, 3.913818359375, 4.0693359375, 4.224853515625, 4.38037109375, 4.535888671875, 4.69140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 8.0, 7.0, 7.0, 12.0, 10.0, 20.0, 18.0, 23.0, 30.0, 36.0, 57.0, 74.0, 100.0, 125.0, 176.0, 299.0, 445.0, 689.0, 1306.0, 2533.0, 5272.0, 10893.0, 23113.0, 72655.0, 836231.0, 53345.0, 20819.0, 9922.0, 4701.0, 2325.0, 1198.0, 675.0, 411.0, 263.0, 190.0, 127.0, 106.0, 91.0, 53.0, 35.0, 37.0, 25.0, 16.0, 18.0, 17.0, 8.0, 8.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.9140625, -5.731689453125, -5.54931640625, -5.366943359375, -5.1845703125, -5.002197265625, -4.81982421875, -4.637451171875, -4.455078125, -4.272705078125, -4.09033203125, -3.907958984375, -3.7255859375, -3.543212890625, -3.36083984375, -3.178466796875, -2.99609375, -2.813720703125, -2.63134765625, -2.448974609375, -2.2666015625, -2.084228515625, -1.90185546875, -1.719482421875, -1.537109375, -1.354736328125, -1.17236328125, -0.989990234375, -0.8076171875, -0.625244140625, -0.44287109375, -0.260498046875, -0.078125, 0.104248046875, 0.28662109375, 0.468994140625, 0.6513671875, 0.833740234375, 1.01611328125, 1.198486328125, 1.380859375, 1.563232421875, 1.74560546875, 1.927978515625, 2.1103515625, 2.292724609375, 2.47509765625, 2.657470703125, 2.83984375, 3.022216796875, 3.20458984375, 3.386962890625, 3.5693359375, 3.751708984375, 3.93408203125, 4.116455078125, 4.298828125, 4.481201171875, 4.66357421875, 4.845947265625, 5.0283203125, 5.210693359375, 5.39306640625, 5.575439453125, 5.7578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 9.0, 14.0, 18.0, 20.0, 10.0, 17.0, 25.0, 21.0, 34.0, 27.0, 29.0, 46.0, 30.0, 38.0, 36.0, 41.0, 49.0, 33.0, 45.0, 41.0, 32.0, 46.0, 36.0, 43.0, 37.0, 28.0, 31.0, 28.0, 28.0, 13.0, 17.0, 13.0, 9.0, 12.0, 14.0, 10.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.482421875, -3.358978271484375, -3.23553466796875, -3.112091064453125, -2.9886474609375, -2.865203857421875, -2.74176025390625, -2.618316650390625, -2.494873046875, -2.371429443359375, -2.24798583984375, -2.124542236328125, -2.0010986328125, -1.877655029296875, -1.75421142578125, -1.630767822265625, -1.50732421875, -1.383880615234375, -1.26043701171875, -1.136993408203125, -1.0135498046875, -0.890106201171875, -0.76666259765625, -0.643218994140625, -0.519775390625, -0.396331787109375, -0.27288818359375, -0.149444580078125, -0.0260009765625, 0.097442626953125, 0.22088623046875, 0.344329833984375, 0.4677734375, 0.591217041015625, 0.71466064453125, 0.838104248046875, 0.9615478515625, 1.084991455078125, 1.20843505859375, 1.331878662109375, 1.455322265625, 1.578765869140625, 1.70220947265625, 1.825653076171875, 1.9490966796875, 2.072540283203125, 2.19598388671875, 2.319427490234375, 2.44287109375, 2.566314697265625, 2.68975830078125, 2.813201904296875, 2.9366455078125, 3.060089111328125, 3.18353271484375, 3.306976318359375, 3.430419921875, 3.553863525390625, 3.67730712890625, 3.800750732421875, 3.9241943359375, 4.047637939453125, 4.17108154296875, 4.294525146484375, 4.41796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 10.0, 6.0, 8.0, 18.0, 16.0, 13.0, 22.0, 41.0, 52.0, 80.0, 137.0, 141.0, 214.0, 294.0, 357.0, 551.0, 815.0, 1225.0, 1926.0, 3454.0, 6452.0, 13691.0, 39354.0, 646672.0, 277894.0, 29911.0, 11507.0, 5467.0, 2860.0, 1774.0, 1120.0, 720.0, 521.0, 357.0, 232.0, 165.0, 133.0, 105.0, 61.0, 49.0, 36.0, 32.0, 21.0, 21.0, 6.0, 7.0, 0.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5661468505859375, -0.547821044921875, -0.5294952392578125, -0.51116943359375, -0.4928436279296875, -0.474517822265625, -0.4561920166015625, -0.4378662109375, -0.4195404052734375, -0.401214599609375, -0.3828887939453125, -0.36456298828125, -0.3462371826171875, -0.327911376953125, -0.3095855712890625, -0.291259765625, -0.2729339599609375, -0.254608154296875, -0.2362823486328125, -0.21795654296875, -0.1996307373046875, -0.181304931640625, -0.1629791259765625, -0.1446533203125, -0.1263275146484375, -0.108001708984375, -0.0896759033203125, -0.07135009765625, -0.0530242919921875, -0.034698486328125, -0.0163726806640625, 0.001953125, 0.0202789306640625, 0.038604736328125, 0.0569305419921875, 0.07525634765625, 0.0935821533203125, 0.111907958984375, 0.1302337646484375, 0.1485595703125, 0.1668853759765625, 0.185211181640625, 0.2035369873046875, 0.22186279296875, 0.2401885986328125, 0.258514404296875, 0.2768402099609375, 0.295166015625, 0.3134918212890625, 0.331817626953125, 0.3501434326171875, 0.36846923828125, 0.3867950439453125, 0.405120849609375, 0.4234466552734375, 0.4417724609375, 0.4600982666015625, 0.478424072265625, 0.4967498779296875, 0.51507568359375, 0.5334014892578125, 0.551727294921875, 0.5700531005859375, 0.58837890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 9.0, 8.0, 4.0, 11.0, 15.0, 10.0, 29.0, 32.0, 58.0, 79.0, 132.0, 138.0, 123.0, 109.0, 52.0, 54.0, 31.0, 25.0, 21.0, 13.0, 10.0, 4.0, 8.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0001537799835205078, -0.00014959368854761124, -0.00014540739357471466, -0.00014122109860181808, -0.0001370348036289215, -0.00013284850865602493, -0.00012866221368312836, -0.00012447591871023178, -0.0001202896237373352, -0.00011610332876443863, -0.00011191703379154205, -0.00010773073881864548, -0.0001035444438457489, -9.935814887285233e-05, -9.517185389995575e-05, -9.098555892705917e-05, -8.67992639541626e-05, -8.261296898126602e-05, -7.842667400836945e-05, -7.424037903547287e-05, -7.00540840625763e-05, -6.586778908967972e-05, -6.168149411678314e-05, -5.7495199143886566e-05, -5.330890417098999e-05, -4.9122609198093414e-05, -4.493631422519684e-05, -4.075001925230026e-05, -3.6563724279403687e-05, -3.237742930650711e-05, -2.8191134333610535e-05, -2.400483936071396e-05, -1.9818544387817383e-05, -1.5632249414920807e-05, -1.1445954442024231e-05, -7.259659469127655e-06, -3.073364496231079e-06, 1.1129304766654968e-06, 5.299225449562073e-06, 9.485520422458649e-06, 1.3671815395355225e-05, 1.78581103682518e-05, 2.2044405341148376e-05, 2.6230700314044952e-05, 3.041699528694153e-05, 3.4603290259838104e-05, 3.878958523273468e-05, 4.2975880205631256e-05, 4.716217517852783e-05, 5.134847015142441e-05, 5.5534765124320984e-05, 5.972106009721756e-05, 6.390735507011414e-05, 6.809365004301071e-05, 7.227994501590729e-05, 7.646623998880386e-05, 8.065253496170044e-05, 8.483882993459702e-05, 8.902512490749359e-05, 9.321141988039017e-05, 9.739771485328674e-05, 0.00010158400982618332, 0.0001057703047990799, 0.00010995659977197647, 0.00011414289474487305]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 5.0, 6.0, 13.0, 15.0, 6.0, 23.0, 28.0, 36.0, 54.0, 121.0, 135.0, 180.0, 241.0, 371.0, 502.0, 698.0, 1023.0, 1353.0, 1963.0, 2756.0, 4156.0, 6173.0, 9630.0, 15897.0, 28363.0, 53271.0, 103442.0, 180835.0, 229634.0, 179309.0, 102224.0, 52945.0, 27950.0, 15943.0, 9587.0, 6093.0, 4052.0, 2749.0, 1948.0, 1347.0, 1008.0, 711.0, 529.0, 375.0, 227.0, 172.0, 140.0, 106.0, 67.0, 47.0, 28.0, 26.0, 16.0, 11.0, 12.0, 3.0, 3.0, 3.0, 5.0, 2.0, 2.0], "bins": [-0.36328125, -0.35174560546875, -0.3402099609375, -0.32867431640625, -0.317138671875, -0.30560302734375, -0.2940673828125, -0.28253173828125, -0.27099609375, -0.25946044921875, -0.2479248046875, -0.23638916015625, -0.224853515625, -0.21331787109375, -0.2017822265625, -0.19024658203125, -0.1787109375, -0.16717529296875, -0.1556396484375, -0.14410400390625, -0.132568359375, -0.12103271484375, -0.1094970703125, -0.09796142578125, -0.08642578125, -0.07489013671875, -0.0633544921875, -0.05181884765625, -0.040283203125, -0.02874755859375, -0.0172119140625, -0.00567626953125, 0.005859375, 0.01739501953125, 0.0289306640625, 0.04046630859375, 0.052001953125, 0.06353759765625, 0.0750732421875, 0.08660888671875, 0.09814453125, 0.10968017578125, 0.1212158203125, 0.13275146484375, 0.144287109375, 0.15582275390625, 0.1673583984375, 0.17889404296875, 0.1904296875, 0.20196533203125, 0.2135009765625, 0.22503662109375, 0.236572265625, 0.24810791015625, 0.2596435546875, 0.27117919921875, 0.28271484375, 0.29425048828125, 0.3057861328125, 0.31732177734375, 0.328857421875, 0.34039306640625, 0.3519287109375, 0.36346435546875, 0.375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 8.0, 7.0, 14.0, 16.0, 18.0, 27.0, 30.0, 44.0, 78.0, 112.0, 88.0, 97.0, 91.0, 91.0, 70.0, 47.0, 25.0, 28.0, 17.0, 11.0, 10.0, 7.0, 6.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18603515625, -0.17988014221191406, -0.17372512817382812, -0.1675701141357422, -0.16141510009765625, -0.1552600860595703, -0.14910507202148438, -0.14295005798339844, -0.1367950439453125, -0.13064002990722656, -0.12448501586914062, -0.11833000183105469, -0.11217498779296875, -0.10601997375488281, -0.09986495971679688, -0.09370994567871094, -0.087554931640625, -0.08139991760253906, -0.07524490356445312, -0.06908988952636719, -0.06293487548828125, -0.05677986145019531, -0.050624847412109375, -0.04446983337402344, -0.0383148193359375, -0.03215980529785156, -0.026004791259765625, -0.019849777221679688, -0.01369476318359375, -0.0075397491455078125, -0.001384735107421875, 0.0047702789306640625, 0.01092529296875, 0.017080307006835938, 0.023235321044921875, 0.029390335083007812, 0.03554534912109375, 0.04170036315917969, 0.047855377197265625, 0.05401039123535156, 0.0601654052734375, 0.06632041931152344, 0.07247543334960938, 0.07863044738769531, 0.08478546142578125, 0.09094047546386719, 0.09709548950195312, 0.10325050354003906, 0.109405517578125, 0.11556053161621094, 0.12171554565429688, 0.1278705596923828, 0.13402557373046875, 0.1401805877685547, 0.14633560180664062, 0.15249061584472656, 0.1586456298828125, 0.16480064392089844, 0.17095565795898438, 0.1771106719970703, 0.18326568603515625, 0.1894207000732422, 0.19557571411132812, 0.20173072814941406, 0.2078857421875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 6.0, 11.0, 10.0, 12.0, 17.0, 17.0, 16.0, 11.0, 16.0, 28.0, 25.0, 36.0, 29.0, 34.0, 38.0, 41.0, 39.0, 46.0, 37.0, 36.0, 38.0, 43.0, 51.0, 28.0, 38.0, 23.0, 26.0, 30.0, 26.0, 21.0, 27.0, 23.0, 19.0, 22.0, 9.0, 15.0, 10.0, 4.0, 11.0, 7.0, 7.0, 3.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.513746738433838, -3.388150691986084, -3.26255464553833, -3.136958599090576, -3.0113625526428223, -2.8857665061950684, -2.7601704597473145, -2.6345744132995605, -2.5089783668518066, -2.3833823204040527, -2.257786273956299, -2.132190227508545, -2.006594181060791, -1.880998134613037, -1.7554022073745728, -1.6298061609268188, -1.5042102336883545, -1.3786141872406006, -1.2530181407928467, -1.1274220943450928, -1.0018260478973389, -0.8762300610542297, -0.7506340742111206, -0.6250380277633667, -0.4994419813156128, -0.3738459348678589, -0.24824991822242737, -0.12265390157699585, 0.0029421448707580566, 0.12853819131851196, 0.2541341781616211, 0.379730224609375, 0.5053262710571289, 0.6309223175048828, 0.7565183639526367, 0.8821143507957458, 1.0077104568481445, 1.1333065032958984, 1.2589024305343628, 1.3844984769821167, 1.5100945234298706, 1.6356905698776245, 1.7612866163253784, 1.8868825435638428, 2.0124785900115967, 2.1380746364593506, 2.2636706829071045, 2.3892667293548584, 2.5148627758026123, 2.640458822250366, 2.76605486869812, 2.891650915145874, 3.017246961593628, 3.142843008041382, 3.2684388160705566, 3.3940348625183105, 3.5196309089660645, 3.6452269554138184, 3.7708230018615723, 3.896419048309326, 4.02201509475708, 4.147611141204834, 4.273207187652588, 4.398803234100342, 4.524399280548096]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 4.0, 8.0, 8.0, 7.0, 6.0, 11.0, 12.0, 11.0, 12.0, 18.0, 19.0, 20.0, 21.0, 20.0, 22.0, 29.0, 48.0, 32.0, 34.0, 38.0, 31.0, 34.0, 34.0, 48.0, 31.0, 46.0, 44.0, 32.0, 23.0, 34.0, 34.0, 24.0, 14.0, 22.0, 26.0, 19.0, 10.0, 17.0, 22.0, 12.0, 15.0, 7.0, 4.0, 10.0, 10.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.607686996459961, -4.469289779663086, -4.330893039703369, -4.192495822906494, -4.054099082946777, -3.9157018661499023, -3.7773048877716064, -3.6389079093933105, -3.5005109310150146, -3.3621139526367188, -3.223716974258423, -3.085319995880127, -2.946922779083252, -2.808526039123535, -2.67012882232666, -2.5317318439483643, -2.3933348655700684, -2.2549378871917725, -2.1165409088134766, -1.9781438112258911, -1.8397468328475952, -1.7013498544692993, -1.5629527568817139, -1.424555778503418, -1.286158800125122, -1.1477618217468262, -1.0093648433685303, -0.8709677457809448, -0.7325707674026489, -0.594173789024353, -0.45577675104141235, -0.3173797130584717, -0.17898225784301758, -0.04058524966239929, 0.097811758518219, 0.23620876669883728, 0.37460577487945557, 0.5130027532577515, 0.6513997912406921, 0.7897968292236328, 0.9281938076019287, 1.0665907859802246, 1.2049877643585205, 1.343384861946106, 1.4817818403244019, 1.6201788187026978, 1.7585759162902832, 1.896972894668579, 2.035369873046875, 2.173766851425171, 2.312163829803467, 2.4505608081817627, 2.5889577865600586, 2.7273550033569336, 2.8657519817352295, 3.0041489601135254, 3.1425459384918213, 3.280942916870117, 3.419339895248413, 3.557736873626709, 3.696134090423584, 3.834530830383301, 3.972928047180176, 4.111325263977051, 4.249722003936768]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 10.0, 23.0, 22.0, 37.0, 82.0, 105.0, 188.0, 255.0, 437.0, 696.0, 1046.0, 1673.0, 2716.0, 4168.0, 6463.0, 10087.0, 15738.0, 23355.0, 34499.0, 49191.0, 66879.0, 86388.0, 102636.0, 114272.0, 113846.0, 104519.0, 87484.0, 67597.0, 50173.0, 35320.0, 23982.0, 15913.0, 10330.0, 6583.0, 4375.0, 2704.0, 1807.0, 1078.0, 655.0, 447.0, 298.0, 174.0, 115.0, 68.0, 54.0, 24.0, 16.0, 9.0, 4.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.958984375, -2.863616943359375, -2.76824951171875, -2.672882080078125, -2.5775146484375, -2.482147216796875, -2.38677978515625, -2.291412353515625, -2.196044921875, -2.100677490234375, -2.00531005859375, -1.909942626953125, -1.8145751953125, -1.719207763671875, -1.62384033203125, -1.528472900390625, -1.43310546875, -1.337738037109375, -1.24237060546875, -1.147003173828125, -1.0516357421875, -0.956268310546875, -0.86090087890625, -0.765533447265625, -0.670166015625, -0.574798583984375, -0.47943115234375, -0.384063720703125, -0.2886962890625, -0.193328857421875, -0.09796142578125, -0.002593994140625, 0.0927734375, 0.188140869140625, 0.28350830078125, 0.378875732421875, 0.4742431640625, 0.569610595703125, 0.66497802734375, 0.760345458984375, 0.855712890625, 0.951080322265625, 1.04644775390625, 1.141815185546875, 1.2371826171875, 1.332550048828125, 1.42791748046875, 1.523284912109375, 1.61865234375, 1.714019775390625, 1.80938720703125, 1.904754638671875, 2.0001220703125, 2.095489501953125, 2.19085693359375, 2.286224365234375, 2.381591796875, 2.476959228515625, 2.57232666015625, 2.667694091796875, 2.7630615234375, 2.858428955078125, 2.95379638671875, 3.049163818359375, 3.14453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 9.0, 7.0, 6.0, 13.0, 14.0, 16.0, 18.0, 5.0, 15.0, 20.0, 22.0, 23.0, 21.0, 25.0, 29.0, 46.0, 29.0, 38.0, 40.0, 36.0, 43.0, 41.0, 44.0, 44.0, 28.0, 38.0, 37.0, 23.0, 26.0, 22.0, 22.0, 25.0, 18.0, 21.0, 22.0, 10.0, 19.0, 10.0, 11.0, 11.0, 9.0, 6.0, 6.0, 12.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0], "bins": [-4.92578125, -4.786376953125, -4.64697265625, -4.507568359375, -4.3681640625, -4.228759765625, -4.08935546875, -3.949951171875, -3.810546875, -3.671142578125, -3.53173828125, -3.392333984375, -3.2529296875, -3.113525390625, -2.97412109375, -2.834716796875, -2.6953125, -2.555908203125, -2.41650390625, -2.277099609375, -2.1376953125, -1.998291015625, -1.85888671875, -1.719482421875, -1.580078125, -1.440673828125, -1.30126953125, -1.161865234375, -1.0224609375, -0.883056640625, -0.74365234375, -0.604248046875, -0.46484375, -0.325439453125, -0.18603515625, -0.046630859375, 0.0927734375, 0.232177734375, 0.37158203125, 0.510986328125, 0.650390625, 0.789794921875, 0.92919921875, 1.068603515625, 1.2080078125, 1.347412109375, 1.48681640625, 1.626220703125, 1.765625, 1.905029296875, 2.04443359375, 2.183837890625, 2.3232421875, 2.462646484375, 2.60205078125, 2.741455078125, 2.880859375, 3.020263671875, 3.15966796875, 3.299072265625, 3.4384765625, 3.577880859375, 3.71728515625, 3.856689453125, 3.99609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 13.0, 13.0, 37.0, 51.0, 97.0, 183.0, 346.0, 580.0, 1033.0, 1805.0, 3155.0, 5850.0, 10011.0, 17487.0, 29288.0, 47179.0, 72131.0, 101799.0, 129403.0, 143788.0, 138726.0, 115415.0, 84869.0, 56884.0, 36663.0, 21600.0, 12944.0, 7533.0, 4162.0, 2382.0, 1321.0, 748.0, 442.0, 260.0, 144.0, 83.0, 56.0, 31.0, 11.0, 14.0, 1.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3359375, -4.20343017578125, -4.0709228515625, -3.93841552734375, -3.805908203125, -3.67340087890625, -3.5408935546875, -3.40838623046875, -3.27587890625, -3.14337158203125, -3.0108642578125, -2.87835693359375, -2.745849609375, -2.61334228515625, -2.4808349609375, -2.34832763671875, -2.2158203125, -2.08331298828125, -1.9508056640625, -1.81829833984375, -1.685791015625, -1.55328369140625, -1.4207763671875, -1.28826904296875, -1.15576171875, -1.02325439453125, -0.8907470703125, -0.75823974609375, -0.625732421875, -0.49322509765625, -0.3607177734375, -0.22821044921875, -0.095703125, 0.03680419921875, 0.1693115234375, 0.30181884765625, 0.434326171875, 0.56683349609375, 0.6993408203125, 0.83184814453125, 0.96435546875, 1.09686279296875, 1.2293701171875, 1.36187744140625, 1.494384765625, 1.62689208984375, 1.7593994140625, 1.89190673828125, 2.0244140625, 2.15692138671875, 2.2894287109375, 2.42193603515625, 2.554443359375, 2.68695068359375, 2.8194580078125, 2.95196533203125, 3.08447265625, 3.21697998046875, 3.3494873046875, 3.48199462890625, 3.614501953125, 3.74700927734375, 3.8795166015625, 4.01202392578125, 4.14453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 1.0, 7.0, 9.0, 8.0, 12.0, 16.0, 11.0, 23.0, 15.0, 26.0, 16.0, 25.0, 14.0, 33.0, 27.0, 33.0, 36.0, 42.0, 39.0, 28.0, 38.0, 39.0, 35.0, 37.0, 35.0, 35.0, 33.0, 47.0, 27.0, 24.0, 32.0, 24.0, 23.0, 20.0, 22.0, 12.0, 19.0, 15.0, 12.0, 6.0, 12.0, 8.0, 7.0, 4.0, 9.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.15234375, -3.06341552734375, -2.9744873046875, -2.88555908203125, -2.796630859375, -2.70770263671875, -2.6187744140625, -2.52984619140625, -2.44091796875, -2.35198974609375, -2.2630615234375, -2.17413330078125, -2.085205078125, -1.99627685546875, -1.9073486328125, -1.81842041015625, -1.7294921875, -1.64056396484375, -1.5516357421875, -1.46270751953125, -1.373779296875, -1.28485107421875, -1.1959228515625, -1.10699462890625, -1.01806640625, -0.92913818359375, -0.8402099609375, -0.75128173828125, -0.662353515625, -0.57342529296875, -0.4844970703125, -0.39556884765625, -0.306640625, -0.21771240234375, -0.1287841796875, -0.03985595703125, 0.049072265625, 0.13800048828125, 0.2269287109375, 0.31585693359375, 0.40478515625, 0.49371337890625, 0.5826416015625, 0.67156982421875, 0.760498046875, 0.84942626953125, 0.9383544921875, 1.02728271484375, 1.1162109375, 1.20513916015625, 1.2940673828125, 1.38299560546875, 1.471923828125, 1.56085205078125, 1.6497802734375, 1.73870849609375, 1.82763671875, 1.91656494140625, 2.0054931640625, 2.09442138671875, 2.183349609375, 2.27227783203125, 2.3612060546875, 2.45013427734375, 2.5390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 9.0, 10.0, 18.0, 27.0, 32.0, 52.0, 81.0, 135.0, 198.0, 334.0, 520.0, 785.0, 1310.0, 2237.0, 3545.0, 6157.0, 10372.0, 17543.0, 29623.0, 47774.0, 74802.0, 106636.0, 136040.0, 150461.0, 138955.0, 111590.0, 79325.0, 51322.0, 31826.0, 19099.0, 11227.0, 6541.0, 3909.0, 2296.0, 1410.0, 837.0, 555.0, 332.0, 206.0, 148.0, 93.0, 61.0, 48.0, 22.0, 21.0, 8.0, 9.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.58984375, -1.53948974609375, -1.4891357421875, -1.43878173828125, -1.388427734375, -1.33807373046875, -1.2877197265625, -1.23736572265625, -1.18701171875, -1.13665771484375, -1.0863037109375, -1.03594970703125, -0.985595703125, -0.93524169921875, -0.8848876953125, -0.83453369140625, -0.7841796875, -0.73382568359375, -0.6834716796875, -0.63311767578125, -0.582763671875, -0.53240966796875, -0.4820556640625, -0.43170166015625, -0.38134765625, -0.33099365234375, -0.2806396484375, -0.23028564453125, -0.179931640625, -0.12957763671875, -0.0792236328125, -0.02886962890625, 0.021484375, 0.07183837890625, 0.1221923828125, 0.17254638671875, 0.222900390625, 0.27325439453125, 0.3236083984375, 0.37396240234375, 0.42431640625, 0.47467041015625, 0.5250244140625, 0.57537841796875, 0.625732421875, 0.67608642578125, 0.7264404296875, 0.77679443359375, 0.8271484375, 0.87750244140625, 0.9278564453125, 0.97821044921875, 1.028564453125, 1.07891845703125, 1.1292724609375, 1.17962646484375, 1.22998046875, 1.28033447265625, 1.3306884765625, 1.38104248046875, 1.431396484375, 1.48175048828125, 1.5321044921875, 1.58245849609375, 1.6328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 9.0, 11.0, 5.0, 12.0, 14.0, 13.0, 15.0, 21.0, 20.0, 32.0, 31.0, 38.0, 43.0, 56.0, 44.0, 39.0, 42.0, 52.0, 58.0, 57.0, 40.0, 48.0, 49.0, 34.0, 29.0, 29.0, 31.0, 17.0, 18.0, 11.0, 10.0, 11.0, 5.0, 15.0, 7.0, 6.0, 2.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00015115737915039062, -0.00014615431427955627, -0.00014115124940872192, -0.00013614818453788757, -0.00013114511966705322, -0.00012614205479621887, -0.00012113898992538452, -0.00011613592505455017, -0.00011113286018371582, -0.00010612979531288147, -0.00010112673044204712, -9.612366557121277e-05, -9.112060070037842e-05, -8.611753582954407e-05, -8.111447095870972e-05, -7.611140608787537e-05, -7.110834121704102e-05, -6.610527634620667e-05, -6.110221147537231e-05, -5.6099146604537964e-05, -5.109608173370361e-05, -4.609301686286926e-05, -4.108995199203491e-05, -3.608688712120056e-05, -3.108382225036621e-05, -2.608075737953186e-05, -2.107769250869751e-05, -1.607462763786316e-05, -1.1071562767028809e-05, -6.068497896194458e-06, -1.0654330253601074e-06, 3.937631845474243e-06, 8.940696716308594e-06, 1.3943761587142944e-05, 1.8946826457977295e-05, 2.3949891328811646e-05, 2.8952956199645996e-05, 3.395602107048035e-05, 3.89590859413147e-05, 4.396215081214905e-05, 4.89652156829834e-05, 5.396828055381775e-05, 5.89713454246521e-05, 6.397441029548645e-05, 6.89774751663208e-05, 7.398054003715515e-05, 7.89836049079895e-05, 8.398666977882385e-05, 8.89897346496582e-05, 9.399279952049255e-05, 9.89958643913269e-05, 0.00010399892926216125, 0.0001090019941329956, 0.00011400505900382996, 0.0001190081238746643, 0.00012401118874549866, 0.000129014253616333, 0.00013401731848716736, 0.0001390203833580017, 0.00014402344822883606, 0.0001490265130996704, 0.00015402957797050476, 0.0001590326428413391, 0.00016403570771217346, 0.0001690387725830078]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 7.0, 12.0, 8.0, 14.0, 30.0, 27.0, 50.0, 80.0, 143.0, 220.0, 339.0, 570.0, 985.0, 1651.0, 2739.0, 4858.0, 8333.0, 14254.0, 24013.0, 38940.0, 60546.0, 87956.0, 116808.0, 137580.0, 140799.0, 124890.0, 98537.0, 69668.0, 45501.0, 28181.0, 16933.0, 9821.0, 5910.0, 3386.0, 1909.0, 1172.0, 624.0, 409.0, 240.0, 158.0, 85.0, 59.0, 38.0, 20.0, 24.0, 8.0, 7.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.6396484375, -1.5916595458984375, -1.543670654296875, -1.4956817626953125, -1.44769287109375, -1.3997039794921875, -1.351715087890625, -1.3037261962890625, -1.2557373046875, -1.2077484130859375, -1.159759521484375, -1.1117706298828125, -1.06378173828125, -1.0157928466796875, -0.967803955078125, -0.9198150634765625, -0.871826171875, -0.8238372802734375, -0.775848388671875, -0.7278594970703125, -0.67987060546875, -0.6318817138671875, -0.583892822265625, -0.5359039306640625, -0.4879150390625, -0.4399261474609375, -0.391937255859375, -0.3439483642578125, -0.29595947265625, -0.2479705810546875, -0.199981689453125, -0.1519927978515625, -0.10400390625, -0.0560150146484375, -0.008026123046875, 0.0399627685546875, 0.08795166015625, 0.1359405517578125, 0.183929443359375, 0.2319183349609375, 0.2799072265625, 0.3278961181640625, 0.375885009765625, 0.4238739013671875, 0.47186279296875, 0.5198516845703125, 0.567840576171875, 0.6158294677734375, 0.663818359375, 0.7118072509765625, 0.759796142578125, 0.8077850341796875, 0.85577392578125, 0.9037628173828125, 0.951751708984375, 0.9997406005859375, 1.0477294921875, 1.0957183837890625, 1.143707275390625, 1.1916961669921875, 1.23968505859375, 1.2876739501953125, 1.335662841796875, 1.3836517333984375, 1.431640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 9.0, 7.0, 6.0, 7.0, 12.0, 13.0, 17.0, 17.0, 22.0, 18.0, 28.0, 26.0, 33.0, 34.0, 46.0, 34.0, 43.0, 40.0, 36.0, 47.0, 43.0, 49.0, 38.0, 52.0, 34.0, 29.0, 28.0, 39.0, 20.0, 25.0, 26.0, 14.0, 21.0, 11.0, 17.0, 12.0, 11.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.572265625, -0.5557670593261719, -0.5392684936523438, -0.5227699279785156, -0.5062713623046875, -0.4897727966308594, -0.47327423095703125, -0.4567756652832031, -0.440277099609375, -0.4237785339355469, -0.40727996826171875, -0.3907814025878906, -0.3742828369140625, -0.3577842712402344, -0.34128570556640625, -0.3247871398925781, -0.30828857421875, -0.2917900085449219, -0.27529144287109375, -0.2587928771972656, -0.2422943115234375, -0.22579574584960938, -0.20929718017578125, -0.19279861450195312, -0.176300048828125, -0.15980148315429688, -0.14330291748046875, -0.12680435180664062, -0.1103057861328125, -0.09380722045898438, -0.07730865478515625, -0.060810089111328125, -0.0443115234375, -0.027812957763671875, -0.01131439208984375, 0.005184173583984375, 0.0216827392578125, 0.038181304931640625, 0.05467987060546875, 0.07117843627929688, 0.087677001953125, 0.10417556762695312, 0.12067413330078125, 0.13717269897460938, 0.1536712646484375, 0.17016983032226562, 0.18666839599609375, 0.20316696166992188, 0.21966552734375, 0.23616409301757812, 0.25266265869140625, 0.2691612243652344, 0.2856597900390625, 0.3021583557128906, 0.31865692138671875, 0.3351554870605469, 0.351654052734375, 0.3681526184082031, 0.38465118408203125, 0.4011497497558594, 0.4176483154296875, 0.4341468811035156, 0.45064544677734375, 0.4671440124511719, 0.483642578125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 8.0, 4.0, 5.0, 5.0, 14.0, 9.0, 17.0, 20.0, 11.0, 23.0, 25.0, 23.0, 19.0, 20.0, 27.0, 35.0, 48.0, 35.0, 45.0, 33.0, 38.0, 44.0, 38.0, 50.0, 30.0, 22.0, 34.0, 41.0, 25.0, 28.0, 23.0, 25.0, 24.0, 19.0, 19.0, 18.0, 20.0, 10.0, 11.0, 7.0, 13.0, 10.0, 5.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.537482500076294, -3.419198989868164, -3.3009157180786133, -3.1826322078704834, -3.0643489360809326, -2.9460654258728027, -2.827782154083252, -2.709498643875122, -2.591215133666992, -2.4729316234588623, -2.3546483516693115, -2.2363648414611816, -2.118081569671631, -1.999798059463501, -1.8815146684646606, -1.7632312774658203, -1.6449480056762695, -1.5266646146774292, -1.4083812236785889, -1.290097713470459, -1.1718144416809082, -1.0535309314727783, -0.935247540473938, -0.8169641494750977, -0.6986807584762573, -0.580397367477417, -0.4621139466762543, -0.34383052587509155, -0.22554713487625122, -0.10726374387741089, 0.011019706726074219, 0.12930309772491455, 0.24758672714233398, 0.3658701181411743, 0.48415353894233704, 0.6024369597434998, 0.7207203507423401, 0.8390037417411804, 0.9572871923446655, 1.0755705833435059, 1.1938539743423462, 1.3121373653411865, 1.4304207563400269, 1.5487041473388672, 1.666987657546997, 1.7852709293365479, 1.9035544395446777, 2.0218377113342285, 2.1401212215423584, 2.2584047317504883, 2.376688003540039, 2.494971513748169, 2.6132547855377197, 2.7315382957458496, 2.8498215675354004, 2.9681050777435303, 3.08638858795166, 3.20467209815979, 3.322955369949341, 3.4412388801574707, 3.5595221519470215, 3.6778056621551514, 3.7960891723632812, 3.914372444152832, 4.032655715942383]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 7.0, 2.0, 1.0, 4.0, 7.0, 8.0, 15.0, 11.0, 21.0, 17.0, 14.0, 26.0, 24.0, 24.0, 21.0, 42.0, 35.0, 33.0, 44.0, 31.0, 40.0, 34.0, 32.0, 39.0, 41.0, 42.0, 30.0, 37.0, 26.0, 34.0, 30.0, 28.0, 47.0, 21.0, 19.0, 15.0, 16.0, 17.0, 14.0, 6.0, 7.0, 8.0, 8.0, 6.0, 4.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.582244396209717, -4.433873176574707, -4.285501480102539, -4.137130260467529, -3.9887590408325195, -3.8403878211975098, -3.692016363143921, -3.543644905090332, -3.3952736854553223, -3.2469024658203125, -3.0985310077667236, -2.9501595497131348, -2.801788330078125, -2.6534171104431152, -2.5050456523895264, -2.3566741943359375, -2.2083029747009277, -2.059931755065918, -1.911560297012329, -1.7631889581680298, -1.6148176193237305, -1.4664462804794312, -1.3180749416351318, -1.1697036027908325, -1.0213322639465332, -0.8729609251022339, -0.7245895862579346, -0.5762182474136353, -0.42784690856933594, -0.2794755697250366, -0.1311042308807373, 0.01726710796356201, 0.16563844680786133, 0.31400978565216064, 0.46238112449645996, 0.6107524633407593, 0.7591238021850586, 0.9074951410293579, 1.0558664798736572, 1.2042378187179565, 1.3526091575622559, 1.5009804964065552, 1.6493518352508545, 1.7977231740951538, 1.9460945129394531, 2.094465732574463, 2.2428371906280518, 2.3912086486816406, 2.5395798683166504, 2.68795108795166, 2.836322546005249, 2.984694004058838, 3.1330652236938477, 3.2814364433288574, 3.4298079013824463, 3.578179359436035, 3.726550579071045, 3.8749217987060547, 4.023293495178223, 4.171664714813232, 4.320035934448242, 4.468407154083252, 4.616778373718262, 4.76515007019043, 4.9135212898254395]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 4.0, 2.0, 4.0, 12.0, 16.0, 21.0, 36.0, 33.0, 79.0, 96.0, 177.0, 263.0, 410.0, 654.0, 967.0, 1666.0, 2741.0, 4419.0, 7392.0, 12597.0, 21278.0, 36990.0, 66460.0, 122776.0, 225273.0, 389350.0, 589348.0, 728536.0, 700737.0, 530071.0, 332549.0, 187365.0, 102002.0, 55732.0, 30768.0, 17838.0, 10282.0, 6010.0, 3544.0, 2206.0, 1319.0, 818.0, 526.0, 328.0, 198.0, 127.0, 97.0, 56.0, 37.0, 27.0, 16.0, 13.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.533203125, -3.41864013671875, -3.3040771484375, -3.18951416015625, -3.074951171875, -2.96038818359375, -2.8458251953125, -2.73126220703125, -2.61669921875, -2.50213623046875, -2.3875732421875, -2.27301025390625, -2.158447265625, -2.04388427734375, -1.9293212890625, -1.81475830078125, -1.7001953125, -1.58563232421875, -1.4710693359375, -1.35650634765625, -1.241943359375, -1.12738037109375, -1.0128173828125, -0.89825439453125, -0.78369140625, -0.66912841796875, -0.5545654296875, -0.44000244140625, -0.325439453125, -0.21087646484375, -0.0963134765625, 0.01824951171875, 0.1328125, 0.24737548828125, 0.3619384765625, 0.47650146484375, 0.591064453125, 0.70562744140625, 0.8201904296875, 0.93475341796875, 1.04931640625, 1.16387939453125, 1.2784423828125, 1.39300537109375, 1.507568359375, 1.62213134765625, 1.7366943359375, 1.85125732421875, 1.9658203125, 2.08038330078125, 2.1949462890625, 2.30950927734375, 2.424072265625, 2.53863525390625, 2.6531982421875, 2.76776123046875, 2.88232421875, 2.99688720703125, 3.1114501953125, 3.22601318359375, 3.340576171875, 3.45513916015625, 3.5697021484375, 3.68426513671875, 3.798828125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 2.0, 3.0, 2.0, 4.0, 4.0, 10.0, 7.0, 8.0, 7.0, 18.0, 15.0, 17.0, 18.0, 18.0, 34.0, 28.0, 32.0, 28.0, 40.0, 34.0, 30.0, 34.0, 41.0, 38.0, 53.0, 26.0, 51.0, 41.0, 29.0, 36.0, 28.0, 28.0, 25.0, 35.0, 29.0, 25.0, 13.0, 20.0, 13.0, 19.0, 12.0, 7.0, 13.0, 8.0, 6.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.830078125, -3.703826904296875, -3.57757568359375, -3.451324462890625, -3.3250732421875, -3.198822021484375, -3.07257080078125, -2.946319580078125, -2.820068359375, -2.693817138671875, -2.56756591796875, -2.441314697265625, -2.3150634765625, -2.188812255859375, -2.06256103515625, -1.936309814453125, -1.81005859375, -1.683807373046875, -1.55755615234375, -1.431304931640625, -1.3050537109375, -1.178802490234375, -1.05255126953125, -0.926300048828125, -0.800048828125, -0.673797607421875, -0.54754638671875, -0.421295166015625, -0.2950439453125, -0.168792724609375, -0.04254150390625, 0.083709716796875, 0.2099609375, 0.336212158203125, 0.46246337890625, 0.588714599609375, 0.7149658203125, 0.841217041015625, 0.96746826171875, 1.093719482421875, 1.219970703125, 1.346221923828125, 1.47247314453125, 1.598724365234375, 1.7249755859375, 1.851226806640625, 1.97747802734375, 2.103729248046875, 2.22998046875, 2.356231689453125, 2.48248291015625, 2.608734130859375, 2.7349853515625, 2.861236572265625, 2.98748779296875, 3.113739013671875, 3.239990234375, 3.366241455078125, 3.49249267578125, 3.618743896484375, 3.7449951171875, 3.871246337890625, 3.99749755859375, 4.123748779296875, 4.25]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 9.0, 25.0, 37.0, 54.0, 65.0, 133.0, 216.0, 321.0, 638.0, 1067.0, 1728.0, 2847.0, 4943.0, 8418.0, 13831.0, 23900.0, 41520.0, 72117.0, 124337.0, 210272.0, 344827.0, 518964.0, 673088.0, 685841.0, 547042.0, 369331.0, 227076.0, 135167.0, 78319.0, 45034.0, 26194.0, 15099.0, 8906.0, 5319.0, 3094.0, 1801.0, 1093.0, 631.0, 409.0, 233.0, 130.0, 81.0, 58.0, 25.0, 19.0, 10.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.1484375, -4.01910400390625, -3.8897705078125, -3.76043701171875, -3.631103515625, -3.50177001953125, -3.3724365234375, -3.24310302734375, -3.11376953125, -2.98443603515625, -2.8551025390625, -2.72576904296875, -2.596435546875, -2.46710205078125, -2.3377685546875, -2.20843505859375, -2.0791015625, -1.94976806640625, -1.8204345703125, -1.69110107421875, -1.561767578125, -1.43243408203125, -1.3031005859375, -1.17376708984375, -1.04443359375, -0.91510009765625, -0.7857666015625, -0.65643310546875, -0.527099609375, -0.39776611328125, -0.2684326171875, -0.13909912109375, -0.009765625, 0.11956787109375, 0.2489013671875, 0.37823486328125, 0.507568359375, 0.63690185546875, 0.7662353515625, 0.89556884765625, 1.02490234375, 1.15423583984375, 1.2835693359375, 1.41290283203125, 1.542236328125, 1.67156982421875, 1.8009033203125, 1.93023681640625, 2.0595703125, 2.18890380859375, 2.3182373046875, 2.44757080078125, 2.576904296875, 2.70623779296875, 2.8355712890625, 2.96490478515625, 3.09423828125, 3.22357177734375, 3.3529052734375, 3.48223876953125, 3.611572265625, 3.74090576171875, 3.8702392578125, 3.99957275390625, 4.12890625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 6.0, 8.0, 3.0, 4.0, 8.0, 12.0, 25.0, 27.0, 35.0, 44.0, 48.0, 57.0, 72.0, 69.0, 108.0, 99.0, 143.0, 156.0, 187.0, 195.0, 213.0, 245.0, 226.0, 248.0, 238.0, 234.0, 210.0, 191.0, 159.0, 132.0, 115.0, 121.0, 92.0, 66.0, 47.0, 57.0, 50.0, 26.0, 26.0, 15.0, 10.0, 11.0, 7.0, 11.0, 11.0, 5.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.767578125, -1.7144317626953125, -1.661285400390625, -1.6081390380859375, -1.55499267578125, -1.5018463134765625, -1.448699951171875, -1.3955535888671875, -1.3424072265625, -1.2892608642578125, -1.236114501953125, -1.1829681396484375, -1.12982177734375, -1.0766754150390625, -1.023529052734375, -0.9703826904296875, -0.917236328125, -0.8640899658203125, -0.810943603515625, -0.7577972412109375, -0.70465087890625, -0.6515045166015625, -0.598358154296875, -0.5452117919921875, -0.4920654296875, -0.4389190673828125, -0.385772705078125, -0.3326263427734375, -0.27947998046875, -0.2263336181640625, -0.173187255859375, -0.1200408935546875, -0.06689453125, -0.0137481689453125, 0.039398193359375, 0.0925445556640625, 0.14569091796875, 0.1988372802734375, 0.251983642578125, 0.3051300048828125, 0.3582763671875, 0.4114227294921875, 0.464569091796875, 0.5177154541015625, 0.57086181640625, 0.6240081787109375, 0.677154541015625, 0.7303009033203125, 0.783447265625, 0.8365936279296875, 0.889739990234375, 0.9428863525390625, 0.99603271484375, 1.0491790771484375, 1.102325439453125, 1.1554718017578125, 1.2086181640625, 1.2617645263671875, 1.314910888671875, 1.3680572509765625, 1.42120361328125, 1.4743499755859375, 1.527496337890625, 1.5806427001953125, 1.6337890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 5.0, 4.0, 11.0, 5.0, 14.0, 10.0, 20.0, 17.0, 20.0, 24.0, 26.0, 35.0, 43.0, 47.0, 32.0, 43.0, 37.0, 37.0, 37.0, 42.0, 44.0, 32.0, 36.0, 42.0, 45.0, 34.0, 29.0, 24.0, 33.0, 20.0, 21.0, 14.0, 15.0, 20.0, 16.0, 8.0, 11.0, 17.0, 10.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3410446643829346, -3.211775064468384, -3.082505702972412, -2.9532361030578613, -2.8239665031433105, -2.6946969032287598, -2.565427541732788, -2.4361579418182373, -2.3068885803222656, -2.177618980407715, -2.048349618911743, -1.9190800189971924, -1.7898104190826416, -1.6605409383773804, -1.5312714576721191, -1.4020018577575684, -1.2727322578430176, -1.1434627771377563, -1.0141931772232056, -0.8849236965179443, -0.7556541562080383, -0.6263846158981323, -0.4971151351928711, -0.3678455948829651, -0.23857605457305908, -0.10930652916431427, 0.019962996244430542, 0.14923250675201416, 0.27850204706192017, 0.40777158737182617, 0.5370410680770874, 0.6663106083869934, 0.7955803871154785, 0.9248499274253845, 1.0541194677352905, 1.1833889484405518, 1.3126585483551025, 1.4419280290603638, 1.571197509765625, 1.7004671096801758, 1.829736590385437, 1.9590060710906982, 2.088275671005249, 2.2175450325012207, 2.3468146324157715, 2.4760842323303223, 2.605353832244873, 2.7346231937408447, 2.8638927936553955, 2.9931623935699463, 3.122431755065918, 3.2517013549804688, 3.3809709548950195, 3.5102405548095703, 3.639509916305542, 3.7687795162200928, 3.8980488777160645, 4.027318477630615, 4.156588077545166, 4.285857200622559, 4.415126800537109, 4.54439640045166, 4.673666000366211, 4.802935600280762, 4.9322052001953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 8.0, 4.0, 6.0, 8.0, 10.0, 11.0, 10.0, 14.0, 17.0, 21.0, 19.0, 16.0, 21.0, 16.0, 27.0, 34.0, 39.0, 37.0, 34.0, 26.0, 45.0, 25.0, 39.0, 31.0, 38.0, 37.0, 35.0, 31.0, 32.0, 34.0, 24.0, 24.0, 27.0, 22.0, 25.0, 22.0, 25.0, 21.0, 20.0, 13.0, 7.0, 10.0, 8.0, 3.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-4.446274280548096, -4.311962127685547, -4.17764949798584, -4.043337345123291, -3.909025192260742, -3.7747128009796143, -3.6404004096984863, -3.5060882568359375, -3.3717758655548096, -3.2374634742736816, -3.103151321411133, -2.968838930130005, -2.834526538848877, -2.700214385986328, -2.5659019947052, -2.4315896034240723, -2.2972774505615234, -2.1629650592803955, -2.0286529064178467, -1.8943405151367188, -1.7600282430648804, -1.625715970993042, -1.491403579711914, -1.3570913076400757, -1.2227790355682373, -1.088466763496399, -0.9541544318199158, -0.8198421001434326, -0.6855298280715942, -0.5512175559997559, -0.4169052243232727, -0.28259289264678955, -0.14828109741210938, -0.013968795537948608, 0.12034350633621216, 0.2546558082103729, 0.3889681100845337, 0.5232803821563721, 0.6575927138328552, 0.7919050455093384, 0.9262173175811768, 1.0605295896530151, 1.1948418617248535, 1.3291542530059814, 1.4634665250778198, 1.5977787971496582, 1.7320911884307861, 1.8664034605026245, 2.000715732574463, 2.135028123855591, 2.2693402767181396, 2.4036526679992676, 2.5379648208618164, 2.6722772121429443, 2.8065896034240723, 2.940901756286621, 3.075214147567749, 3.209526538848877, 3.343838691711426, 3.4781510829925537, 3.6124634742736816, 3.7467756271362305, 3.8810880184173584, 4.015400409698486, 4.149712562561035]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 10.0, 13.0, 22.0, 32.0, 39.0, 52.0, 76.0, 113.0, 164.0, 254.0, 377.0, 565.0, 814.0, 1226.0, 1830.0, 2912.0, 4484.0, 6810.0, 10967.0, 17325.0, 27222.0, 41826.0, 63389.0, 90252.0, 120428.0, 141034.0, 138895.0, 117368.0, 87485.0, 60846.0, 39868.0, 25923.0, 16432.0, 10330.0, 6672.0, 4214.0, 2703.0, 1941.0, 1146.0, 829.0, 519.0, 357.0, 241.0, 150.0, 125.0, 83.0, 51.0, 44.0, 26.0, 20.0, 13.0, 14.0, 7.0, 2.0, 2.0, 2.0, 3.0], "bins": [-1.2587890625, -1.2205810546875, -1.182373046875, -1.1441650390625, -1.10595703125, -1.0677490234375, -1.029541015625, -0.9913330078125, -0.953125, -0.9149169921875, -0.876708984375, -0.8385009765625, -0.80029296875, -0.7620849609375, -0.723876953125, -0.6856689453125, -0.6474609375, -0.6092529296875, -0.571044921875, -0.5328369140625, -0.49462890625, -0.4564208984375, -0.418212890625, -0.3800048828125, -0.341796875, -0.3035888671875, -0.265380859375, -0.2271728515625, -0.18896484375, -0.1507568359375, -0.112548828125, -0.0743408203125, -0.0361328125, 0.0020751953125, 0.040283203125, 0.0784912109375, 0.11669921875, 0.1549072265625, 0.193115234375, 0.2313232421875, 0.26953125, 0.3077392578125, 0.345947265625, 0.3841552734375, 0.42236328125, 0.4605712890625, 0.498779296875, 0.5369873046875, 0.5751953125, 0.6134033203125, 0.651611328125, 0.6898193359375, 0.72802734375, 0.7662353515625, 0.804443359375, 0.8426513671875, 0.880859375, 0.9190673828125, 0.957275390625, 0.9954833984375, 1.03369140625, 1.0718994140625, 1.110107421875, 1.1483154296875, 1.1865234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 9.0, 11.0, 7.0, 8.0, 6.0, 8.0, 14.0, 16.0, 18.0, 21.0, 15.0, 22.0, 27.0, 36.0, 33.0, 38.0, 29.0, 29.0, 43.0, 32.0, 34.0, 37.0, 39.0, 38.0, 41.0, 35.0, 34.0, 25.0, 28.0, 22.0, 32.0, 27.0, 20.0, 28.0, 19.0, 23.0, 17.0, 15.0, 12.0, 14.0, 3.0, 5.0, 4.0, 6.0, 3.0, 5.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.5078125, -4.36627197265625, -4.2247314453125, -4.08319091796875, -3.941650390625, -3.80010986328125, -3.6585693359375, -3.51702880859375, -3.37548828125, -3.23394775390625, -3.0924072265625, -2.95086669921875, -2.809326171875, -2.66778564453125, -2.5262451171875, -2.38470458984375, -2.2431640625, -2.10162353515625, -1.9600830078125, -1.81854248046875, -1.677001953125, -1.53546142578125, -1.3939208984375, -1.25238037109375, -1.11083984375, -0.96929931640625, -0.8277587890625, -0.68621826171875, -0.544677734375, -0.40313720703125, -0.2615966796875, -0.12005615234375, 0.021484375, 0.16302490234375, 0.3045654296875, 0.44610595703125, 0.587646484375, 0.72918701171875, 0.8707275390625, 1.01226806640625, 1.15380859375, 1.29534912109375, 1.4368896484375, 1.57843017578125, 1.719970703125, 1.86151123046875, 2.0030517578125, 2.14459228515625, 2.2861328125, 2.42767333984375, 2.5692138671875, 2.71075439453125, 2.852294921875, 2.99383544921875, 3.1353759765625, 3.27691650390625, 3.41845703125, 3.55999755859375, 3.7015380859375, 3.84307861328125, 3.984619140625, 4.12615966796875, 4.2677001953125, 4.40924072265625, 4.55078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 15.0, 13.0, 21.0, 22.0, 27.0, 42.0, 51.0, 81.0, 107.0, 141.0, 252.0, 441.0, 798.0, 1563.0, 3609.0, 8897.0, 23266.0, 119371.0, 826242.0, 38772.0, 14144.0, 5490.0, 2407.0, 1124.0, 623.0, 315.0, 192.0, 136.0, 99.0, 68.0, 50.0, 38.0, 27.0, 18.0, 20.0, 16.0, 7.0, 10.0, 8.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.109375, -5.91986083984375, -5.7303466796875, -5.54083251953125, -5.351318359375, -5.16180419921875, -4.9722900390625, -4.78277587890625, -4.59326171875, -4.40374755859375, -4.2142333984375, -4.02471923828125, -3.835205078125, -3.64569091796875, -3.4561767578125, -3.26666259765625, -3.0771484375, -2.88763427734375, -2.6981201171875, -2.50860595703125, -2.319091796875, -2.12957763671875, -1.9400634765625, -1.75054931640625, -1.56103515625, -1.37152099609375, -1.1820068359375, -0.99249267578125, -0.802978515625, -0.61346435546875, -0.4239501953125, -0.23443603515625, -0.044921875, 0.14459228515625, 0.3341064453125, 0.52362060546875, 0.713134765625, 0.90264892578125, 1.0921630859375, 1.28167724609375, 1.47119140625, 1.66070556640625, 1.8502197265625, 2.03973388671875, 2.229248046875, 2.41876220703125, 2.6082763671875, 2.79779052734375, 2.9873046875, 3.17681884765625, 3.3663330078125, 3.55584716796875, 3.745361328125, 3.93487548828125, 4.1243896484375, 4.31390380859375, 4.50341796875, 4.69293212890625, 4.8824462890625, 5.07196044921875, 5.261474609375, 5.45098876953125, 5.6405029296875, 5.83001708984375, 6.01953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 7.0, 7.0, 9.0, 10.0, 15.0, 12.0, 17.0, 20.0, 37.0, 34.0, 25.0, 38.0, 30.0, 27.0, 35.0, 47.0, 43.0, 36.0, 35.0, 46.0, 48.0, 42.0, 36.0, 38.0, 31.0, 36.0, 28.0, 23.0, 25.0, 27.0, 17.0, 15.0, 15.0, 12.0, 13.0, 7.0, 10.0, 10.0, 7.0, 5.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.203125, -3.09466552734375, -2.9862060546875, -2.87774658203125, -2.769287109375, -2.66082763671875, -2.5523681640625, -2.44390869140625, -2.33544921875, -2.22698974609375, -2.1185302734375, -2.01007080078125, -1.901611328125, -1.79315185546875, -1.6846923828125, -1.57623291015625, -1.4677734375, -1.35931396484375, -1.2508544921875, -1.14239501953125, -1.033935546875, -0.92547607421875, -0.8170166015625, -0.70855712890625, -0.60009765625, -0.49163818359375, -0.3831787109375, -0.27471923828125, -0.166259765625, -0.05780029296875, 0.0506591796875, 0.15911865234375, 0.267578125, 0.37603759765625, 0.4844970703125, 0.59295654296875, 0.701416015625, 0.80987548828125, 0.9183349609375, 1.02679443359375, 1.13525390625, 1.24371337890625, 1.3521728515625, 1.46063232421875, 1.569091796875, 1.67755126953125, 1.7860107421875, 1.89447021484375, 2.0029296875, 2.11138916015625, 2.2198486328125, 2.32830810546875, 2.436767578125, 2.54522705078125, 2.6536865234375, 2.76214599609375, 2.87060546875, 2.97906494140625, 3.0875244140625, 3.19598388671875, 3.304443359375, 3.41290283203125, 3.5213623046875, 3.62982177734375, 3.73828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 3.0, 6.0, 21.0, 12.0, 27.0, 30.0, 51.0, 77.0, 130.0, 214.0, 353.0, 662.0, 1246.0, 2230.0, 4236.0, 8522.0, 18239.0, 51969.0, 801916.0, 112462.0, 24014.0, 10848.0, 5231.0, 2777.0, 1418.0, 779.0, 437.0, 246.0, 121.0, 85.0, 59.0, 40.0, 27.0, 19.0, 10.0, 8.0, 5.0, 7.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.40869140625, -0.39443206787109375, -0.3801727294921875, -0.36591339111328125, -0.351654052734375, -0.33739471435546875, -0.3231353759765625, -0.30887603759765625, -0.29461669921875, -0.28035736083984375, -0.2660980224609375, -0.25183868408203125, -0.237579345703125, -0.22332000732421875, -0.2090606689453125, -0.19480133056640625, -0.1805419921875, -0.16628265380859375, -0.1520233154296875, -0.13776397705078125, -0.123504638671875, -0.10924530029296875, -0.0949859619140625, -0.08072662353515625, -0.06646728515625, -0.05220794677734375, -0.0379486083984375, -0.02368927001953125, -0.009429931640625, 0.00482940673828125, 0.0190887451171875, 0.03334808349609375, 0.047607421875, 0.06186676025390625, 0.0761260986328125, 0.09038543701171875, 0.104644775390625, 0.11890411376953125, 0.1331634521484375, 0.14742279052734375, 0.16168212890625, 0.17594146728515625, 0.1902008056640625, 0.20446014404296875, 0.218719482421875, 0.23297882080078125, 0.2472381591796875, 0.26149749755859375, 0.2757568359375, 0.29001617431640625, 0.3042755126953125, 0.31853485107421875, 0.332794189453125, 0.34705352783203125, 0.3613128662109375, 0.37557220458984375, 0.38983154296875, 0.40409088134765625, 0.4183502197265625, 0.43260955810546875, 0.446868896484375, 0.46112823486328125, 0.4753875732421875, 0.48964691162109375, 0.50390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 13.0, 8.0, 14.0, 8.0, 20.0, 18.0, 32.0, 34.0, 40.0, 24.0, 47.0, 62.0, 49.0, 62.0, 59.0, 63.0, 48.0, 43.0, 62.0, 67.0, 48.0, 26.0, 36.0, 24.0, 21.0, 11.0, 6.0, 10.0, 5.0, 8.0, 8.0, 5.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6372413635253906e-05, -4.4959597289562225e-05, -4.3546780943870544e-05, -4.2133964598178864e-05, -4.072114825248718e-05, -3.93083319067955e-05, -3.789551556110382e-05, -3.648269921541214e-05, -3.506988286972046e-05, -3.365706652402878e-05, -3.22442501783371e-05, -3.0831433832645416e-05, -2.9418617486953735e-05, -2.8005801141262054e-05, -2.6592984795570374e-05, -2.5180168449878693e-05, -2.3767352104187012e-05, -2.235453575849533e-05, -2.094171941280365e-05, -1.952890306711197e-05, -1.8116086721420288e-05, -1.6703270375728607e-05, -1.5290454030036926e-05, -1.3877637684345245e-05, -1.2464821338653564e-05, -1.1052004992961884e-05, -9.639188647270203e-06, -8.226372301578522e-06, -6.813555955886841e-06, -5.40073961019516e-06, -3.987923264503479e-06, -2.575106918811798e-06, -1.1622905731201172e-06, 2.505257725715637e-07, 1.6633421182632446e-06, 3.0761584639549255e-06, 4.4889748096466064e-06, 5.901791155338287e-06, 7.314607501029968e-06, 8.72742384672165e-06, 1.014024019241333e-05, 1.1553056538105011e-05, 1.2965872883796692e-05, 1.4378689229488373e-05, 1.5791505575180054e-05, 1.7204321920871735e-05, 1.8617138266563416e-05, 2.0029954612255096e-05, 2.1442770957946777e-05, 2.2855587303638458e-05, 2.426840364933014e-05, 2.568121999502182e-05, 2.70940363407135e-05, 2.8506852686405182e-05, 2.9919669032096863e-05, 3.1332485377788544e-05, 3.2745301723480225e-05, 3.4158118069171906e-05, 3.5570934414863586e-05, 3.698375076055527e-05, 3.839656710624695e-05, 3.980938345193863e-05, 4.122219979763031e-05, 4.263501614332199e-05, 4.404783248901367e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 7.0, 19.0, 35.0, 48.0, 55.0, 80.0, 116.0, 170.0, 220.0, 311.0, 427.0, 598.0, 817.0, 1188.0, 1655.0, 2766.0, 4906.0, 9767.0, 21568.0, 50175.0, 112816.0, 213805.0, 265600.0, 188693.0, 93724.0, 40524.0, 17849.0, 8422.0, 4420.0, 2445.0, 1553.0, 1052.0, 790.0, 517.0, 374.0, 288.0, 206.0, 171.0, 104.0, 86.0, 46.0, 43.0, 33.0, 16.0, 18.0, 10.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.396484375, -0.38385009765625, -0.3712158203125, -0.35858154296875, -0.345947265625, -0.33331298828125, -0.3206787109375, -0.30804443359375, -0.29541015625, -0.28277587890625, -0.2701416015625, -0.25750732421875, -0.244873046875, -0.23223876953125, -0.2196044921875, -0.20697021484375, -0.1943359375, -0.18170166015625, -0.1690673828125, -0.15643310546875, -0.143798828125, -0.13116455078125, -0.1185302734375, -0.10589599609375, -0.09326171875, -0.08062744140625, -0.0679931640625, -0.05535888671875, -0.042724609375, -0.03009033203125, -0.0174560546875, -0.00482177734375, 0.0078125, 0.02044677734375, 0.0330810546875, 0.04571533203125, 0.058349609375, 0.07098388671875, 0.0836181640625, 0.09625244140625, 0.10888671875, 0.12152099609375, 0.1341552734375, 0.14678955078125, 0.159423828125, 0.17205810546875, 0.1846923828125, 0.19732666015625, 0.2099609375, 0.22259521484375, 0.2352294921875, 0.24786376953125, 0.260498046875, 0.27313232421875, 0.2857666015625, 0.29840087890625, 0.31103515625, 0.32366943359375, 0.3363037109375, 0.34893798828125, 0.361572265625, 0.37420654296875, 0.3868408203125, 0.39947509765625, 0.412109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 11.0, 20.0, 12.0, 12.0, 22.0, 17.0, 28.0, 31.0, 36.0, 28.0, 33.0, 48.0, 39.0, 50.0, 42.0, 41.0, 55.0, 43.0, 43.0, 45.0, 43.0, 46.0, 32.0, 28.0, 28.0, 28.0, 21.0, 14.0, 14.0, 13.0, 10.0, 5.0, 7.0, 4.0, 10.0, 8.0, 5.0, 4.0, 8.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0882568359375, -0.08521842956542969, -0.08218002319335938, -0.07914161682128906, -0.07610321044921875, -0.07306480407714844, -0.07002639770507812, -0.06698799133300781, -0.0639495849609375, -0.06091117858886719, -0.057872772216796875, -0.05483436584472656, -0.05179595947265625, -0.04875755310058594, -0.045719146728515625, -0.04268074035644531, -0.039642333984375, -0.03660392761230469, -0.033565521240234375, -0.030527114868164062, -0.02748870849609375, -0.024450302124023438, -0.021411895751953125, -0.018373489379882812, -0.0153350830078125, -0.012296676635742188, -0.009258270263671875, -0.0062198638916015625, -0.00318145751953125, -0.0001430511474609375, 0.002895355224609375, 0.0059337615966796875, 0.00897216796875, 0.012010574340820312, 0.015048980712890625, 0.018087387084960938, 0.02112579345703125, 0.024164199829101562, 0.027202606201171875, 0.030241012573242188, 0.0332794189453125, 0.03631782531738281, 0.039356231689453125, 0.04239463806152344, 0.04543304443359375, 0.04847145080566406, 0.051509857177734375, 0.05454826354980469, 0.057586669921875, 0.06062507629394531, 0.06366348266601562, 0.06670188903808594, 0.06974029541015625, 0.07277870178222656, 0.07581710815429688, 0.07885551452636719, 0.0818939208984375, 0.08493232727050781, 0.08797073364257812, 0.09100914001464844, 0.09404754638671875, 0.09708595275878906, 0.10012435913085938, 0.10316276550292969, 0.106201171875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 4.0, 6.0, 3.0, 9.0, 9.0, 9.0, 12.0, 15.0, 18.0, 21.0, 19.0, 19.0, 27.0, 51.0, 43.0, 47.0, 34.0, 25.0, 30.0, 39.0, 37.0, 33.0, 41.0, 39.0, 39.0, 31.0, 35.0, 32.0, 30.0, 33.0, 22.0, 19.0, 24.0, 15.0, 17.0, 15.0, 17.0, 15.0, 9.0, 10.0, 10.0, 9.0, 7.0, 10.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3780593872070312, -3.2601850032806396, -3.142310619354248, -3.0244364738464355, -2.906562089920044, -2.7886877059936523, -2.6708133220672607, -2.552938938140869, -2.4350645542144775, -2.317190170288086, -2.1993157863616943, -2.0814414024353027, -1.9635671377182007, -1.8456928730010986, -1.727818489074707, -1.6099441051483154, -1.4920698404312134, -1.3741954565048218, -1.2563211917877197, -1.1384468078613281, -1.0205724239349365, -0.9026980996131897, -0.7848237752914429, -0.6669493913650513, -0.5490750670433044, -0.43120071291923523, -0.313326358795166, -0.1954520344734192, -0.07757768034934998, 0.04029667377471924, 0.15817099809646606, 0.27604538202285767, 0.3939197063446045, 0.5117940306663513, 0.6296684145927429, 0.7475427389144897, 0.8654171228408813, 0.9832914471626282, 1.101165771484375, 1.2190401554107666, 1.3369145393371582, 1.4547889232635498, 1.5726631879806519, 1.6905375719070435, 1.808411955833435, 1.926286220550537, 2.0441606044769287, 2.1620349884033203, 2.279909133911133, 2.3977835178375244, 2.515657901763916, 2.6335320472717285, 2.75140643119812, 2.8692808151245117, 2.9871551990509033, 3.105029582977295, 3.2229039669036865, 3.340778350830078, 3.4586527347564697, 3.5765271186828613, 3.694401264190674, 3.8122756481170654, 3.930150032043457, 4.0480241775512695, 4.16589879989624]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 1.0, 6.0, 5.0, 2.0, 9.0, 8.0, 8.0, 12.0, 10.0, 13.0, 20.0, 21.0, 22.0, 18.0, 14.0, 19.0, 28.0, 36.0, 39.0, 41.0, 29.0, 35.0, 36.0, 30.0, 33.0, 37.0, 43.0, 33.0, 26.0, 39.0, 34.0, 27.0, 27.0, 26.0, 22.0, 26.0, 29.0, 19.0, 25.0, 14.0, 22.0, 8.0, 11.0, 6.0, 7.0, 6.0, 5.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.3891425132751465, -4.255234241485596, -4.121325492858887, -3.987417221069336, -3.853508949279785, -3.7196004390716553, -3.5856919288635254, -3.4517836570739746, -3.3178751468658447, -3.183966636657715, -3.050058364868164, -2.916149854660034, -2.7822413444519043, -2.6483330726623535, -2.5144245624542236, -2.3805160522460938, -2.246607780456543, -2.112699270248413, -1.9787909984588623, -1.8448824882507324, -1.710974097251892, -1.5770657062530518, -1.4431571960449219, -1.3092488050460815, -1.1753404140472412, -1.0414320230484009, -0.9075235724449158, -0.7736151218414307, -0.6397067308425903, -0.50579833984375, -0.3718898892402649, -0.23798143863677979, -0.10407257080078125, 0.02983585000038147, 0.1637442708015442, 0.2976526916027069, 0.43156111240386963, 0.56546950340271, 0.6993779540061951, 0.8332864046096802, 0.9671947956085205, 1.1011031866073608, 1.2350115776062012, 1.368920087814331, 1.5028284788131714, 1.6367368698120117, 1.7706453800201416, 1.904553771018982, 2.0384621620178223, 2.172370672225952, 2.306278944015503, 2.440187454223633, 2.5740957260131836, 2.7080042362213135, 2.8419127464294434, 2.975821018218994, 3.109729528427124, 3.243638038635254, 3.3775463104248047, 3.5114548206329346, 3.6453633308410645, 3.7792716026306152, 3.913180112838745, 4.047088623046875, 4.180996894836426]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 3.0, 10.0, 30.0, 17.0, 40.0, 66.0, 97.0, 172.0, 243.0, 421.0, 647.0, 1065.0, 1763.0, 2789.0, 4507.0, 6898.0, 10767.0, 16787.0, 25268.0, 36930.0, 52301.0, 69655.0, 89944.0, 105618.0, 114439.0, 113542.0, 101634.0, 84005.0, 65302.0, 47245.0, 33350.0, 22409.0, 14731.0, 9495.0, 6012.0, 3886.0, 2470.0, 1520.0, 953.0, 555.0, 397.0, 235.0, 135.0, 69.0, 47.0, 39.0, 17.0, 14.0, 9.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.068359375, -2.9749755859375, -2.881591796875, -2.7882080078125, -2.69482421875, -2.6014404296875, -2.508056640625, -2.4146728515625, -2.3212890625, -2.2279052734375, -2.134521484375, -2.0411376953125, -1.94775390625, -1.8543701171875, -1.760986328125, -1.6676025390625, -1.57421875, -1.4808349609375, -1.387451171875, -1.2940673828125, -1.20068359375, -1.1072998046875, -1.013916015625, -0.9205322265625, -0.8271484375, -0.7337646484375, -0.640380859375, -0.5469970703125, -0.45361328125, -0.3602294921875, -0.266845703125, -0.1734619140625, -0.080078125, 0.0133056640625, 0.106689453125, 0.2000732421875, 0.29345703125, 0.3868408203125, 0.480224609375, 0.5736083984375, 0.6669921875, 0.7603759765625, 0.853759765625, 0.9471435546875, 1.04052734375, 1.1339111328125, 1.227294921875, 1.3206787109375, 1.4140625, 1.5074462890625, 1.600830078125, 1.6942138671875, 1.78759765625, 1.8809814453125, 1.974365234375, 2.0677490234375, 2.1611328125, 2.2545166015625, 2.347900390625, 2.4412841796875, 2.53466796875, 2.6280517578125, 2.721435546875, 2.8148193359375, 2.908203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 6.0, 9.0, 6.0, 13.0, 13.0, 15.0, 21.0, 20.0, 24.0, 22.0, 37.0, 33.0, 36.0, 41.0, 38.0, 52.0, 42.0, 35.0, 49.0, 56.0, 42.0, 35.0, 38.0, 35.0, 33.0, 36.0, 25.0, 32.0, 23.0, 24.0, 19.0, 16.0, 11.0, 14.0, 11.0, 6.0, 6.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0234375, -4.86224365234375, -4.7010498046875, -4.53985595703125, -4.378662109375, -4.21746826171875, -4.0562744140625, -3.89508056640625, -3.73388671875, -3.57269287109375, -3.4114990234375, -3.25030517578125, -3.089111328125, -2.92791748046875, -2.7667236328125, -2.60552978515625, -2.4443359375, -2.28314208984375, -2.1219482421875, -1.96075439453125, -1.799560546875, -1.63836669921875, -1.4771728515625, -1.31597900390625, -1.15478515625, -0.99359130859375, -0.8323974609375, -0.67120361328125, -0.510009765625, -0.34881591796875, -0.1876220703125, -0.02642822265625, 0.134765625, 0.29595947265625, 0.4571533203125, 0.61834716796875, 0.779541015625, 0.94073486328125, 1.1019287109375, 1.26312255859375, 1.42431640625, 1.58551025390625, 1.7467041015625, 1.90789794921875, 2.069091796875, 2.23028564453125, 2.3914794921875, 2.55267333984375, 2.7138671875, 2.87506103515625, 3.0362548828125, 3.19744873046875, 3.358642578125, 3.51983642578125, 3.6810302734375, 3.84222412109375, 4.00341796875, 4.16461181640625, 4.3258056640625, 4.48699951171875, 4.648193359375, 4.80938720703125, 4.9705810546875, 5.13177490234375, 5.29296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 11.0, 18.0, 33.0, 47.0, 68.0, 81.0, 157.0, 236.0, 362.0, 581.0, 896.0, 1433.0, 2168.0, 3302.0, 5152.0, 7551.0, 11490.0, 16769.0, 24385.0, 34528.0, 47306.0, 63168.0, 79733.0, 95106.0, 104004.0, 106459.0, 100275.0, 87543.0, 70812.0, 54795.0, 40478.0, 28684.0, 20269.0, 13727.0, 9309.0, 6171.0, 4114.0, 2596.0, 1647.0, 1065.0, 759.0, 445.0, 329.0, 214.0, 99.0, 72.0, 48.0, 23.0, 11.0, 11.0, 2.0, 7.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.001953125, -2.905853271484375, -2.80975341796875, -2.713653564453125, -2.6175537109375, -2.521453857421875, -2.42535400390625, -2.329254150390625, -2.233154296875, -2.137054443359375, -2.04095458984375, -1.944854736328125, -1.8487548828125, -1.752655029296875, -1.65655517578125, -1.560455322265625, -1.46435546875, -1.368255615234375, -1.27215576171875, -1.176055908203125, -1.0799560546875, -0.983856201171875, -0.88775634765625, -0.791656494140625, -0.695556640625, -0.599456787109375, -0.50335693359375, -0.407257080078125, -0.3111572265625, -0.215057373046875, -0.11895751953125, -0.022857666015625, 0.0732421875, 0.169342041015625, 0.26544189453125, 0.361541748046875, 0.4576416015625, 0.553741455078125, 0.64984130859375, 0.745941162109375, 0.842041015625, 0.938140869140625, 1.03424072265625, 1.130340576171875, 1.2264404296875, 1.322540283203125, 1.41864013671875, 1.514739990234375, 1.61083984375, 1.706939697265625, 1.80303955078125, 1.899139404296875, 1.9952392578125, 2.091339111328125, 2.18743896484375, 2.283538818359375, 2.379638671875, 2.475738525390625, 2.57183837890625, 2.667938232421875, 2.7640380859375, 2.860137939453125, 2.95623779296875, 3.052337646484375, 3.1484375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 4.0, 6.0, 3.0, 12.0, 13.0, 20.0, 17.0, 25.0, 25.0, 19.0, 26.0, 16.0, 22.0, 31.0, 42.0, 33.0, 32.0, 40.0, 39.0, 42.0, 41.0, 33.0, 38.0, 45.0, 36.0, 33.0, 29.0, 30.0, 39.0, 36.0, 23.0, 21.0, 32.0, 14.0, 13.0, 11.0, 15.0, 9.0, 8.0, 7.0, 6.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.65234375, -2.556671142578125, -2.46099853515625, -2.365325927734375, -2.2696533203125, -2.173980712890625, -2.07830810546875, -1.982635498046875, -1.886962890625, -1.791290283203125, -1.69561767578125, -1.599945068359375, -1.5042724609375, -1.408599853515625, -1.31292724609375, -1.217254638671875, -1.12158203125, -1.025909423828125, -0.93023681640625, -0.834564208984375, -0.7388916015625, -0.643218994140625, -0.54754638671875, -0.451873779296875, -0.356201171875, -0.260528564453125, -0.16485595703125, -0.069183349609375, 0.0264892578125, 0.122161865234375, 0.21783447265625, 0.313507080078125, 0.4091796875, 0.504852294921875, 0.60052490234375, 0.696197509765625, 0.7918701171875, 0.887542724609375, 0.98321533203125, 1.078887939453125, 1.174560546875, 1.270233154296875, 1.36590576171875, 1.461578369140625, 1.5572509765625, 1.652923583984375, 1.74859619140625, 1.844268798828125, 1.93994140625, 2.035614013671875, 2.13128662109375, 2.226959228515625, 2.3226318359375, 2.418304443359375, 2.51397705078125, 2.609649658203125, 2.705322265625, 2.800994873046875, 2.89666748046875, 2.992340087890625, 3.0880126953125, 3.183685302734375, 3.27935791015625, 3.375030517578125, 3.470703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 13.0, 12.0, 11.0, 35.0, 34.0, 72.0, 82.0, 135.0, 213.0, 355.0, 528.0, 906.0, 1381.0, 2311.0, 3853.0, 6629.0, 10959.0, 18487.0, 30995.0, 50746.0, 78785.0, 111933.0, 141298.0, 152411.0, 137725.0, 106937.0, 73696.0, 46573.0, 28389.0, 17394.0, 10237.0, 6028.0, 3648.0, 2168.0, 1322.0, 827.0, 507.0, 286.0, 187.0, 143.0, 95.0, 57.0, 35.0, 28.0, 27.0, 15.0, 15.0, 7.0, 10.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.4716796875, -1.421661376953125, -1.37164306640625, -1.321624755859375, -1.2716064453125, -1.221588134765625, -1.17156982421875, -1.121551513671875, -1.071533203125, -1.021514892578125, -0.97149658203125, -0.921478271484375, -0.8714599609375, -0.821441650390625, -0.77142333984375, -0.721405029296875, -0.67138671875, -0.621368408203125, -0.57135009765625, -0.521331787109375, -0.4713134765625, -0.421295166015625, -0.37127685546875, -0.321258544921875, -0.271240234375, -0.221221923828125, -0.17120361328125, -0.121185302734375, -0.0711669921875, -0.021148681640625, 0.02886962890625, 0.078887939453125, 0.12890625, 0.178924560546875, 0.22894287109375, 0.278961181640625, 0.3289794921875, 0.378997802734375, 0.42901611328125, 0.479034423828125, 0.529052734375, 0.579071044921875, 0.62908935546875, 0.679107666015625, 0.7291259765625, 0.779144287109375, 0.82916259765625, 0.879180908203125, 0.92919921875, 0.979217529296875, 1.02923583984375, 1.079254150390625, 1.1292724609375, 1.179290771484375, 1.22930908203125, 1.279327392578125, 1.329345703125, 1.379364013671875, 1.42938232421875, 1.479400634765625, 1.5294189453125, 1.579437255859375, 1.62945556640625, 1.679473876953125, 1.7294921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 7.0, 10.0, 11.0, 11.0, 15.0, 17.0, 18.0, 30.0, 34.0, 22.0, 29.0, 37.0, 44.0, 49.0, 39.0, 53.0, 50.0, 46.0, 57.0, 55.0, 58.0, 46.0, 42.0, 27.0, 29.0, 31.0, 26.0, 25.0, 14.0, 14.0, 8.0, 13.0, 7.0, 0.0, 5.0, 0.0, 7.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001494884490966797, -0.00014436990022659302, -0.00013925135135650635, -0.00013413280248641968, -0.000129014253616333, -0.00012389570474624634, -0.00011877715587615967, -0.000113658607006073, -0.00010854005813598633, -0.00010342150926589966, -9.830296039581299e-05, -9.318441152572632e-05, -8.806586265563965e-05, -8.294731378555298e-05, -7.782876491546631e-05, -7.271021604537964e-05, -6.759166717529297e-05, -6.24731183052063e-05, -5.735456943511963e-05, -5.223602056503296e-05, -4.711747169494629e-05, -4.199892282485962e-05, -3.688037395477295e-05, -3.176182508468628e-05, -2.664327621459961e-05, -2.152472734451294e-05, -1.640617847442627e-05, -1.12876296043396e-05, -6.16908073425293e-06, -1.0505318641662598e-06, 4.06801700592041e-06, 9.18656587600708e-06, 1.430511474609375e-05, 1.942366361618042e-05, 2.454221248626709e-05, 2.966076135635376e-05, 3.477931022644043e-05, 3.98978590965271e-05, 4.501640796661377e-05, 5.013495683670044e-05, 5.525350570678711e-05, 6.037205457687378e-05, 6.549060344696045e-05, 7.060915231704712e-05, 7.572770118713379e-05, 8.084625005722046e-05, 8.596479892730713e-05, 9.10833477973938e-05, 9.620189666748047e-05, 0.00010132044553756714, 0.00010643899440765381, 0.00011155754327774048, 0.00011667609214782715, 0.00012179464101791382, 0.0001269131898880005, 0.00013203173875808716, 0.00013715028762817383, 0.0001422688364982605, 0.00014738738536834717, 0.00015250593423843384, 0.0001576244831085205, 0.00016274303197860718, 0.00016786158084869385, 0.00017298012971878052, 0.0001780986785888672]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 9.0, 14.0, 25.0, 35.0, 52.0, 54.0, 112.0, 155.0, 261.0, 474.0, 792.0, 1304.0, 2457.0, 4616.0, 8452.0, 15134.0, 27821.0, 48385.0, 79165.0, 118232.0, 153307.0, 165353.0, 145404.0, 108907.0, 71074.0, 42487.0, 24471.0, 13545.0, 7395.0, 3924.0, 2262.0, 1227.0, 688.0, 384.0, 213.0, 135.0, 76.0, 56.0, 30.0, 27.0, 14.0, 10.0, 11.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7275390625, -1.6741943359375, -1.620849609375, -1.5675048828125, -1.51416015625, -1.4608154296875, -1.407470703125, -1.3541259765625, -1.30078125, -1.2474365234375, -1.194091796875, -1.1407470703125, -1.08740234375, -1.0340576171875, -0.980712890625, -0.9273681640625, -0.8740234375, -0.8206787109375, -0.767333984375, -0.7139892578125, -0.66064453125, -0.6072998046875, -0.553955078125, -0.5006103515625, -0.447265625, -0.3939208984375, -0.340576171875, -0.2872314453125, -0.23388671875, -0.1805419921875, -0.127197265625, -0.0738525390625, -0.0205078125, 0.0328369140625, 0.086181640625, 0.1395263671875, 0.19287109375, 0.2462158203125, 0.299560546875, 0.3529052734375, 0.40625, 0.4595947265625, 0.512939453125, 0.5662841796875, 0.61962890625, 0.6729736328125, 0.726318359375, 0.7796630859375, 0.8330078125, 0.8863525390625, 0.939697265625, 0.9930419921875, 1.04638671875, 1.0997314453125, 1.153076171875, 1.2064208984375, 1.259765625, 1.3131103515625, 1.366455078125, 1.4197998046875, 1.47314453125, 1.5264892578125, 1.579833984375, 1.6331787109375, 1.6865234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 3.0, 8.0, 9.0, 12.0, 11.0, 26.0, 22.0, 27.0, 38.0, 31.0, 49.0, 45.0, 47.0, 62.0, 78.0, 73.0, 68.0, 45.0, 61.0, 44.0, 32.0, 37.0, 32.0, 34.0, 21.0, 21.0, 13.0, 14.0, 9.0, 14.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7320785522460938, -0.7068328857421875, -0.6815872192382812, -0.656341552734375, -0.6310958862304688, -0.6058502197265625, -0.5806045532226562, -0.55535888671875, -0.5301132202148438, -0.5048675537109375, -0.47962188720703125, -0.454376220703125, -0.42913055419921875, -0.4038848876953125, -0.37863922119140625, -0.3533935546875, -0.32814788818359375, -0.3029022216796875, -0.27765655517578125, -0.252410888671875, -0.22716522216796875, -0.2019195556640625, -0.17667388916015625, -0.15142822265625, -0.12618255615234375, -0.1009368896484375, -0.07569122314453125, -0.050445556640625, -0.02519989013671875, 4.57763671875e-05, 0.02529144287109375, 0.050537109375, 0.07578277587890625, 0.1010284423828125, 0.12627410888671875, 0.151519775390625, 0.17676544189453125, 0.2020111083984375, 0.22725677490234375, 0.25250244140625, 0.27774810791015625, 0.3029937744140625, 0.32823944091796875, 0.353485107421875, 0.37873077392578125, 0.4039764404296875, 0.42922210693359375, 0.4544677734375, 0.47971343994140625, 0.5049591064453125, 0.5302047729492188, 0.555450439453125, 0.5806961059570312, 0.6059417724609375, 0.6311874389648438, 0.65643310546875, 0.6816787719726562, 0.7069244384765625, 0.7321701049804688, 0.757415771484375, 0.7826614379882812, 0.8079071044921875, 0.8331527709960938, 0.8583984375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 4.0, 11.0, 8.0, 6.0, 9.0, 8.0, 12.0, 18.0, 18.0, 25.0, 24.0, 25.0, 25.0, 33.0, 29.0, 37.0, 39.0, 36.0, 43.0, 30.0, 42.0, 37.0, 34.0, 33.0, 37.0, 37.0, 29.0, 28.0, 41.0, 28.0, 29.0, 20.0, 19.0, 16.0, 16.0, 15.0, 12.0, 9.0, 12.0, 15.0, 11.0, 9.0, 7.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.447143793106079, -3.3342535495758057, -3.2213635444641113, -3.108473300933838, -2.9955830574035645, -2.88269305229187, -2.7698028087615967, -2.6569128036499023, -2.544022560119629, -2.4311323165893555, -2.318242311477661, -2.2053520679473877, -2.0924620628356934, -1.97957181930542, -1.8666815757751465, -1.7537914514541626, -1.6409013271331787, -1.5280112028121948, -1.415121078491211, -1.3022308349609375, -1.1893407106399536, -1.0764505863189697, -0.9635604023933411, -0.8506702184677124, -0.7377800941467285, -0.6248899698257446, -0.511999785900116, -0.3991096317768097, -0.2862194776535034, -0.17332935333251953, -0.06043916940689087, 0.05245101451873779, 0.16534090042114258, 0.27823105454444885, 0.3911212086677551, 0.5040113925933838, 0.6169015169143677, 0.7297916412353516, 0.8426818251609802, 0.9555720090866089, 1.0684621334075928, 1.1813522577285767, 1.2942423820495605, 1.407132625579834, 1.5200227499008179, 1.6329128742218018, 1.7458031177520752, 1.858693242073059, 1.971583366394043, 2.0844736099243164, 2.1973636150360107, 2.310253858566284, 2.4231438636779785, 2.536034107208252, 2.6489243507385254, 2.761814594268799, 2.874704599380493, 2.9875948429107666, 3.100484848022461, 3.2133750915527344, 3.326265335083008, 3.439155340194702, 3.5520455837249756, 3.66493558883667, 3.7778258323669434]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 5.0, 6.0, 6.0, 14.0, 11.0, 17.0, 16.0, 17.0, 14.0, 16.0, 26.0, 28.0, 27.0, 33.0, 29.0, 33.0, 26.0, 31.0, 31.0, 31.0, 43.0, 30.0, 38.0, 32.0, 47.0, 30.0, 30.0, 31.0, 25.0, 16.0, 26.0, 23.0, 31.0, 27.0, 29.0, 22.0, 13.0, 9.0, 12.0, 10.0, 11.0, 7.0, 9.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.207154750823975, -4.070943832397461, -3.9347333908081055, -3.798522710800171, -3.6623120307922363, -3.5261011123657227, -3.389890432357788, -3.2536797523498535, -3.117469072341919, -2.9812583923339844, -2.84504771232605, -2.7088370323181152, -2.5726261138916016, -2.436415672302246, -2.3002047538757324, -2.163994073867798, -2.0277833938598633, -1.8915727138519287, -1.7553620338439941, -1.61915123462677, -1.4829405546188354, -1.3467298746109009, -1.2105190753936768, -1.0743083953857422, -0.9380977153778076, -0.801887035369873, -0.6656762957572937, -0.5294655561447144, -0.3932548761367798, -0.2570441961288452, -0.12083345651626587, 0.015377283096313477, 0.15158796310424805, 0.287798672914505, 0.42400938272476196, 0.5602201223373413, 0.6964308023452759, 0.8326414823532104, 0.9688522219657898, 1.1050629615783691, 1.2412736415863037, 1.3774843215942383, 1.5136950016021729, 1.649905800819397, 1.7861164808273315, 1.9223271608352661, 2.0585379600524902, 2.194748640060425, 2.3309593200683594, 2.467170000076294, 2.6033806800842285, 2.739591360092163, 2.8758020401000977, 3.0120129585266113, 3.148223638534546, 3.2844343185424805, 3.420644998550415, 3.5568556785583496, 3.693066358566284, 3.8292770385742188, 3.9654879570007324, 4.101698398590088, 4.237909317016602, 4.374119758605957, 4.510330677032471]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 12.0, 12.0, 25.0, 24.0, 33.0, 53.0, 76.0, 158.0, 207.0, 295.0, 463.0, 757.0, 1177.0, 1905.0, 3049.0, 5296.0, 8697.0, 15358.0, 27478.0, 49645.0, 93265.0, 175775.0, 320245.0, 525392.0, 712090.0, 751591.0, 609597.0, 398700.0, 227375.0, 120320.0, 64083.0, 34742.0, 19398.0, 10945.0, 6339.0, 3790.0, 2236.0, 1391.0, 816.0, 538.0, 316.0, 233.0, 126.0, 90.0, 50.0, 40.0, 20.0, 21.0, 15.0, 9.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0], "bins": [-3.884765625, -3.76776123046875, -3.6507568359375, -3.53375244140625, -3.416748046875, -3.29974365234375, -3.1827392578125, -3.06573486328125, -2.94873046875, -2.83172607421875, -2.7147216796875, -2.59771728515625, -2.480712890625, -2.36370849609375, -2.2467041015625, -2.12969970703125, -2.0126953125, -1.89569091796875, -1.7786865234375, -1.66168212890625, -1.544677734375, -1.42767333984375, -1.3106689453125, -1.19366455078125, -1.07666015625, -0.95965576171875, -0.8426513671875, -0.72564697265625, -0.608642578125, -0.49163818359375, -0.3746337890625, -0.25762939453125, -0.140625, -0.02362060546875, 0.0933837890625, 0.21038818359375, 0.327392578125, 0.44439697265625, 0.5614013671875, 0.67840576171875, 0.79541015625, 0.91241455078125, 1.0294189453125, 1.14642333984375, 1.263427734375, 1.38043212890625, 1.4974365234375, 1.61444091796875, 1.7314453125, 1.84844970703125, 1.9654541015625, 2.08245849609375, 2.199462890625, 2.31646728515625, 2.4334716796875, 2.55047607421875, 2.66748046875, 2.78448486328125, 2.9014892578125, 3.01849365234375, 3.135498046875, 3.25250244140625, 3.3695068359375, 3.48651123046875, 3.603515625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 8.0, 9.0, 8.0, 12.0, 10.0, 16.0, 15.0, 19.0, 24.0, 19.0, 21.0, 28.0, 22.0, 25.0, 29.0, 40.0, 37.0, 33.0, 30.0, 33.0, 40.0, 44.0, 35.0, 42.0, 39.0, 35.0, 40.0, 32.0, 23.0, 31.0, 22.0, 28.0, 27.0, 20.0, 17.0, 14.0, 11.0, 7.0, 12.0, 10.0, 9.0, 6.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.990234375, -3.863128662109375, -3.73602294921875, -3.608917236328125, -3.4818115234375, -3.354705810546875, -3.22760009765625, -3.100494384765625, -2.973388671875, -2.846282958984375, -2.71917724609375, -2.592071533203125, -2.4649658203125, -2.337860107421875, -2.21075439453125, -2.083648681640625, -1.95654296875, -1.829437255859375, -1.70233154296875, -1.575225830078125, -1.4481201171875, -1.321014404296875, -1.19390869140625, -1.066802978515625, -0.939697265625, -0.812591552734375, -0.68548583984375, -0.558380126953125, -0.4312744140625, -0.304168701171875, -0.17706298828125, -0.049957275390625, 0.0771484375, 0.204254150390625, 0.33135986328125, 0.458465576171875, 0.5855712890625, 0.712677001953125, 0.83978271484375, 0.966888427734375, 1.093994140625, 1.221099853515625, 1.34820556640625, 1.475311279296875, 1.6024169921875, 1.729522705078125, 1.85662841796875, 1.983734130859375, 2.11083984375, 2.237945556640625, 2.36505126953125, 2.492156982421875, 2.6192626953125, 2.746368408203125, 2.87347412109375, 3.000579833984375, 3.127685546875, 3.254791259765625, 3.38189697265625, 3.509002685546875, 3.6361083984375, 3.763214111328125, 3.89031982421875, 4.017425537109375, 4.14453125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 5.0, 16.0, 13.0, 18.0, 39.0, 54.0, 84.0, 148.0, 210.0, 290.0, 504.0, 784.0, 1316.0, 2002.0, 3540.0, 5808.0, 9595.0, 16017.0, 27308.0, 46786.0, 79670.0, 135529.0, 226753.0, 364469.0, 536554.0, 671346.0, 664384.0, 522237.0, 349574.0, 215819.0, 128790.0, 76197.0, 44193.0, 26081.0, 15160.0, 9099.0, 5495.0, 3089.0, 2024.0, 1232.0, 772.0, 480.0, 289.0, 194.0, 108.0, 73.0, 61.0, 28.0, 22.0, 13.0, 5.0, 5.0, 0.0, 5.0, 3.0, 0.0, 2.0], "bins": [-4.15625, -4.030120849609375, -3.90399169921875, -3.777862548828125, -3.6517333984375, -3.525604248046875, -3.39947509765625, -3.273345947265625, -3.147216796875, -3.021087646484375, -2.89495849609375, -2.768829345703125, -2.6427001953125, -2.516571044921875, -2.39044189453125, -2.264312744140625, -2.13818359375, -2.012054443359375, -1.88592529296875, -1.759796142578125, -1.6336669921875, -1.507537841796875, -1.38140869140625, -1.255279541015625, -1.129150390625, -1.003021240234375, -0.87689208984375, -0.750762939453125, -0.6246337890625, -0.498504638671875, -0.37237548828125, -0.246246337890625, -0.1201171875, 0.006011962890625, 0.13214111328125, 0.258270263671875, 0.3843994140625, 0.510528564453125, 0.63665771484375, 0.762786865234375, 0.888916015625, 1.015045166015625, 1.14117431640625, 1.267303466796875, 1.3934326171875, 1.519561767578125, 1.64569091796875, 1.771820068359375, 1.89794921875, 2.024078369140625, 2.15020751953125, 2.276336669921875, 2.4024658203125, 2.528594970703125, 2.65472412109375, 2.780853271484375, 2.906982421875, 3.033111572265625, 3.15924072265625, 3.285369873046875, 3.4114990234375, 3.537628173828125, 3.66375732421875, 3.789886474609375, 3.916015625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 11.0, 6.0, 11.0, 19.0, 23.0, 25.0, 35.0, 49.0, 43.0, 48.0, 62.0, 81.0, 91.0, 112.0, 140.0, 145.0, 142.0, 154.0, 192.0, 181.0, 204.0, 219.0, 207.0, 230.0, 205.0, 198.0, 177.0, 150.0, 168.0, 105.0, 96.0, 107.0, 91.0, 58.0, 48.0, 45.0, 38.0, 30.0, 24.0, 20.0, 16.0, 12.0, 11.0, 7.0, 11.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6044921875, -1.554901123046875, -1.50531005859375, -1.455718994140625, -1.4061279296875, -1.356536865234375, -1.30694580078125, -1.257354736328125, -1.207763671875, -1.158172607421875, -1.10858154296875, -1.058990478515625, -1.0093994140625, -0.959808349609375, -0.91021728515625, -0.860626220703125, -0.81103515625, -0.761444091796875, -0.71185302734375, -0.662261962890625, -0.6126708984375, -0.563079833984375, -0.51348876953125, -0.463897705078125, -0.414306640625, -0.364715576171875, -0.31512451171875, -0.265533447265625, -0.2159423828125, -0.166351318359375, -0.11676025390625, -0.067169189453125, -0.017578125, 0.032012939453125, 0.08160400390625, 0.131195068359375, 0.1807861328125, 0.230377197265625, 0.27996826171875, 0.329559326171875, 0.379150390625, 0.428741455078125, 0.47833251953125, 0.527923583984375, 0.5775146484375, 0.627105712890625, 0.67669677734375, 0.726287841796875, 0.77587890625, 0.825469970703125, 0.87506103515625, 0.924652099609375, 0.9742431640625, 1.023834228515625, 1.07342529296875, 1.123016357421875, 1.172607421875, 1.222198486328125, 1.27178955078125, 1.321380615234375, 1.3709716796875, 1.420562744140625, 1.47015380859375, 1.519744873046875, 1.5693359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 7.0, 4.0, 4.0, 8.0, 12.0, 8.0, 7.0, 13.0, 16.0, 17.0, 12.0, 27.0, 21.0, 30.0, 38.0, 37.0, 36.0, 47.0, 43.0, 45.0, 37.0, 52.0, 50.0, 35.0, 40.0, 36.0, 43.0, 33.0, 27.0, 42.0, 19.0, 17.0, 18.0, 24.0, 19.0, 15.0, 7.0, 14.0, 8.0, 7.0, 3.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.161049842834473, -4.037417888641357, -3.913785934448242, -3.790153980255127, -3.6665220260620117, -3.5428900718688965, -3.4192581176757812, -3.295626163482666, -3.171994209289551, -3.0483622550964355, -2.9247303009033203, -2.801098346710205, -2.67746639251709, -2.5538344383239746, -2.4302024841308594, -2.306570529937744, -2.18293833732605, -2.0593063831329346, -1.9356744289398193, -1.812042474746704, -1.6884105205535889, -1.5647785663604736, -1.4411464929580688, -1.3175145387649536, -1.1938825845718384, -1.0702506303787231, -0.9466186761856079, -0.8229866623878479, -0.6993547081947327, -0.5757227540016174, -0.4520907402038574, -0.3284587860107422, -0.20482707023620605, -0.08119510114192963, 0.0424368679523468, 0.16606885194778442, 0.28970080614089966, 0.4133327603340149, 0.5369647741317749, 0.6605967283248901, 0.7842286825180054, 0.9078606367111206, 1.0314925909042358, 1.1551246643066406, 1.2787566184997559, 1.402388572692871, 1.5260205268859863, 1.6496524810791016, 1.7732844352722168, 1.896916389465332, 2.0205483436584473, 2.1441802978515625, 2.2678122520446777, 2.391444206237793, 2.515076160430908, 2.6387081146240234, 2.7623400688171387, 2.885972023010254, 3.009603977203369, 3.1332359313964844, 3.2568678855895996, 3.380499839782715, 3.50413179397583, 3.6277637481689453, 3.7513959407806396]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 3.0, 5.0, 6.0, 6.0, 11.0, 14.0, 12.0, 10.0, 11.0, 14.0, 13.0, 16.0, 22.0, 22.0, 23.0, 32.0, 29.0, 32.0, 32.0, 37.0, 41.0, 46.0, 40.0, 35.0, 30.0, 43.0, 41.0, 29.0, 32.0, 40.0, 25.0, 36.0, 29.0, 18.0, 17.0, 18.0, 12.0, 25.0, 16.0, 15.0, 9.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 10.0, 6.0, 3.0, 1.0, 4.0, 3.0], "bins": [-4.6989970207214355, -4.563592910766602, -4.428188800811768, -4.292784690856934, -4.1573805809021, -4.021976470947266, -3.8865723609924316, -3.7511682510375977, -3.6157641410827637, -3.4803600311279297, -3.3449559211730957, -3.2095518112182617, -3.0741477012634277, -2.9387435913085938, -2.8033394813537598, -2.667935371398926, -2.532531261444092, -2.397127151489258, -2.261723041534424, -2.12631893157959, -1.9909148216247559, -1.8555107116699219, -1.720106601715088, -1.584702491760254, -1.44929838180542, -1.313894271850586, -1.178490161895752, -1.043086051940918, -0.907681941986084, -0.77227783203125, -0.636873722076416, -0.501469612121582, -0.36606550216674805, -0.23066139221191406, -0.09525728225708008, 0.040146827697753906, 0.1755509376525879, 0.3109550476074219, 0.44635915756225586, 0.5817632675170898, 0.7171673774719238, 0.8525714874267578, 0.9879755973815918, 1.1233797073364258, 1.2587838172912598, 1.3941879272460938, 1.5295920372009277, 1.6649961471557617, 1.8004002571105957, 1.9358043670654297, 2.0712084770202637, 2.2066125869750977, 2.3420166969299316, 2.4774208068847656, 2.6128249168395996, 2.7482290267944336, 2.8836331367492676, 3.0190372467041016, 3.1544413566589355, 3.2898454666137695, 3.4252495765686035, 3.5606536865234375, 3.6960577964782715, 3.8314619064331055, 3.9668660163879395]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 5.0, 10.0, 17.0, 23.0, 44.0, 80.0, 89.0, 142.0, 243.0, 303.0, 431.0, 683.0, 1083.0, 1559.0, 2547.0, 3806.0, 6215.0, 10247.0, 16243.0, 25983.0, 41678.0, 63529.0, 92707.0, 123952.0, 144742.0, 141555.0, 119116.0, 88287.0, 60041.0, 38443.0, 24202.0, 15179.0, 9194.0, 5749.0, 3647.0, 2327.0, 1487.0, 954.0, 667.0, 436.0, 279.0, 222.0, 129.0, 88.0, 57.0, 41.0, 29.0, 16.0, 16.0, 9.0, 7.0, 7.0, 3.0, 5.0, 3.0], "bins": [-1.0732421875, -1.0416030883789062, -1.0099639892578125, -0.9783248901367188, -0.946685791015625, -0.9150466918945312, -0.8834075927734375, -0.8517684936523438, -0.82012939453125, -0.7884902954101562, -0.7568511962890625, -0.7252120971679688, -0.693572998046875, -0.6619338989257812, -0.6302947998046875, -0.5986557006835938, -0.5670166015625, -0.5353775024414062, -0.5037384033203125, -0.47209930419921875, -0.440460205078125, -0.40882110595703125, -0.3771820068359375, -0.34554290771484375, -0.31390380859375, -0.28226470947265625, -0.2506256103515625, -0.21898651123046875, -0.187347412109375, -0.15570831298828125, -0.1240692138671875, -0.09243011474609375, -0.060791015625, -0.02915191650390625, 0.0024871826171875, 0.03412628173828125, 0.065765380859375, 0.09740447998046875, 0.1290435791015625, 0.16068267822265625, 0.19232177734375, 0.22396087646484375, 0.2555999755859375, 0.28723907470703125, 0.318878173828125, 0.35051727294921875, 0.3821563720703125, 0.41379547119140625, 0.4454345703125, 0.47707366943359375, 0.5087127685546875, 0.5403518676757812, 0.571990966796875, 0.6036300659179688, 0.6352691650390625, 0.6669082641601562, 0.69854736328125, 0.7301864624023438, 0.7618255615234375, 0.7934646606445312, 0.825103759765625, 0.8567428588867188, 0.8883819580078125, 0.9200210571289062, 0.95166015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 9.0, 10.0, 7.0, 10.0, 15.0, 14.0, 16.0, 21.0, 31.0, 31.0, 25.0, 24.0, 23.0, 36.0, 37.0, 47.0, 51.0, 63.0, 38.0, 50.0, 36.0, 34.0, 39.0, 34.0, 47.0, 32.0, 23.0, 31.0, 26.0, 17.0, 23.0, 20.0, 18.0, 11.0, 8.0, 3.0, 10.0, 5.0, 4.0, 3.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2890625, -5.12847900390625, -4.9678955078125, -4.80731201171875, -4.646728515625, -4.48614501953125, -4.3255615234375, -4.16497802734375, -4.00439453125, -3.84381103515625, -3.6832275390625, -3.52264404296875, -3.362060546875, -3.20147705078125, -3.0408935546875, -2.88031005859375, -2.7197265625, -2.55914306640625, -2.3985595703125, -2.23797607421875, -2.077392578125, -1.91680908203125, -1.7562255859375, -1.59564208984375, -1.43505859375, -1.27447509765625, -1.1138916015625, -0.95330810546875, -0.792724609375, -0.63214111328125, -0.4715576171875, -0.31097412109375, -0.150390625, 0.01019287109375, 0.1707763671875, 0.33135986328125, 0.491943359375, 0.65252685546875, 0.8131103515625, 0.97369384765625, 1.13427734375, 1.29486083984375, 1.4554443359375, 1.61602783203125, 1.776611328125, 1.93719482421875, 2.0977783203125, 2.25836181640625, 2.4189453125, 2.57952880859375, 2.7401123046875, 2.90069580078125, 3.061279296875, 3.22186279296875, 3.3824462890625, 3.54302978515625, 3.70361328125, 3.86419677734375, 4.0247802734375, 4.18536376953125, 4.345947265625, 4.50653076171875, 4.6671142578125, 4.82769775390625, 4.98828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 4.0, 4.0, 3.0, 3.0, 6.0, 5.0, 8.0, 13.0, 23.0, 12.0, 25.0, 31.0, 48.0, 49.0, 65.0, 93.0, 95.0, 139.0, 195.0, 312.0, 480.0, 867.0, 1619.0, 3293.0, 6788.0, 15297.0, 36228.0, 690409.0, 240203.0, 28413.0, 12049.0, 5642.0, 2650.0, 1319.0, 751.0, 447.0, 269.0, 184.0, 130.0, 80.0, 64.0, 39.0, 48.0, 40.0, 18.0, 23.0, 21.0, 12.0, 9.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-4.27734375, -4.1387939453125, -4.000244140625, -3.8616943359375, -3.72314453125, -3.5845947265625, -3.446044921875, -3.3074951171875, -3.1689453125, -3.0303955078125, -2.891845703125, -2.7532958984375, -2.61474609375, -2.4761962890625, -2.337646484375, -2.1990966796875, -2.060546875, -1.9219970703125, -1.783447265625, -1.6448974609375, -1.50634765625, -1.3677978515625, -1.229248046875, -1.0906982421875, -0.9521484375, -0.8135986328125, -0.675048828125, -0.5364990234375, -0.39794921875, -0.2593994140625, -0.120849609375, 0.0177001953125, 0.15625, 0.2947998046875, 0.433349609375, 0.5718994140625, 0.71044921875, 0.8489990234375, 0.987548828125, 1.1260986328125, 1.2646484375, 1.4031982421875, 1.541748046875, 1.6802978515625, 1.81884765625, 1.9573974609375, 2.095947265625, 2.2344970703125, 2.373046875, 2.5115966796875, 2.650146484375, 2.7886962890625, 2.92724609375, 3.0657958984375, 3.204345703125, 3.3428955078125, 3.4814453125, 3.6199951171875, 3.758544921875, 3.8970947265625, 4.03564453125, 4.1741943359375, 4.312744140625, 4.4512939453125, 4.58984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 8.0, 4.0, 8.0, 7.0, 24.0, 11.0, 20.0, 18.0, 14.0, 24.0, 38.0, 28.0, 26.0, 41.0, 31.0, 38.0, 35.0, 30.0, 39.0, 40.0, 26.0, 36.0, 37.0, 37.0, 41.0, 36.0, 31.0, 28.0, 26.0, 20.0, 28.0, 24.0, 20.0, 15.0, 25.0, 9.0, 12.0, 14.0, 9.0, 10.0, 3.0, 6.0, 7.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.22265625, -3.12200927734375, -3.0213623046875, -2.92071533203125, -2.820068359375, -2.71942138671875, -2.6187744140625, -2.51812744140625, -2.41748046875, -2.31683349609375, -2.2161865234375, -2.11553955078125, -2.014892578125, -1.91424560546875, -1.8135986328125, -1.71295166015625, -1.6123046875, -1.51165771484375, -1.4110107421875, -1.31036376953125, -1.209716796875, -1.10906982421875, -1.0084228515625, -0.90777587890625, -0.80712890625, -0.70648193359375, -0.6058349609375, -0.50518798828125, -0.404541015625, -0.30389404296875, -0.2032470703125, -0.10260009765625, -0.001953125, 0.09869384765625, 0.1993408203125, 0.29998779296875, 0.400634765625, 0.50128173828125, 0.6019287109375, 0.70257568359375, 0.80322265625, 0.90386962890625, 1.0045166015625, 1.10516357421875, 1.205810546875, 1.30645751953125, 1.4071044921875, 1.50775146484375, 1.6083984375, 1.70904541015625, 1.8096923828125, 1.91033935546875, 2.010986328125, 2.11163330078125, 2.2122802734375, 2.31292724609375, 2.41357421875, 2.51422119140625, 2.6148681640625, 2.71551513671875, 2.816162109375, 2.91680908203125, 3.0174560546875, 3.11810302734375, 3.21875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 8.0, 7.0, 11.0, 13.0, 26.0, 19.0, 47.0, 48.0, 96.0, 138.0, 249.0, 434.0, 723.0, 1292.0, 2520.0, 4840.0, 9893.0, 21533.0, 66134.0, 820968.0, 75407.0, 22637.0, 10381.0, 5098.0, 2578.0, 1484.0, 778.0, 443.0, 249.0, 167.0, 124.0, 64.0, 43.0, 31.0, 17.0, 14.0, 14.0, 6.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296142578125, -0.2861137390136719, -0.27608489990234375, -0.2660560607910156, -0.2560272216796875, -0.24599838256835938, -0.23596954345703125, -0.22594070434570312, -0.215911865234375, -0.20588302612304688, -0.19585418701171875, -0.18582534790039062, -0.1757965087890625, -0.16576766967773438, -0.15573883056640625, -0.14570999145507812, -0.13568115234375, -0.12565231323242188, -0.11562347412109375, -0.10559463500976562, -0.0955657958984375, -0.08553695678710938, -0.07550811767578125, -0.06547927856445312, -0.055450439453125, -0.045421600341796875, -0.03539276123046875, -0.025363922119140625, -0.0153350830078125, -0.005306243896484375, 0.00472259521484375, 0.014751434326171875, 0.0247802734375, 0.034809112548828125, 0.04483795166015625, 0.054866790771484375, 0.0648956298828125, 0.07492446899414062, 0.08495330810546875, 0.09498214721679688, 0.105010986328125, 0.11503982543945312, 0.12506866455078125, 0.13509750366210938, 0.1451263427734375, 0.15515518188476562, 0.16518402099609375, 0.17521286010742188, 0.18524169921875, 0.19527053833007812, 0.20529937744140625, 0.21532821655273438, 0.2253570556640625, 0.23538589477539062, 0.24541473388671875, 0.2554435729980469, 0.265472412109375, 0.2755012512207031, 0.28553009033203125, 0.2955589294433594, 0.3055877685546875, 0.3156166076660156, 0.32564544677734375, 0.3356742858886719, 0.345703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 9.0, 8.0, 12.0, 15.0, 23.0, 14.0, 26.0, 34.0, 34.0, 45.0, 36.0, 47.0, 47.0, 48.0, 54.0, 62.0, 54.0, 48.0, 42.0, 50.0, 48.0, 44.0, 30.0, 28.0, 26.0, 22.0, 12.0, 13.0, 7.0, 11.0, 10.0, 8.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.110004425048828e-05, -2.042856067419052e-05, -1.975707709789276e-05, -1.9085593521595e-05, -1.841410994529724e-05, -1.774262636899948e-05, -1.707114279270172e-05, -1.639965921640396e-05, -1.57281756401062e-05, -1.5056692063808441e-05, -1.4385208487510681e-05, -1.3713724911212921e-05, -1.3042241334915161e-05, -1.2370757758617401e-05, -1.1699274182319641e-05, -1.1027790606021881e-05, -1.0356307029724121e-05, -9.684823453426361e-06, -9.013339877128601e-06, -8.341856300830841e-06, -7.670372724533081e-06, -6.998889148235321e-06, -6.327405571937561e-06, -5.655921995639801e-06, -4.984438419342041e-06, -4.312954843044281e-06, -3.641471266746521e-06, -2.969987690448761e-06, -2.298504114151001e-06, -1.627020537853241e-06, -9.55536961555481e-07, -2.8405338525772095e-07, 3.8743019104003906e-07, 1.058913767337799e-06, 1.730397343635559e-06, 2.401880919933319e-06, 3.073364496231079e-06, 3.744848072528839e-06, 4.416331648826599e-06, 5.087815225124359e-06, 5.759298801422119e-06, 6.430782377719879e-06, 7.102265954017639e-06, 7.7737495303154e-06, 8.44523310661316e-06, 9.11671668291092e-06, 9.78820025920868e-06, 1.045968383550644e-05, 1.11311674118042e-05, 1.180265098810196e-05, 1.247413456439972e-05, 1.314561814069748e-05, 1.381710171699524e-05, 1.4488585293293e-05, 1.516006886959076e-05, 1.583155244588852e-05, 1.650303602218628e-05, 1.717451959848404e-05, 1.78460031747818e-05, 1.851748675107956e-05, 1.918897032737732e-05, 1.986045390367508e-05, 2.053193747997284e-05, 2.12034210562706e-05, 2.187490463256836e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 12.0, 22.0, 23.0, 45.0, 59.0, 89.0, 131.0, 204.0, 299.0, 455.0, 656.0, 1050.0, 1528.0, 2346.0, 3413.0, 5170.0, 7624.0, 11595.0, 17809.0, 27002.0, 40608.0, 61113.0, 86661.0, 115861.0, 137191.0, 138775.0, 116873.0, 88208.0, 61345.0, 41699.0, 27193.0, 17845.0, 11743.0, 7892.0, 5271.0, 3527.0, 2473.0, 1574.0, 1035.0, 724.0, 473.0, 324.0, 199.0, 138.0, 82.0, 66.0, 38.0, 18.0, 22.0, 15.0, 15.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.1903076171875, -0.18436431884765625, -0.1784210205078125, -0.17247772216796875, -0.166534423828125, -0.16059112548828125, -0.1546478271484375, -0.14870452880859375, -0.14276123046875, -0.13681793212890625, -0.1308746337890625, -0.12493133544921875, -0.118988037109375, -0.11304473876953125, -0.1071014404296875, -0.10115814208984375, -0.09521484375, -0.08927154541015625, -0.0833282470703125, -0.07738494873046875, -0.071441650390625, -0.06549835205078125, -0.0595550537109375, -0.05361175537109375, -0.04766845703125, -0.04172515869140625, -0.0357818603515625, -0.02983856201171875, -0.023895263671875, -0.01795196533203125, -0.0120086669921875, -0.00606536865234375, -0.0001220703125, 0.00582122802734375, 0.0117645263671875, 0.01770782470703125, 0.023651123046875, 0.02959442138671875, 0.0355377197265625, 0.04148101806640625, 0.04742431640625, 0.05336761474609375, 0.0593109130859375, 0.06525421142578125, 0.071197509765625, 0.07714080810546875, 0.0830841064453125, 0.08902740478515625, 0.094970703125, 0.10091400146484375, 0.1068572998046875, 0.11280059814453125, 0.118743896484375, 0.12468719482421875, 0.1306304931640625, 0.13657379150390625, 0.14251708984375, 0.14846038818359375, 0.1544036865234375, 0.16034698486328125, 0.166290283203125, 0.17223358154296875, 0.1781768798828125, 0.18412017822265625, 0.1900634765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 2.0, 5.0, 6.0, 5.0, 10.0, 14.0, 8.0, 14.0, 18.0, 19.0, 14.0, 22.0, 33.0, 30.0, 33.0, 52.0, 55.0, 50.0, 49.0, 61.0, 40.0, 47.0, 58.0, 44.0, 53.0, 43.0, 30.0, 28.0, 30.0, 29.0, 12.0, 13.0, 11.0, 15.0, 7.0, 8.0, 6.0, 2.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080810546875, -0.07824039459228516, -0.07567024230957031, -0.07310009002685547, -0.07052993774414062, -0.06795978546142578, -0.06538963317871094, -0.0628194808959961, -0.06024932861328125, -0.057679176330566406, -0.05510902404785156, -0.05253887176513672, -0.049968719482421875, -0.04739856719970703, -0.04482841491699219, -0.042258262634277344, -0.0396881103515625, -0.037117958068847656, -0.03454780578613281, -0.03197765350341797, -0.029407501220703125, -0.02683734893798828, -0.024267196655273438, -0.021697044372558594, -0.01912689208984375, -0.016556739807128906, -0.013986587524414062, -0.011416435241699219, -0.008846282958984375, -0.006276130676269531, -0.0037059783935546875, -0.0011358261108398438, 0.001434326171875, 0.004004478454589844, 0.0065746307373046875, 0.009144783020019531, 0.011714935302734375, 0.014285087585449219, 0.016855239868164062, 0.019425392150878906, 0.02199554443359375, 0.024565696716308594, 0.027135848999023438, 0.02970600128173828, 0.032276153564453125, 0.03484630584716797, 0.03741645812988281, 0.039986610412597656, 0.0425567626953125, 0.045126914978027344, 0.04769706726074219, 0.05026721954345703, 0.052837371826171875, 0.05540752410888672, 0.05797767639160156, 0.060547828674316406, 0.06311798095703125, 0.0656881332397461, 0.06825828552246094, 0.07082843780517578, 0.07339859008789062, 0.07596874237060547, 0.07853889465332031, 0.08110904693603516, 0.08367919921875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 0.0, 8.0, 5.0, 5.0, 9.0, 2.0, 9.0, 13.0, 14.0, 13.0, 15.0, 25.0, 24.0, 26.0, 25.0, 31.0, 41.0, 41.0, 54.0, 35.0, 43.0, 53.0, 47.0, 47.0, 38.0, 37.0, 36.0, 45.0, 33.0, 32.0, 35.0, 20.0, 17.0, 20.0, 22.0, 18.0, 15.0, 11.0, 6.0, 6.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.1700215339660645, -4.044659614562988, -3.919297218322754, -3.7939352989196777, -3.6685731410980225, -3.543210983276367, -3.417848825454712, -3.2924866676330566, -3.1671247482299805, -3.041762590408325, -2.91640043258667, -2.7910385131835938, -2.6656763553619385, -2.540314197540283, -2.414952039718628, -2.2895898818969727, -2.1642277240753174, -2.038865566253662, -1.9135035276412964, -1.7881413698196411, -1.6627793312072754, -1.5374171733856201, -1.4120550155639648, -1.2866928577423096, -1.1613308191299438, -1.0359686613082886, -0.9106066226959229, -0.7852444648742676, -0.6598823666572571, -0.5345202684402466, -0.4091581106185913, -0.2837960124015808, -0.1584336757659912, -0.03307156264781952, 0.09229055047035217, 0.21765267848968506, 0.34301477670669556, 0.46837687492370605, 0.5937390327453613, 0.7191011309623718, 0.8444632291793823, 0.9698253273963928, 1.0951874256134033, 1.2205495834350586, 1.3459117412567139, 1.4712737798690796, 1.5966359376907349, 1.7219979763031006, 1.8473601341247559, 1.9727222919464111, 2.0980844497680664, 2.2234463691711426, 2.348808526992798, 2.474170684814453, 2.5995328426361084, 2.7248950004577637, 2.85025691986084, 2.975619077682495, 3.1009812355041504, 3.2263431549072266, 3.351705312728882, 3.477067470550537, 3.6024296283721924, 3.7277917861938477, 3.853153944015503]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 8.0, 12.0, 14.0, 6.0, 14.0, 10.0, 17.0, 15.0, 21.0, 18.0, 30.0, 29.0, 33.0, 31.0, 28.0, 36.0, 47.0, 40.0, 36.0, 43.0, 32.0, 39.0, 41.0, 26.0, 41.0, 36.0, 25.0, 37.0, 28.0, 22.0, 16.0, 19.0, 14.0, 19.0, 17.0, 16.0, 12.0, 8.0, 6.0, 5.0, 6.0, 3.0, 3.0, 11.0, 5.0, 1.0, 3.0, 4.0, 2.0], "bins": [-4.717719078063965, -4.582234859466553, -4.446750640869141, -4.3112664222717285, -4.175782203674316, -4.040297985076904, -3.904813766479492, -3.76932954788208, -3.633845329284668, -3.498361110687256, -3.3628768920898438, -3.2273926734924316, -3.0919084548950195, -2.9564242362976074, -2.8209400177001953, -2.685455799102783, -2.549971342086792, -2.41448712348938, -2.2790029048919678, -2.1435186862945557, -2.0080344676971436, -1.8725502490997314, -1.7370659112930298, -1.6015816926956177, -1.4660974740982056, -1.3306132555007935, -1.1951290369033813, -1.0596446990966797, -0.9241605401039124, -0.7886763215065002, -0.6531920433044434, -0.5177078247070312, -0.38222360610961914, -0.24673937261104584, -0.11125513911247253, 0.024229109287261963, 0.15971332788467407, 0.2951975464820862, 0.43068182468414307, 0.5661660432815552, 0.7016502618789673, 0.8371344804763794, 0.9726186990737915, 1.1081030368804932, 1.2435872554779053, 1.3790714740753174, 1.5145556926727295, 1.6500399112701416, 1.7855241298675537, 1.9210083484649658, 2.056492567062378, 2.19197678565979, 2.327461004257202, 2.4629452228546143, 2.5984296798706055, 2.7339138984680176, 2.8693981170654297, 3.004882335662842, 3.140366554260254, 3.275850772857666, 3.411334991455078, 3.5468192100524902, 3.6823034286499023, 3.8177876472473145, 3.9532718658447266]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 6.0, 2.0, 7.0, 11.0, 24.0, 40.0, 53.0, 71.0, 104.0, 203.0, 258.0, 406.0, 682.0, 1049.0, 1456.0, 2268.0, 3472.0, 5058.0, 7499.0, 10832.0, 16009.0, 22959.0, 31876.0, 43997.0, 58373.0, 73203.0, 88138.0, 98776.0, 103128.0, 99331.0, 89390.0, 75465.0, 60178.0, 45332.0, 33352.0, 23984.0, 16777.0, 11390.0, 7768.0, 5292.0, 3507.0, 2340.0, 1586.0, 1018.0, 638.0, 430.0, 276.0, 181.0, 139.0, 87.0, 53.0, 30.0, 23.0, 21.0, 11.0, 6.0, 3.0, 1.0, 0.0, 2.0], "bins": [-2.625, -2.54437255859375, -2.4637451171875, -2.38311767578125, -2.302490234375, -2.22186279296875, -2.1412353515625, -2.06060791015625, -1.97998046875, -1.89935302734375, -1.8187255859375, -1.73809814453125, -1.657470703125, -1.57684326171875, -1.4962158203125, -1.41558837890625, -1.3349609375, -1.25433349609375, -1.1737060546875, -1.09307861328125, -1.012451171875, -0.93182373046875, -0.8511962890625, -0.77056884765625, -0.68994140625, -0.60931396484375, -0.5286865234375, -0.44805908203125, -0.367431640625, -0.28680419921875, -0.2061767578125, -0.12554931640625, -0.044921875, 0.03570556640625, 0.1163330078125, 0.19696044921875, 0.277587890625, 0.35821533203125, 0.4388427734375, 0.51947021484375, 0.60009765625, 0.68072509765625, 0.7613525390625, 0.84197998046875, 0.922607421875, 1.00323486328125, 1.0838623046875, 1.16448974609375, 1.2451171875, 1.32574462890625, 1.4063720703125, 1.48699951171875, 1.567626953125, 1.64825439453125, 1.7288818359375, 1.80950927734375, 1.89013671875, 1.97076416015625, 2.0513916015625, 2.13201904296875, 2.212646484375, 2.29327392578125, 2.3739013671875, 2.45452880859375, 2.53515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 7.0, 7.0, 5.0, 5.0, 10.0, 7.0, 14.0, 10.0, 19.0, 14.0, 12.0, 20.0, 20.0, 29.0, 22.0, 32.0, 33.0, 27.0, 42.0, 29.0, 45.0, 45.0, 34.0, 37.0, 35.0, 32.0, 42.0, 26.0, 30.0, 36.0, 17.0, 30.0, 25.0, 31.0, 18.0, 14.0, 20.0, 12.0, 17.0, 12.0, 21.0, 12.0, 12.0, 8.0, 7.0, 6.0, 1.0, 2.0, 8.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-4.328125, -4.19586181640625, -4.0635986328125, -3.93133544921875, -3.799072265625, -3.66680908203125, -3.5345458984375, -3.40228271484375, -3.27001953125, -3.13775634765625, -3.0054931640625, -2.87322998046875, -2.740966796875, -2.60870361328125, -2.4764404296875, -2.34417724609375, -2.2119140625, -2.07965087890625, -1.9473876953125, -1.81512451171875, -1.682861328125, -1.55059814453125, -1.4183349609375, -1.28607177734375, -1.15380859375, -1.02154541015625, -0.8892822265625, -0.75701904296875, -0.624755859375, -0.49249267578125, -0.3602294921875, -0.22796630859375, -0.095703125, 0.03656005859375, 0.1688232421875, 0.30108642578125, 0.433349609375, 0.56561279296875, 0.6978759765625, 0.83013916015625, 0.96240234375, 1.09466552734375, 1.2269287109375, 1.35919189453125, 1.491455078125, 1.62371826171875, 1.7559814453125, 1.88824462890625, 2.0205078125, 2.15277099609375, 2.2850341796875, 2.41729736328125, 2.549560546875, 2.68182373046875, 2.8140869140625, 2.94635009765625, 3.07861328125, 3.21087646484375, 3.3431396484375, 3.47540283203125, 3.607666015625, 3.73992919921875, 3.8721923828125, 4.00445556640625, 4.13671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 12.0, 9.0, 12.0, 25.0, 40.0, 30.0, 84.0, 94.0, 146.0, 270.0, 414.0, 559.0, 933.0, 1478.0, 2295.0, 3427.0, 5488.0, 8457.0, 13296.0, 19824.0, 29802.0, 43267.0, 60655.0, 80979.0, 100984.0, 115287.0, 118620.0, 110729.0, 93645.0, 73086.0, 53598.0, 37398.0, 25482.0, 17212.0, 10997.0, 7202.0, 4438.0, 2949.0, 1894.0, 1245.0, 781.0, 476.0, 319.0, 241.0, 124.0, 90.0, 65.0, 41.0, 29.0, 16.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 4.0], "bins": [-3.29296875, -3.194091796875, -3.09521484375, -2.996337890625, -2.8974609375, -2.798583984375, -2.69970703125, -2.600830078125, -2.501953125, -2.403076171875, -2.30419921875, -2.205322265625, -2.1064453125, -2.007568359375, -1.90869140625, -1.809814453125, -1.7109375, -1.612060546875, -1.51318359375, -1.414306640625, -1.3154296875, -1.216552734375, -1.11767578125, -1.018798828125, -0.919921875, -0.821044921875, -0.72216796875, -0.623291015625, -0.5244140625, -0.425537109375, -0.32666015625, -0.227783203125, -0.12890625, -0.030029296875, 0.06884765625, 0.167724609375, 0.2666015625, 0.365478515625, 0.46435546875, 0.563232421875, 0.662109375, 0.760986328125, 0.85986328125, 0.958740234375, 1.0576171875, 1.156494140625, 1.25537109375, 1.354248046875, 1.453125, 1.552001953125, 1.65087890625, 1.749755859375, 1.8486328125, 1.947509765625, 2.04638671875, 2.145263671875, 2.244140625, 2.343017578125, 2.44189453125, 2.540771484375, 2.6396484375, 2.738525390625, 2.83740234375, 2.936279296875, 3.03515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 5.0, 8.0, 13.0, 10.0, 12.0, 26.0, 11.0, 17.0, 19.0, 20.0, 26.0, 26.0, 35.0, 39.0, 35.0, 44.0, 31.0, 42.0, 49.0, 45.0, 45.0, 49.0, 30.0, 39.0, 24.0, 33.0, 23.0, 26.0, 29.0, 22.0, 25.0, 16.0, 14.0, 16.0, 15.0, 13.0, 11.0, 7.0, 12.0, 5.0, 12.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.79852294921875, -2.7064208984375, -2.61431884765625, -2.522216796875, -2.43011474609375, -2.3380126953125, -2.24591064453125, -2.15380859375, -2.06170654296875, -1.9696044921875, -1.87750244140625, -1.785400390625, -1.69329833984375, -1.6011962890625, -1.50909423828125, -1.4169921875, -1.32489013671875, -1.2327880859375, -1.14068603515625, -1.048583984375, -0.95648193359375, -0.8643798828125, -0.77227783203125, -0.68017578125, -0.58807373046875, -0.4959716796875, -0.40386962890625, -0.311767578125, -0.21966552734375, -0.1275634765625, -0.03546142578125, 0.056640625, 0.14874267578125, 0.2408447265625, 0.33294677734375, 0.425048828125, 0.51715087890625, 0.6092529296875, 0.70135498046875, 0.79345703125, 0.88555908203125, 0.9776611328125, 1.06976318359375, 1.161865234375, 1.25396728515625, 1.3460693359375, 1.43817138671875, 1.5302734375, 1.62237548828125, 1.7144775390625, 1.80657958984375, 1.898681640625, 1.99078369140625, 2.0828857421875, 2.17498779296875, 2.26708984375, 2.35919189453125, 2.4512939453125, 2.54339599609375, 2.635498046875, 2.72760009765625, 2.8197021484375, 2.91180419921875, 3.00390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 6.0, 14.0, 11.0, 19.0, 35.0, 52.0, 63.0, 128.0, 202.0, 290.0, 482.0, 739.0, 1257.0, 2096.0, 3446.0, 5922.0, 10350.0, 17669.0, 30111.0, 50119.0, 78570.0, 114150.0, 144203.0, 156237.0, 140176.0, 106616.0, 73432.0, 45581.0, 27745.0, 16093.0, 9263.0, 5376.0, 3149.0, 1911.0, 1168.0, 724.0, 402.0, 255.0, 168.0, 104.0, 71.0, 49.0, 28.0, 20.0, 18.0, 8.0, 7.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.427734375, -1.3836822509765625, -1.339630126953125, -1.2955780029296875, -1.25152587890625, -1.2074737548828125, -1.163421630859375, -1.1193695068359375, -1.0753173828125, -1.0312652587890625, -0.987213134765625, -0.9431610107421875, -0.89910888671875, -0.8550567626953125, -0.811004638671875, -0.7669525146484375, -0.722900390625, -0.6788482666015625, -0.634796142578125, -0.5907440185546875, -0.54669189453125, -0.5026397705078125, -0.458587646484375, -0.4145355224609375, -0.3704833984375, -0.3264312744140625, -0.282379150390625, -0.2383270263671875, -0.19427490234375, -0.1502227783203125, -0.106170654296875, -0.0621185302734375, -0.01806640625, 0.0259857177734375, 0.070037841796875, 0.1140899658203125, 0.15814208984375, 0.2021942138671875, 0.246246337890625, 0.2902984619140625, 0.3343505859375, 0.3784027099609375, 0.422454833984375, 0.4665069580078125, 0.51055908203125, 0.5546112060546875, 0.598663330078125, 0.6427154541015625, 0.686767578125, 0.7308197021484375, 0.774871826171875, 0.8189239501953125, 0.86297607421875, 0.9070281982421875, 0.951080322265625, 0.9951324462890625, 1.0391845703125, 1.0832366943359375, 1.127288818359375, 1.1713409423828125, 1.21539306640625, 1.2594451904296875, 1.303497314453125, 1.3475494384765625, 1.3916015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 4.0, 7.0, 6.0, 9.0, 18.0, 17.0, 20.0, 17.0, 25.0, 37.0, 30.0, 52.0, 46.0, 50.0, 50.0, 55.0, 48.0, 50.0, 60.0, 47.0, 41.0, 41.0, 46.0, 33.0, 34.0, 34.0, 18.0, 23.0, 18.0, 8.0, 9.0, 6.0, 10.0, 5.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.00014781951904296875, -0.0001433044672012329, -0.00013878941535949707, -0.00013427436351776123, -0.0001297593116760254, -0.00012524425983428955, -0.00012072920799255371, -0.00011621415615081787, -0.00011169910430908203, -0.00010718405246734619, -0.00010266900062561035, -9.815394878387451e-05, -9.363889694213867e-05, -8.912384510040283e-05, -8.460879325866699e-05, -8.009374141693115e-05, -7.557868957519531e-05, -7.106363773345947e-05, -6.654858589172363e-05, -6.203353404998779e-05, -5.751848220825195e-05, -5.300343036651611e-05, -4.8488378524780273e-05, -4.3973326683044434e-05, -3.9458274841308594e-05, -3.4943222999572754e-05, -3.0428171157836914e-05, -2.5913119316101074e-05, -2.1398067474365234e-05, -1.6883015632629395e-05, -1.2367963790893555e-05, -7.852911949157715e-06, -3.337860107421875e-06, 1.1771917343139648e-06, 5.692243576049805e-06, 1.0207295417785645e-05, 1.4722347259521484e-05, 1.9237399101257324e-05, 2.3752450942993164e-05, 2.8267502784729004e-05, 3.2782554626464844e-05, 3.7297606468200684e-05, 4.1812658309936523e-05, 4.632771015167236e-05, 5.08427619934082e-05, 5.535781383514404e-05, 5.987286567687988e-05, 6.438791751861572e-05, 6.890296936035156e-05, 7.34180212020874e-05, 7.793307304382324e-05, 8.244812488555908e-05, 8.696317672729492e-05, 9.147822856903076e-05, 9.59932804107666e-05, 0.00010050833225250244, 0.00010502338409423828, 0.00010953843593597412, 0.00011405348777770996, 0.0001185685396194458, 0.00012308359146118164, 0.00012759864330291748, 0.00013211369514465332, 0.00013662874698638916, 0.000141143798828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 8.0, 14.0, 18.0, 30.0, 47.0, 65.0, 85.0, 186.0, 217.0, 389.0, 576.0, 914.0, 1501.0, 2440.0, 3906.0, 6412.0, 10494.0, 17405.0, 28463.0, 45346.0, 68429.0, 96207.0, 122784.0, 138691.0, 135310.0, 116019.0, 88517.0, 60295.0, 39903.0, 24982.0, 15418.0, 9080.0, 5523.0, 3236.0, 2043.0, 1302.0, 836.0, 516.0, 330.0, 225.0, 143.0, 79.0, 68.0, 43.0, 20.0, 18.0, 12.0, 9.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.29296875, -1.25238037109375, -1.2117919921875, -1.17120361328125, -1.130615234375, -1.09002685546875, -1.0494384765625, -1.00885009765625, -0.96826171875, -0.92767333984375, -0.8870849609375, -0.84649658203125, -0.805908203125, -0.76531982421875, -0.7247314453125, -0.68414306640625, -0.6435546875, -0.60296630859375, -0.5623779296875, -0.52178955078125, -0.481201171875, -0.44061279296875, -0.4000244140625, -0.35943603515625, -0.31884765625, -0.27825927734375, -0.2376708984375, -0.19708251953125, -0.156494140625, -0.11590576171875, -0.0753173828125, -0.03472900390625, 0.005859375, 0.04644775390625, 0.0870361328125, 0.12762451171875, 0.168212890625, 0.20880126953125, 0.2493896484375, 0.28997802734375, 0.33056640625, 0.37115478515625, 0.4117431640625, 0.45233154296875, 0.492919921875, 0.53350830078125, 0.5740966796875, 0.61468505859375, 0.6552734375, 0.69586181640625, 0.7364501953125, 0.77703857421875, 0.817626953125, 0.85821533203125, 0.8988037109375, 0.93939208984375, 0.97998046875, 1.02056884765625, 1.0611572265625, 1.10174560546875, 1.142333984375, 1.18292236328125, 1.2235107421875, 1.26409912109375, 1.3046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 0.0, 4.0, 7.0, 9.0, 11.0, 8.0, 25.0, 20.0, 23.0, 26.0, 30.0, 40.0, 43.0, 51.0, 56.0, 48.0, 48.0, 63.0, 46.0, 52.0, 43.0, 53.0, 59.0, 36.0, 32.0, 39.0, 19.0, 20.0, 18.0, 17.0, 12.0, 10.0, 7.0, 3.0, 5.0, 2.0, 5.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5170059204101562, -0.4998321533203125, -0.48265838623046875, -0.465484619140625, -0.44831085205078125, -0.4311370849609375, -0.41396331787109375, -0.39678955078125, -0.37961578369140625, -0.3624420166015625, -0.34526824951171875, -0.328094482421875, -0.31092071533203125, -0.2937469482421875, -0.27657318115234375, -0.2593994140625, -0.24222564697265625, -0.2250518798828125, -0.20787811279296875, -0.190704345703125, -0.17353057861328125, -0.1563568115234375, -0.13918304443359375, -0.12200927734375, -0.10483551025390625, -0.0876617431640625, -0.07048797607421875, -0.053314208984375, -0.03614044189453125, -0.0189666748046875, -0.00179290771484375, 0.015380859375, 0.03255462646484375, 0.0497283935546875, 0.06690216064453125, 0.084075927734375, 0.10124969482421875, 0.1184234619140625, 0.13559722900390625, 0.15277099609375, 0.16994476318359375, 0.1871185302734375, 0.20429229736328125, 0.221466064453125, 0.23863983154296875, 0.2558135986328125, 0.27298736572265625, 0.2901611328125, 0.30733489990234375, 0.3245086669921875, 0.34168243408203125, 0.358856201171875, 0.37602996826171875, 0.3932037353515625, 0.41037750244140625, 0.42755126953125, 0.44472503662109375, 0.4618988037109375, 0.47907257080078125, 0.496246337890625, 0.5134201049804688, 0.5305938720703125, 0.5477676391601562, 0.56494140625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 4.0, 7.0, 12.0, 6.0, 14.0, 14.0, 20.0, 15.0, 26.0, 29.0, 28.0, 42.0, 45.0, 39.0, 55.0, 44.0, 46.0, 47.0, 52.0, 38.0, 44.0, 55.0, 42.0, 36.0, 34.0, 32.0, 22.0, 26.0, 21.0, 19.0, 9.0, 15.0, 18.0, 7.0, 9.0, 5.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.517250061035156, -4.383393287658691, -4.249536037445068, -4.115678787231445, -3.9818220138549805, -3.8479650020599365, -3.7141079902648926, -3.5802509784698486, -3.4463939666748047, -3.3125369548797607, -3.178679943084717, -3.044822931289673, -2.910965919494629, -2.777108907699585, -2.643251895904541, -2.509394884109497, -2.375537872314453, -2.241680860519409, -2.1078238487243652, -1.9739668369293213, -1.8401098251342773, -1.7062528133392334, -1.5723958015441895, -1.4385387897491455, -1.3046817779541016, -1.1708247661590576, -1.0369677543640137, -0.9031107425689697, -0.7692537307739258, -0.6353967189788818, -0.5015397071838379, -0.36768269538879395, -0.2338252067565918, -0.09996819496154785, 0.033888816833496094, 0.16774582862854004, 0.301602840423584, 0.43545985221862793, 0.5693168640136719, 0.7031738758087158, 0.8370308876037598, 0.9708878993988037, 1.1047449111938477, 1.2386019229888916, 1.3724589347839355, 1.5063159465789795, 1.6401729583740234, 1.7740299701690674, 1.9078869819641113, 2.0417439937591553, 2.175601005554199, 2.309458017349243, 2.443315029144287, 2.577172040939331, 2.711029052734375, 2.844886064529419, 2.978743076324463, 3.112600088119507, 3.246457099914551, 3.3803141117095947, 3.5141711235046387, 3.6480281352996826, 3.7818851470947266, 3.9157421588897705, 4.0495991706848145]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 4.0, 12.0, 11.0, 10.0, 14.0, 13.0, 13.0, 18.0, 21.0, 16.0, 33.0, 35.0, 30.0, 27.0, 34.0, 38.0, 50.0, 32.0, 31.0, 48.0, 47.0, 47.0, 46.0, 33.0, 34.0, 25.0, 35.0, 35.0, 32.0, 27.0, 29.0, 19.0, 16.0, 10.0, 13.0, 11.0, 17.0, 9.0, 3.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.927131175994873, -4.772489070892334, -4.617846965789795, -4.463205337524414, -4.308563232421875, -4.153921127319336, -3.999279022216797, -3.844636917114258, -3.689995050430298, -3.535352945327759, -3.380711078643799, -3.2260689735412598, -3.0714268684387207, -2.9167850017547607, -2.7621428966522217, -2.6075010299682617, -2.4528589248657227, -2.2982168197631836, -2.1435749530792236, -1.9889328479766846, -1.834290862083435, -1.6796488761901855, -1.5250067710876465, -1.370364785194397, -1.2157227993011475, -1.061080813407898, -0.9064387679100037, -0.7517967224121094, -0.5971547365188599, -0.44251275062561035, -0.28787070512771606, -0.13322865962982178, 0.021413326263427734, 0.17605534195899963, 0.33069735765457153, 0.48533937335014343, 0.6399813890457153, 0.7946233749389648, 0.9492654204368591, 1.1039074659347534, 1.258549451828003, 1.4131914377212524, 1.567833423614502, 1.722475528717041, 1.8771175146102905, 2.03175950050354, 2.186401605606079, 2.341043472290039, 2.495685577392578, 2.650327682495117, 2.804969549179077, 2.959611654281616, 3.114253520965576, 3.2688956260681152, 3.4235377311706543, 3.5781798362731934, 3.7328217029571533, 3.8874638080596924, 4.042105674743652, 4.196747779846191, 4.3513898849487305, 4.5060319900512695, 4.66067361831665, 4.8153157234191895, 4.9699578285217285]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 8.0, 7.0, 9.0, 15.0, 20.0, 46.0, 60.0, 72.0, 128.0, 167.0, 294.0, 439.0, 659.0, 1162.0, 1853.0, 2914.0, 5021.0, 8364.0, 14458.0, 25868.0, 46923.0, 88425.0, 167392.0, 311332.0, 521665.0, 718165.0, 762541.0, 619107.0, 403294.0, 227633.0, 120956.0, 64211.0, 34775.0, 19219.0, 10934.0, 6307.0, 3820.0, 2326.0, 1336.0, 892.0, 510.0, 315.0, 227.0, 149.0, 103.0, 63.0, 45.0, 20.0, 21.0, 8.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.826171875, -3.707489013671875, -3.58880615234375, -3.470123291015625, -3.3514404296875, -3.232757568359375, -3.11407470703125, -2.995391845703125, -2.876708984375, -2.758026123046875, -2.63934326171875, -2.520660400390625, -2.4019775390625, -2.283294677734375, -2.16461181640625, -2.045928955078125, -1.92724609375, -1.808563232421875, -1.68988037109375, -1.571197509765625, -1.4525146484375, -1.333831787109375, -1.21514892578125, -1.096466064453125, -0.977783203125, -0.859100341796875, -0.74041748046875, -0.621734619140625, -0.5030517578125, -0.384368896484375, -0.26568603515625, -0.147003173828125, -0.0283203125, 0.090362548828125, 0.20904541015625, 0.327728271484375, 0.4464111328125, 0.565093994140625, 0.68377685546875, 0.802459716796875, 0.921142578125, 1.039825439453125, 1.15850830078125, 1.277191162109375, 1.3958740234375, 1.514556884765625, 1.63323974609375, 1.751922607421875, 1.87060546875, 1.989288330078125, 2.10797119140625, 2.226654052734375, 2.3453369140625, 2.464019775390625, 2.58270263671875, 2.701385498046875, 2.820068359375, 2.938751220703125, 3.05743408203125, 3.176116943359375, 3.2947998046875, 3.413482666015625, 3.53216552734375, 3.650848388671875, 3.76953125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 8.0, 8.0, 13.0, 9.0, 16.0, 12.0, 20.0, 13.0, 19.0, 15.0, 33.0, 31.0, 32.0, 30.0, 22.0, 27.0, 31.0, 37.0, 43.0, 25.0, 49.0, 28.0, 45.0, 39.0, 37.0, 34.0, 31.0, 27.0, 32.0, 35.0, 20.0, 30.0, 22.0, 11.0, 12.0, 9.0, 16.0, 10.0, 8.0, 11.0, 9.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.87890625, -3.75872802734375, -3.6385498046875, -3.51837158203125, -3.398193359375, -3.27801513671875, -3.1578369140625, -3.03765869140625, -2.91748046875, -2.79730224609375, -2.6771240234375, -2.55694580078125, -2.436767578125, -2.31658935546875, -2.1964111328125, -2.07623291015625, -1.9560546875, -1.83587646484375, -1.7156982421875, -1.59552001953125, -1.475341796875, -1.35516357421875, -1.2349853515625, -1.11480712890625, -0.99462890625, -0.87445068359375, -0.7542724609375, -0.63409423828125, -0.513916015625, -0.39373779296875, -0.2735595703125, -0.15338134765625, -0.033203125, 0.08697509765625, 0.2071533203125, 0.32733154296875, 0.447509765625, 0.56768798828125, 0.6878662109375, 0.80804443359375, 0.92822265625, 1.04840087890625, 1.1685791015625, 1.28875732421875, 1.408935546875, 1.52911376953125, 1.6492919921875, 1.76947021484375, 1.8896484375, 2.00982666015625, 2.1300048828125, 2.25018310546875, 2.370361328125, 2.49053955078125, 2.6107177734375, 2.73089599609375, 2.85107421875, 2.97125244140625, 3.0914306640625, 3.21160888671875, 3.331787109375, 3.45196533203125, 3.5721435546875, 3.69232177734375, 3.8125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 3.0, 0.0, 10.0, 12.0, 21.0, 19.0, 53.0, 100.0, 139.0, 201.0, 293.0, 464.0, 693.0, 1205.0, 1951.0, 3078.0, 5060.0, 8458.0, 14085.0, 23353.0, 40170.0, 68439.0, 115537.0, 193743.0, 313634.0, 475423.0, 628638.0, 674546.0, 572039.0, 406812.0, 259965.0, 157344.0, 93431.0, 55099.0, 32226.0, 19010.0, 11335.0, 6887.0, 4143.0, 2456.0, 1607.0, 1000.0, 576.0, 358.0, 227.0, 159.0, 101.0, 67.0, 51.0, 25.0, 27.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8203125, -3.6942138671875, -3.568115234375, -3.4420166015625, -3.31591796875, -3.1898193359375, -3.063720703125, -2.9376220703125, -2.8115234375, -2.6854248046875, -2.559326171875, -2.4332275390625, -2.30712890625, -2.1810302734375, -2.054931640625, -1.9288330078125, -1.802734375, -1.6766357421875, -1.550537109375, -1.4244384765625, -1.29833984375, -1.1722412109375, -1.046142578125, -0.9200439453125, -0.7939453125, -0.6678466796875, -0.541748046875, -0.4156494140625, -0.28955078125, -0.1634521484375, -0.037353515625, 0.0887451171875, 0.21484375, 0.3409423828125, 0.467041015625, 0.5931396484375, 0.71923828125, 0.8453369140625, 0.971435546875, 1.0975341796875, 1.2236328125, 1.3497314453125, 1.475830078125, 1.6019287109375, 1.72802734375, 1.8541259765625, 1.980224609375, 2.1063232421875, 2.232421875, 2.3585205078125, 2.484619140625, 2.6107177734375, 2.73681640625, 2.8629150390625, 2.989013671875, 3.1151123046875, 3.2412109375, 3.3673095703125, 3.493408203125, 3.6195068359375, 3.74560546875, 3.8717041015625, 3.997802734375, 4.1239013671875, 4.25]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 7.0, 7.0, 8.0, 2.0, 7.0, 6.0, 8.0, 11.0, 16.0, 25.0, 31.0, 45.0, 35.0, 51.0, 68.0, 74.0, 90.0, 113.0, 146.0, 154.0, 167.0, 195.0, 200.0, 227.0, 231.0, 216.0, 246.0, 227.0, 203.0, 213.0, 167.0, 152.0, 131.0, 102.0, 100.0, 82.0, 85.0, 41.0, 37.0, 32.0, 30.0, 17.0, 17.0, 13.0, 10.0, 8.0, 7.0, 7.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.541015625, -1.4871826171875, -1.433349609375, -1.3795166015625, -1.32568359375, -1.2718505859375, -1.218017578125, -1.1641845703125, -1.1103515625, -1.0565185546875, -1.002685546875, -0.9488525390625, -0.89501953125, -0.8411865234375, -0.787353515625, -0.7335205078125, -0.6796875, -0.6258544921875, -0.572021484375, -0.5181884765625, -0.46435546875, -0.4105224609375, -0.356689453125, -0.3028564453125, -0.2490234375, -0.1951904296875, -0.141357421875, -0.0875244140625, -0.03369140625, 0.0201416015625, 0.073974609375, 0.1278076171875, 0.181640625, 0.2354736328125, 0.289306640625, 0.3431396484375, 0.39697265625, 0.4508056640625, 0.504638671875, 0.5584716796875, 0.6123046875, 0.6661376953125, 0.719970703125, 0.7738037109375, 0.82763671875, 0.8814697265625, 0.935302734375, 0.9891357421875, 1.04296875, 1.0968017578125, 1.150634765625, 1.2044677734375, 1.25830078125, 1.3121337890625, 1.365966796875, 1.4197998046875, 1.4736328125, 1.5274658203125, 1.581298828125, 1.6351318359375, 1.68896484375, 1.7427978515625, 1.796630859375, 1.8504638671875, 1.904296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 10.0, 7.0, 13.0, 14.0, 11.0, 26.0, 28.0, 28.0, 32.0, 34.0, 30.0, 46.0, 47.0, 48.0, 53.0, 46.0, 42.0, 46.0, 58.0, 36.0, 42.0, 50.0, 35.0, 35.0, 17.0, 25.0, 22.0, 18.0, 15.0, 11.0, 12.0, 12.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.336487770080566, -4.20129919052124, -4.066110134124756, -3.9309213161468506, -3.7957324981689453, -3.660543918609619, -3.525355100631714, -3.3901662826538086, -3.2549774646759033, -3.119788646697998, -2.9845998287200928, -2.8494110107421875, -2.7142224311828613, -2.579033374786377, -2.443844795227051, -2.3086559772491455, -2.1734671592712402, -2.038278341293335, -1.9030895233154297, -1.767900824546814, -1.6327120065689087, -1.4975231885910034, -1.3623344898223877, -1.2271456718444824, -1.0919568538665771, -0.9567680358886719, -0.8215792775154114, -0.6863905191421509, -0.5512017011642456, -0.41601288318634033, -0.28082412481307983, -0.14563536643981934, -0.01044607162475586, 0.12474271655082703, 0.2599315047264099, 0.3951202929019928, 0.5303090810775757, 0.665497899055481, 0.8006866574287415, 0.935875415802002, 1.0710642337799072, 1.2062530517578125, 1.3414418697357178, 1.4766305685043335, 1.6118193864822388, 1.747008204460144, 1.8821969032287598, 2.017385721206665, 2.1525745391845703, 2.2877633571624756, 2.422952175140381, 2.558140993118286, 2.6933298110961914, 2.8285183906555176, 2.963707208633423, 3.098896026611328, 3.2340848445892334, 3.3692736625671387, 3.504462480545044, 3.639651298522949, 3.7748398780822754, 3.9100289344787598, 4.045217514038086, 4.18040657043457, 4.3155951499938965]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 5.0, 8.0, 7.0, 8.0, 6.0, 6.0, 8.0, 9.0, 11.0, 14.0, 15.0, 14.0, 23.0, 21.0, 29.0, 29.0, 21.0, 36.0, 35.0, 38.0, 40.0, 34.0, 35.0, 30.0, 38.0, 45.0, 28.0, 30.0, 42.0, 30.0, 20.0, 42.0, 28.0, 26.0, 31.0, 17.0, 25.0, 17.0, 11.0, 15.0, 13.0, 14.0, 11.0, 13.0, 9.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.2254228591918945, -4.087362289428711, -3.9493019580841064, -3.811241388320923, -3.6731810569763184, -3.5351204872131348, -3.397059917449951, -3.2589993476867676, -3.120939016342163, -2.9828784465789795, -2.844818115234375, -2.7067575454711914, -2.568696975708008, -2.4306366443634033, -2.2925760746002197, -2.1545157432556152, -2.0164551734924316, -1.8783947229385376, -1.7403342723846436, -1.60227370262146, -1.464213252067566, -1.3261528015136719, -1.1880922317504883, -1.0500317811965942, -0.9119713306427002, -0.7739108800888062, -0.6358503699302673, -0.4977898895740509, -0.3597294092178345, -0.22166895866394043, -0.08360844850540161, 0.05445206165313721, 0.19251251220703125, 0.3305729925632477, 0.4686334729194641, 0.6066939830780029, 0.744754433631897, 0.882814884185791, 1.0208754539489746, 1.1589359045028687, 1.2969963550567627, 1.4350568056106567, 1.5731172561645508, 1.7111778259277344, 1.8492382764816284, 1.9872987270355225, 2.125359296798706, 2.2634196281433105, 2.401480197906494, 2.5395407676696777, 2.6776010990142822, 2.815661668777466, 2.9537220001220703, 3.091782569885254, 3.2298431396484375, 3.367903709411621, 3.5059640407562256, 3.644024610519409, 3.7820849418640137, 3.9201455116271973, 4.058206081390381, 4.196266174316406, 4.33432674407959, 4.472387313842773, 4.610447883605957]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 9.0, 16.0, 8.0, 21.0, 30.0, 45.0, 61.0, 89.0, 137.0, 177.0, 299.0, 478.0, 688.0, 1194.0, 2021.0, 3539.0, 6368.0, 12033.0, 23271.0, 45822.0, 90603.0, 163339.0, 227768.0, 204964.0, 126699.0, 67087.0, 33646.0, 17502.0, 8988.0, 4835.0, 2633.0, 1577.0, 911.0, 599.0, 341.0, 237.0, 151.0, 111.0, 64.0, 50.0, 39.0, 29.0, 16.0, 22.0, 15.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.2608642578125, -1.217041015625, -1.1732177734375, -1.12939453125, -1.0855712890625, -1.041748046875, -0.9979248046875, -0.9541015625, -0.9102783203125, -0.866455078125, -0.8226318359375, -0.77880859375, -0.7349853515625, -0.691162109375, -0.6473388671875, -0.603515625, -0.5596923828125, -0.515869140625, -0.4720458984375, -0.42822265625, -0.3843994140625, -0.340576171875, -0.2967529296875, -0.2529296875, -0.2091064453125, -0.165283203125, -0.1214599609375, -0.07763671875, -0.0338134765625, 0.010009765625, 0.0538330078125, 0.09765625, 0.1414794921875, 0.185302734375, 0.2291259765625, 0.27294921875, 0.3167724609375, 0.360595703125, 0.4044189453125, 0.4482421875, 0.4920654296875, 0.535888671875, 0.5797119140625, 0.62353515625, 0.6673583984375, 0.711181640625, 0.7550048828125, 0.798828125, 0.8426513671875, 0.886474609375, 0.9302978515625, 0.97412109375, 1.0179443359375, 1.061767578125, 1.1055908203125, 1.1494140625, 1.1932373046875, 1.237060546875, 1.2808837890625, 1.32470703125, 1.3685302734375, 1.412353515625, 1.4561767578125, 1.5]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 9.0, 6.0, 11.0, 4.0, 9.0, 8.0, 16.0, 18.0, 13.0, 15.0, 26.0, 33.0, 26.0, 37.0, 33.0, 35.0, 41.0, 35.0, 38.0, 51.0, 43.0, 43.0, 48.0, 41.0, 28.0, 32.0, 37.0, 49.0, 27.0, 33.0, 16.0, 14.0, 21.0, 24.0, 17.0, 19.0, 6.0, 13.0, 5.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0703125, -4.90960693359375, -4.7489013671875, -4.58819580078125, -4.427490234375, -4.26678466796875, -4.1060791015625, -3.94537353515625, -3.78466796875, -3.62396240234375, -3.4632568359375, -3.30255126953125, -3.141845703125, -2.98114013671875, -2.8204345703125, -2.65972900390625, -2.4990234375, -2.33831787109375, -2.1776123046875, -2.01690673828125, -1.856201171875, -1.69549560546875, -1.5347900390625, -1.37408447265625, -1.21337890625, -1.05267333984375, -0.8919677734375, -0.73126220703125, -0.570556640625, -0.40985107421875, -0.2491455078125, -0.08843994140625, 0.072265625, 0.23297119140625, 0.3936767578125, 0.55438232421875, 0.715087890625, 0.87579345703125, 1.0364990234375, 1.19720458984375, 1.35791015625, 1.51861572265625, 1.6793212890625, 1.84002685546875, 2.000732421875, 2.16143798828125, 2.3221435546875, 2.48284912109375, 2.6435546875, 2.80426025390625, 2.9649658203125, 3.12567138671875, 3.286376953125, 3.44708251953125, 3.6077880859375, 3.76849365234375, 3.92919921875, 4.08990478515625, 4.2506103515625, 4.41131591796875, 4.572021484375, 4.73272705078125, 4.8934326171875, 5.05413818359375, 5.21484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 11.0, 14.0, 15.0, 26.0, 18.0, 29.0, 41.0, 65.0, 93.0, 106.0, 151.0, 218.0, 392.0, 662.0, 1398.0, 3103.0, 8354.0, 25357.0, 404555.0, 561223.0, 27035.0, 8992.0, 3341.0, 1458.0, 724.0, 380.0, 222.0, 156.0, 101.0, 69.0, 70.0, 36.0, 27.0, 20.0, 16.0, 19.0, 19.0, 3.0, 9.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.2265625, -5.05810546875, -4.8896484375, -4.72119140625, -4.552734375, -4.38427734375, -4.2158203125, -4.04736328125, -3.87890625, -3.71044921875, -3.5419921875, -3.37353515625, -3.205078125, -3.03662109375, -2.8681640625, -2.69970703125, -2.53125, -2.36279296875, -2.1943359375, -2.02587890625, -1.857421875, -1.68896484375, -1.5205078125, -1.35205078125, -1.18359375, -1.01513671875, -0.8466796875, -0.67822265625, -0.509765625, -0.34130859375, -0.1728515625, -0.00439453125, 0.1640625, 0.33251953125, 0.5009765625, 0.66943359375, 0.837890625, 1.00634765625, 1.1748046875, 1.34326171875, 1.51171875, 1.68017578125, 1.8486328125, 2.01708984375, 2.185546875, 2.35400390625, 2.5224609375, 2.69091796875, 2.859375, 3.02783203125, 3.1962890625, 3.36474609375, 3.533203125, 3.70166015625, 3.8701171875, 4.03857421875, 4.20703125, 4.37548828125, 4.5439453125, 4.71240234375, 4.880859375, 5.04931640625, 5.2177734375, 5.38623046875, 5.5546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 8.0, 8.0, 17.0, 10.0, 14.0, 13.0, 20.0, 24.0, 18.0, 24.0, 31.0, 33.0, 35.0, 31.0, 54.0, 47.0, 51.0, 52.0, 30.0, 44.0, 45.0, 36.0, 33.0, 37.0, 34.0, 28.0, 25.0, 21.0, 25.0, 20.0, 20.0, 24.0, 8.0, 13.0, 10.0, 13.0, 10.0, 6.0, 4.0, 2.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.505859375, -3.399383544921875, -3.29290771484375, -3.186431884765625, -3.0799560546875, -2.973480224609375, -2.86700439453125, -2.760528564453125, -2.654052734375, -2.547576904296875, -2.44110107421875, -2.334625244140625, -2.2281494140625, -2.121673583984375, -2.01519775390625, -1.908721923828125, -1.80224609375, -1.695770263671875, -1.58929443359375, -1.482818603515625, -1.3763427734375, -1.269866943359375, -1.16339111328125, -1.056915283203125, -0.950439453125, -0.843963623046875, -0.73748779296875, -0.631011962890625, -0.5245361328125, -0.418060302734375, -0.31158447265625, -0.205108642578125, -0.0986328125, 0.007843017578125, 0.11431884765625, 0.220794677734375, 0.3272705078125, 0.433746337890625, 0.54022216796875, 0.646697998046875, 0.753173828125, 0.859649658203125, 0.96612548828125, 1.072601318359375, 1.1790771484375, 1.285552978515625, 1.39202880859375, 1.498504638671875, 1.60498046875, 1.711456298828125, 1.81793212890625, 1.924407958984375, 2.0308837890625, 2.137359619140625, 2.24383544921875, 2.350311279296875, 2.456787109375, 2.563262939453125, 2.66973876953125, 2.776214599609375, 2.8826904296875, 2.989166259765625, 3.09564208984375, 3.202117919921875, 3.30859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 2.0, 6.0, 9.0, 4.0, 6.0, 12.0, 17.0, 21.0, 36.0, 41.0, 43.0, 73.0, 86.0, 113.0, 179.0, 221.0, 382.0, 457.0, 709.0, 1209.0, 2013.0, 3360.0, 5825.0, 10413.0, 19353.0, 47208.0, 721203.0, 172623.0, 28694.0, 14538.0, 7840.0, 4529.0, 2644.0, 1607.0, 937.0, 625.0, 447.0, 285.0, 224.0, 159.0, 108.0, 84.0, 47.0, 47.0, 26.0, 29.0, 19.0, 16.0, 5.0, 3.0, 7.0, 5.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.224365234375, -0.217071533203125, -0.20977783203125, -0.202484130859375, -0.1951904296875, -0.187896728515625, -0.18060302734375, -0.173309326171875, -0.166015625, -0.158721923828125, -0.15142822265625, -0.144134521484375, -0.1368408203125, -0.129547119140625, -0.12225341796875, -0.114959716796875, -0.107666015625, -0.100372314453125, -0.09307861328125, -0.085784912109375, -0.0784912109375, -0.071197509765625, -0.06390380859375, -0.056610107421875, -0.04931640625, -0.042022705078125, -0.03472900390625, -0.027435302734375, -0.0201416015625, -0.012847900390625, -0.00555419921875, 0.001739501953125, 0.009033203125, 0.016326904296875, 0.02362060546875, 0.030914306640625, 0.0382080078125, 0.045501708984375, 0.05279541015625, 0.060089111328125, 0.0673828125, 0.074676513671875, 0.08197021484375, 0.089263916015625, 0.0965576171875, 0.103851318359375, 0.11114501953125, 0.118438720703125, 0.125732421875, 0.133026123046875, 0.14031982421875, 0.147613525390625, 0.1549072265625, 0.162200927734375, 0.16949462890625, 0.176788330078125, 0.18408203125, 0.191375732421875, 0.19866943359375, 0.205963134765625, 0.2132568359375, 0.220550537109375, 0.22784423828125, 0.235137939453125, 0.242431640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 9.0, 6.0, 6.0, 10.0, 16.0, 18.0, 28.0, 34.0, 27.0, 42.0, 53.0, 56.0, 66.0, 55.0, 87.0, 54.0, 66.0, 62.0, 51.0, 54.0, 41.0, 29.0, 24.0, 23.0, 18.0, 13.0, 8.0, 8.0, 3.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1576881408691406e-05, -2.091936767101288e-05, -2.026185393333435e-05, -1.9604340195655823e-05, -1.8946826457977295e-05, -1.8289312720298767e-05, -1.763179898262024e-05, -1.697428524494171e-05, -1.6316771507263184e-05, -1.5659257769584656e-05, -1.5001744031906128e-05, -1.43442302942276e-05, -1.3686716556549072e-05, -1.3029202818870544e-05, -1.2371689081192017e-05, -1.1714175343513489e-05, -1.1056661605834961e-05, -1.0399147868156433e-05, -9.741634130477905e-06, -9.084120392799377e-06, -8.42660665512085e-06, -7.769092917442322e-06, -7.111579179763794e-06, -6.454065442085266e-06, -5.796551704406738e-06, -5.1390379667282104e-06, -4.481524229049683e-06, -3.824010491371155e-06, -3.166496753692627e-06, -2.508983016014099e-06, -1.8514692783355713e-06, -1.1939555406570435e-06, -5.364418029785156e-07, 1.210719347000122e-07, 7.7858567237854e-07, 1.4360994100570679e-06, 2.0936131477355957e-06, 2.7511268854141235e-06, 3.4086406230926514e-06, 4.066154360771179e-06, 4.723668098449707e-06, 5.381181836128235e-06, 6.038695573806763e-06, 6.6962093114852905e-06, 7.353723049163818e-06, 8.011236786842346e-06, 8.668750524520874e-06, 9.326264262199402e-06, 9.98377799987793e-06, 1.0641291737556458e-05, 1.1298805475234985e-05, 1.1956319212913513e-05, 1.2613832950592041e-05, 1.3271346688270569e-05, 1.3928860425949097e-05, 1.4586374163627625e-05, 1.5243887901306152e-05, 1.590140163898468e-05, 1.6558915376663208e-05, 1.7216429114341736e-05, 1.7873942852020264e-05, 1.853145658969879e-05, 1.918897032737732e-05, 1.9846484065055847e-05, 2.0503997802734375e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 16.0, 20.0, 28.0, 52.0, 80.0, 108.0, 161.0, 251.0, 362.0, 543.0, 817.0, 1220.0, 1941.0, 3016.0, 4939.0, 7900.0, 12762.0, 21358.0, 34597.0, 55250.0, 84444.0, 121167.0, 154028.0, 157896.0, 130484.0, 92973.0, 61085.0, 38836.0, 23822.0, 14586.0, 8892.0, 5454.0, 3392.0, 2177.0, 1354.0, 863.0, 563.0, 360.0, 229.0, 161.0, 122.0, 77.0, 57.0, 30.0, 31.0, 15.0, 11.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.21728515625, -0.21030235290527344, -0.20331954956054688, -0.1963367462158203, -0.18935394287109375, -0.1823711395263672, -0.17538833618164062, -0.16840553283691406, -0.1614227294921875, -0.15443992614746094, -0.14745712280273438, -0.1404743194580078, -0.13349151611328125, -0.1265087127685547, -0.11952590942382812, -0.11254310607910156, -0.105560302734375, -0.09857749938964844, -0.09159469604492188, -0.08461189270019531, -0.07762908935546875, -0.07064628601074219, -0.06366348266601562, -0.05668067932128906, -0.0496978759765625, -0.04271507263183594, -0.035732269287109375, -0.028749465942382812, -0.02176666259765625, -0.014783859252929688, -0.007801055908203125, -0.0008182525634765625, 0.00616455078125, 0.013147354125976562, 0.020130157470703125, 0.027112960815429688, 0.03409576416015625, 0.04107856750488281, 0.048061370849609375, 0.05504417419433594, 0.0620269775390625, 0.06900978088378906, 0.07599258422851562, 0.08297538757324219, 0.08995819091796875, 0.09694099426269531, 0.10392379760742188, 0.11090660095214844, 0.117889404296875, 0.12487220764160156, 0.13185501098632812, 0.1388378143310547, 0.14582061767578125, 0.1528034210205078, 0.15978622436523438, 0.16676902770996094, 0.1737518310546875, 0.18073463439941406, 0.18771743774414062, 0.1947002410888672, 0.20168304443359375, 0.2086658477783203, 0.21564865112304688, 0.22263145446777344, 0.2296142578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 4.0, 5.0, 11.0, 8.0, 11.0, 11.0, 9.0, 19.0, 24.0, 34.0, 49.0, 35.0, 42.0, 34.0, 43.0, 37.0, 38.0, 38.0, 50.0, 35.0, 46.0, 38.0, 44.0, 34.0, 50.0, 32.0, 31.0, 31.0, 26.0, 33.0, 21.0, 22.0, 13.0, 9.0, 3.0, 12.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09735107421875, -0.09438514709472656, -0.09141921997070312, -0.08845329284667969, -0.08548736572265625, -0.08252143859863281, -0.07955551147460938, -0.07658958435058594, -0.0736236572265625, -0.07065773010253906, -0.06769180297851562, -0.06472587585449219, -0.06175994873046875, -0.05879402160644531, -0.055828094482421875, -0.05286216735839844, -0.049896240234375, -0.04693031311035156, -0.043964385986328125, -0.04099845886230469, -0.03803253173828125, -0.03506660461425781, -0.032100677490234375, -0.029134750366210938, -0.0261688232421875, -0.023202896118164062, -0.020236968994140625, -0.017271041870117188, -0.01430511474609375, -0.011339187622070312, -0.008373260498046875, -0.0054073333740234375, -0.00244140625, 0.0005245208740234375, 0.003490447998046875, 0.0064563751220703125, 0.00942230224609375, 0.012388229370117188, 0.015354156494140625, 0.018320083618164062, 0.0212860107421875, 0.024251937866210938, 0.027217864990234375, 0.030183792114257812, 0.03314971923828125, 0.03611564636230469, 0.039081573486328125, 0.04204750061035156, 0.045013427734375, 0.04797935485839844, 0.050945281982421875, 0.05391120910644531, 0.05687713623046875, 0.05984306335449219, 0.06280899047851562, 0.06577491760253906, 0.0687408447265625, 0.07170677185058594, 0.07467269897460938, 0.07763862609863281, 0.08060455322265625, 0.08357048034667969, 0.08653640747070312, 0.08950233459472656, 0.09246826171875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 9.0, 1.0, 2.0, 10.0, 9.0, 19.0, 11.0, 13.0, 17.0, 23.0, 19.0, 28.0, 39.0, 28.0, 36.0, 45.0, 49.0, 43.0, 56.0, 37.0, 42.0, 46.0, 54.0, 46.0, 42.0, 40.0, 35.0, 37.0, 18.0, 22.0, 25.0, 15.0, 17.0, 9.0, 11.0, 16.0, 6.0, 9.0, 4.0, 1.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.275643825531006, -4.145768642425537, -4.015893459320068, -3.8860180377960205, -3.7561428546905518, -3.626267671585083, -3.496392250061035, -3.3665170669555664, -3.2366418838500977, -3.106766700744629, -2.97689151763916, -2.8470160961151123, -2.7171409130096436, -2.587265729904175, -2.457390308380127, -2.327515125274658, -2.1976399421691895, -2.0677647590637207, -1.9378894567489624, -1.808014154434204, -1.6781389713287354, -1.5482637882232666, -1.4183884859085083, -1.28851318359375, -1.1586380004882812, -1.0287628173828125, -0.8988875150680542, -0.7690122723579407, -0.6391370296478271, -0.5092617869377136, -0.3793865442276001, -0.24951130151748657, -0.11963653564453125, 0.010238707065582275, 0.1401139497756958, 0.2699891924858093, 0.39986443519592285, 0.5297396779060364, 0.6596149206161499, 0.7894901633262634, 0.919365406036377, 1.0492405891418457, 1.179115891456604, 1.3089911937713623, 1.438866376876831, 1.5687415599822998, 1.698616862297058, 1.8284921646118164, 1.9583673477172852, 2.088242530822754, 2.2181177139282227, 2.3479931354522705, 2.4778683185577393, 2.607743501663208, 2.737618923187256, 2.8674941062927246, 2.9973692893981934, 3.127244472503662, 3.257119655609131, 3.3869950771331787, 3.5168702602386475, 3.646745443344116, 3.776620864868164, 3.906496047973633, 4.036371231079102]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 7.0, 7.0, 9.0, 5.0, 5.0, 10.0, 8.0, 11.0, 19.0, 14.0, 18.0, 18.0, 29.0, 30.0, 26.0, 25.0, 33.0, 40.0, 37.0, 37.0, 35.0, 34.0, 29.0, 47.0, 30.0, 31.0, 38.0, 41.0, 17.0, 34.0, 32.0, 30.0, 21.0, 31.0, 19.0, 23.0, 13.0, 14.0, 14.0, 9.0, 18.0, 13.0, 7.0, 6.0, 11.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.095715045928955, -3.959784746170044, -3.823854446411133, -3.6879239082336426, -3.5519936084747314, -3.4160633087158203, -3.28013277053833, -3.144202470779419, -3.008272171020508, -2.8723418712615967, -2.7364115715026855, -2.6004810333251953, -2.464550733566284, -2.328620433807373, -2.192689895629883, -2.0567595958709717, -1.9208292961120605, -1.7848989963531494, -1.6489685773849487, -1.513038158416748, -1.377107858657837, -1.2411775588989258, -1.105247139930725, -0.9693167805671692, -0.8333864212036133, -0.6974560618400574, -0.5615257024765015, -0.42559534311294556, -0.28966498374938965, -0.15373462438583374, -0.017804265022277832, 0.11812609434127808, 0.254056453704834, 0.3899868130683899, 0.5259171724319458, 0.6618475317955017, 0.7977778911590576, 0.9337082505226135, 1.0696386098861694, 1.2055690288543701, 1.3414993286132812, 1.4774296283721924, 1.613360047340393, 1.7492904663085938, 1.8852207660675049, 2.021151065826416, 2.1570816040039062, 2.2930119037628174, 2.4289422035217285, 2.5648725032806396, 2.700802803039551, 2.836733341217041, 2.972663640975952, 3.1085939407348633, 3.2445244789123535, 3.3804547786712646, 3.516385078430176, 3.652315378189087, 3.788245677947998, 3.9241762161254883, 4.06010627746582, 4.1960368156433105, 4.331967353820801, 4.467897415161133, 4.603827953338623]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 11.0, 15.0, 20.0, 34.0, 57.0, 104.0, 170.0, 287.0, 436.0, 648.0, 1037.0, 1654.0, 2538.0, 3926.0, 6156.0, 9672.0, 14567.0, 21221.0, 31418.0, 43730.0, 58599.0, 75715.0, 91020.0, 104108.0, 107725.0, 103856.0, 92171.0, 76495.0, 60373.0, 44633.0, 31802.0, 22059.0, 14791.0, 9916.0, 6323.0, 4077.0, 2686.0, 1710.0, 1062.0, 694.0, 371.0, 253.0, 145.0, 115.0, 59.0, 41.0, 20.0, 13.0, 10.0, 8.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.80078125, -2.717254638671875, -2.63372802734375, -2.550201416015625, -2.4666748046875, -2.383148193359375, -2.29962158203125, -2.216094970703125, -2.132568359375, -2.049041748046875, -1.96551513671875, -1.881988525390625, -1.7984619140625, -1.714935302734375, -1.63140869140625, -1.547882080078125, -1.46435546875, -1.380828857421875, -1.29730224609375, -1.213775634765625, -1.1302490234375, -1.046722412109375, -0.96319580078125, -0.879669189453125, -0.796142578125, -0.712615966796875, -0.62908935546875, -0.545562744140625, -0.4620361328125, -0.378509521484375, -0.29498291015625, -0.211456298828125, -0.1279296875, -0.044403076171875, 0.03912353515625, 0.122650146484375, 0.2061767578125, 0.289703369140625, 0.37322998046875, 0.456756591796875, 0.540283203125, 0.623809814453125, 0.70733642578125, 0.790863037109375, 0.8743896484375, 0.957916259765625, 1.04144287109375, 1.124969482421875, 1.20849609375, 1.292022705078125, 1.37554931640625, 1.459075927734375, 1.5426025390625, 1.626129150390625, 1.70965576171875, 1.793182373046875, 1.876708984375, 1.960235595703125, 2.04376220703125, 2.127288818359375, 2.2108154296875, 2.294342041015625, 2.37786865234375, 2.461395263671875, 2.544921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 6.0, 5.0, 2.0, 10.0, 13.0, 6.0, 18.0, 12.0, 13.0, 14.0, 27.0, 27.0, 23.0, 25.0, 25.0, 32.0, 35.0, 36.0, 37.0, 42.0, 31.0, 36.0, 41.0, 30.0, 30.0, 30.0, 25.0, 37.0, 34.0, 32.0, 34.0, 28.0, 29.0, 19.0, 16.0, 21.0, 20.0, 11.0, 14.0, 8.0, 13.0, 14.0, 6.0, 9.0, 6.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.15234375, -4.01678466796875, -3.8812255859375, -3.74566650390625, -3.610107421875, -3.47454833984375, -3.3389892578125, -3.20343017578125, -3.06787109375, -2.93231201171875, -2.7967529296875, -2.66119384765625, -2.525634765625, -2.39007568359375, -2.2545166015625, -2.11895751953125, -1.9833984375, -1.84783935546875, -1.7122802734375, -1.57672119140625, -1.441162109375, -1.30560302734375, -1.1700439453125, -1.03448486328125, -0.89892578125, -0.76336669921875, -0.6278076171875, -0.49224853515625, -0.356689453125, -0.22113037109375, -0.0855712890625, 0.04998779296875, 0.185546875, 0.32110595703125, 0.4566650390625, 0.59222412109375, 0.727783203125, 0.86334228515625, 0.9989013671875, 1.13446044921875, 1.27001953125, 1.40557861328125, 1.5411376953125, 1.67669677734375, 1.812255859375, 1.94781494140625, 2.0833740234375, 2.21893310546875, 2.3544921875, 2.49005126953125, 2.6256103515625, 2.76116943359375, 2.896728515625, 3.03228759765625, 3.1678466796875, 3.30340576171875, 3.43896484375, 3.57452392578125, 3.7100830078125, 3.84564208984375, 3.981201171875, 4.11676025390625, 4.2523193359375, 4.38787841796875, 4.5234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 8.0, 10.0, 16.0, 24.0, 29.0, 71.0, 113.0, 210.0, 332.0, 519.0, 890.0, 1348.0, 2398.0, 3791.0, 5970.0, 9412.0, 14687.0, 22921.0, 34169.0, 49469.0, 68090.0, 89094.0, 107316.0, 117745.0, 116946.0, 105596.0, 87866.0, 66726.0, 48605.0, 33376.0, 21967.0, 14392.0, 9279.0, 5789.0, 3590.0, 2233.0, 1383.0, 812.0, 550.0, 338.0, 188.0, 109.0, 78.0, 44.0, 22.0, 26.0, 4.0, 10.0, 2.0, 0.0, 1.0, 0.0, 4.0], "bins": [-3.41796875, -3.320220947265625, -3.22247314453125, -3.124725341796875, -3.0269775390625, -2.929229736328125, -2.83148193359375, -2.733734130859375, -2.635986328125, -2.538238525390625, -2.44049072265625, -2.342742919921875, -2.2449951171875, -2.147247314453125, -2.04949951171875, -1.951751708984375, -1.85400390625, -1.756256103515625, -1.65850830078125, -1.560760498046875, -1.4630126953125, -1.365264892578125, -1.26751708984375, -1.169769287109375, -1.072021484375, -0.974273681640625, -0.87652587890625, -0.778778076171875, -0.6810302734375, -0.583282470703125, -0.48553466796875, -0.387786865234375, -0.2900390625, -0.192291259765625, -0.09454345703125, 0.003204345703125, 0.1009521484375, 0.198699951171875, 0.29644775390625, 0.394195556640625, 0.491943359375, 0.589691162109375, 0.68743896484375, 0.785186767578125, 0.8829345703125, 0.980682373046875, 1.07843017578125, 1.176177978515625, 1.27392578125, 1.371673583984375, 1.46942138671875, 1.567169189453125, 1.6649169921875, 1.762664794921875, 1.86041259765625, 1.958160400390625, 2.055908203125, 2.153656005859375, 2.25140380859375, 2.349151611328125, 2.4468994140625, 2.544647216796875, 2.64239501953125, 2.740142822265625, 2.837890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 8.0, 6.0, 8.0, 12.0, 13.0, 11.0, 17.0, 17.0, 29.0, 25.0, 26.0, 27.0, 43.0, 33.0, 45.0, 35.0, 42.0, 45.0, 36.0, 36.0, 44.0, 38.0, 49.0, 42.0, 38.0, 31.0, 31.0, 27.0, 18.0, 31.0, 19.0, 23.0, 18.0, 15.0, 9.0, 13.0, 9.0, 11.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.30859375, -3.208831787109375, -3.10906982421875, -3.009307861328125, -2.9095458984375, -2.809783935546875, -2.71002197265625, -2.610260009765625, -2.510498046875, -2.410736083984375, -2.31097412109375, -2.211212158203125, -2.1114501953125, -2.011688232421875, -1.91192626953125, -1.812164306640625, -1.71240234375, -1.612640380859375, -1.51287841796875, -1.413116455078125, -1.3133544921875, -1.213592529296875, -1.11383056640625, -1.014068603515625, -0.914306640625, -0.814544677734375, -0.71478271484375, -0.615020751953125, -0.5152587890625, -0.415496826171875, -0.31573486328125, -0.215972900390625, -0.1162109375, -0.016448974609375, 0.08331298828125, 0.183074951171875, 0.2828369140625, 0.382598876953125, 0.48236083984375, 0.582122802734375, 0.681884765625, 0.781646728515625, 0.88140869140625, 0.981170654296875, 1.0809326171875, 1.180694580078125, 1.28045654296875, 1.380218505859375, 1.47998046875, 1.579742431640625, 1.67950439453125, 1.779266357421875, 1.8790283203125, 1.978790283203125, 2.07855224609375, 2.178314208984375, 2.278076171875, 2.377838134765625, 2.47760009765625, 2.577362060546875, 2.6771240234375, 2.776885986328125, 2.87664794921875, 2.976409912109375, 3.076171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 14.0, 16.0, 29.0, 28.0, 53.0, 82.0, 162.0, 273.0, 461.0, 707.0, 1167.0, 1991.0, 3433.0, 5841.0, 10036.0, 16423.0, 27324.0, 43432.0, 65854.0, 93444.0, 119587.0, 136704.0, 135526.0, 118930.0, 92357.0, 65252.0, 42602.0, 26871.0, 16205.0, 9770.0, 5709.0, 3321.0, 1992.0, 1180.0, 716.0, 417.0, 244.0, 154.0, 87.0, 68.0, 42.0, 23.0, 11.0, 7.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2333984375, -1.1935882568359375, -1.153778076171875, -1.1139678955078125, -1.07415771484375, -1.0343475341796875, -0.994537353515625, -0.9547271728515625, -0.9149169921875, -0.8751068115234375, -0.835296630859375, -0.7954864501953125, -0.75567626953125, -0.7158660888671875, -0.676055908203125, -0.6362457275390625, -0.596435546875, -0.5566253662109375, -0.516815185546875, -0.4770050048828125, -0.43719482421875, -0.3973846435546875, -0.357574462890625, -0.3177642822265625, -0.2779541015625, -0.2381439208984375, -0.198333740234375, -0.1585235595703125, -0.11871337890625, -0.0789031982421875, -0.039093017578125, 0.0007171630859375, 0.04052734375, 0.0803375244140625, 0.120147705078125, 0.1599578857421875, 0.19976806640625, 0.2395782470703125, 0.279388427734375, 0.3191986083984375, 0.3590087890625, 0.3988189697265625, 0.438629150390625, 0.4784393310546875, 0.51824951171875, 0.5580596923828125, 0.597869873046875, 0.6376800537109375, 0.677490234375, 0.7173004150390625, 0.757110595703125, 0.7969207763671875, 0.83673095703125, 0.8765411376953125, 0.916351318359375, 0.9561614990234375, 0.9959716796875, 1.0357818603515625, 1.075592041015625, 1.1154022216796875, 1.15521240234375, 1.1950225830078125, 1.234832763671875, 1.2746429443359375, 1.314453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 13.0, 13.0, 14.0, 22.0, 21.0, 33.0, 27.0, 29.0, 42.0, 49.0, 47.0, 51.0, 61.0, 50.0, 57.0, 56.0, 51.0, 46.0, 40.0, 44.0, 45.0, 36.0, 22.0, 25.0, 29.0, 11.0, 9.0, 16.0, 9.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001493692398071289, -0.0001444350928068161, -0.0001395009458065033, -0.0001345667988061905, -0.00012963265180587769, -0.00012469850480556488, -0.00011976435780525208, -0.00011483021080493927, -0.00010989606380462646, -0.00010496191680431366, -0.00010002776980400085, -9.509362280368805e-05, -9.015947580337524e-05, -8.522532880306244e-05, -8.029118180274963e-05, -7.535703480243683e-05, -7.042288780212402e-05, -6.548874080181122e-05, -6.055459380149841e-05, -5.562044680118561e-05, -5.06862998008728e-05, -4.575215280056e-05, -4.081800580024719e-05, -3.588385879993439e-05, -3.094971179962158e-05, -2.6015564799308777e-05, -2.108141779899597e-05, -1.6147270798683167e-05, -1.1213123798370361e-05, -6.278976798057556e-06, -1.344829797744751e-06, 3.589317202568054e-06, 8.52346420288086e-06, 1.3457611203193665e-05, 1.839175820350647e-05, 2.3325905203819275e-05, 2.826005220413208e-05, 3.3194199204444885e-05, 3.812834620475769e-05, 4.3062493205070496e-05, 4.79966402053833e-05, 5.2930787205696106e-05, 5.786493420600891e-05, 6.279908120632172e-05, 6.773322820663452e-05, 7.266737520694733e-05, 7.760152220726013e-05, 8.253566920757294e-05, 8.746981620788574e-05, 9.240396320819855e-05, 9.733811020851135e-05, 0.00010227225720882416, 0.00010720640420913696, 0.00011214055120944977, 0.00011707469820976257, 0.00012200884521007538, 0.00012694299221038818, 0.000131877139210701, 0.0001368112862110138, 0.0001417454332113266, 0.0001466795802116394, 0.0001516137272119522, 0.00015654787421226501, 0.00016148202121257782, 0.00016641616821289062]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 11.0, 15.0, 23.0, 30.0, 45.0, 71.0, 130.0, 179.0, 323.0, 505.0, 828.0, 1380.0, 2291.0, 4003.0, 6482.0, 10755.0, 18084.0, 29045.0, 45545.0, 67861.0, 93790.0, 118026.0, 133707.0, 132126.0, 115536.0, 90535.0, 64418.0, 43449.0, 27213.0, 17025.0, 10092.0, 6086.0, 3467.0, 2124.0, 1281.0, 825.0, 449.0, 302.0, 162.0, 111.0, 78.0, 47.0, 33.0, 22.0, 14.0, 13.0, 5.0, 7.0, 9.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.37109375, -1.3306884765625, -1.290283203125, -1.2498779296875, -1.20947265625, -1.1690673828125, -1.128662109375, -1.0882568359375, -1.0478515625, -1.0074462890625, -0.967041015625, -0.9266357421875, -0.88623046875, -0.8458251953125, -0.805419921875, -0.7650146484375, -0.724609375, -0.6842041015625, -0.643798828125, -0.6033935546875, -0.56298828125, -0.5225830078125, -0.482177734375, -0.4417724609375, -0.4013671875, -0.3609619140625, -0.320556640625, -0.2801513671875, -0.23974609375, -0.1993408203125, -0.158935546875, -0.1185302734375, -0.078125, -0.0377197265625, 0.002685546875, 0.0430908203125, 0.08349609375, 0.1239013671875, 0.164306640625, 0.2047119140625, 0.2451171875, 0.2855224609375, 0.325927734375, 0.3663330078125, 0.40673828125, 0.4471435546875, 0.487548828125, 0.5279541015625, 0.568359375, 0.6087646484375, 0.649169921875, 0.6895751953125, 0.72998046875, 0.7703857421875, 0.810791015625, 0.8511962890625, 0.8916015625, 0.9320068359375, 0.972412109375, 1.0128173828125, 1.05322265625, 1.0936279296875, 1.134033203125, 1.1744384765625, 1.21484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 12.0, 8.0, 12.0, 19.0, 22.0, 21.0, 19.0, 19.0, 43.0, 27.0, 46.0, 53.0, 53.0, 52.0, 36.0, 51.0, 40.0, 47.0, 37.0, 36.0, 42.0, 34.0, 38.0, 36.0, 32.0, 21.0, 21.0, 24.0, 18.0, 15.0, 14.0, 14.0, 9.0, 7.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447509765625, -0.4318962097167969, -0.41628265380859375, -0.4006690979003906, -0.3850555419921875, -0.3694419860839844, -0.35382843017578125, -0.3382148742675781, -0.322601318359375, -0.3069877624511719, -0.29137420654296875, -0.2757606506347656, -0.2601470947265625, -0.24453353881835938, -0.22891998291015625, -0.21330642700195312, -0.19769287109375, -0.18207931518554688, -0.16646575927734375, -0.15085220336914062, -0.1352386474609375, -0.11962509155273438, -0.10401153564453125, -0.08839797973632812, -0.072784423828125, -0.057170867919921875, -0.04155731201171875, -0.025943756103515625, -0.0103302001953125, 0.005283355712890625, 0.02089691162109375, 0.036510467529296875, 0.0521240234375, 0.06773757934570312, 0.08335113525390625, 0.09896469116210938, 0.1145782470703125, 0.13019180297851562, 0.14580535888671875, 0.16141891479492188, 0.177032470703125, 0.19264602661132812, 0.20825958251953125, 0.22387313842773438, 0.2394866943359375, 0.2551002502441406, 0.27071380615234375, 0.2863273620605469, 0.30194091796875, 0.3175544738769531, 0.33316802978515625, 0.3487815856933594, 0.3643951416015625, 0.3800086975097656, 0.39562225341796875, 0.4112358093261719, 0.426849365234375, 0.4424629211425781, 0.45807647705078125, 0.4736900329589844, 0.4893035888671875, 0.5049171447753906, 0.5205307006835938, 0.5361442565917969, 0.5517578125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 8.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 12.0, 17.0, 24.0, 27.0, 26.0, 40.0, 38.0, 37.0, 48.0, 51.0, 52.0, 49.0, 42.0, 53.0, 36.0, 54.0, 57.0, 55.0, 46.0, 35.0, 29.0, 25.0, 19.0, 16.0, 17.0, 16.0, 17.0, 4.0, 10.0, 6.0, 2.0, 6.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9852094650268555, -4.84262752532959, -4.700045585632324, -4.557464122772217, -4.414882183074951, -4.2723002433776855, -4.12971830368042, -3.9871363639831543, -3.8445546627044678, -3.701972723007202, -3.5593910217285156, -3.41680908203125, -3.2742271423339844, -3.131645441055298, -2.9890635013580322, -2.8464818000793457, -2.70389986038208, -2.5613179206848145, -2.418736219406128, -2.2761542797088623, -2.133572578430176, -1.9909906387329102, -1.8484086990356445, -1.7058268785476685, -1.5632450580596924, -1.4206632375717163, -1.2780814170837402, -1.1354994773864746, -0.9929176568984985, -0.8503358364105225, -0.7077539563179016, -0.5651720762252808, -0.4225897789001465, -0.280007928609848, -0.13742607831954956, 0.005155771970748901, 0.14773762226104736, 0.29031944274902344, 0.4329013228416443, 0.5754832029342651, 0.7180650234222412, 0.8606468439102173, 1.0032286643981934, 1.145810604095459, 1.288392424583435, 1.4309742450714111, 1.5735561847686768, 1.7161380052566528, 1.858719825744629, 2.0013017654418945, 2.143883466720581, 2.2864654064178467, 2.429047107696533, 2.571629047393799, 2.7142109870910645, 2.85679292678833, 2.9993746280670166, 3.1419565677642822, 3.2845382690429688, 3.4271202087402344, 3.5697021484375, 3.7122838497161865, 3.854865789413452, 3.9974474906921387, 4.140029430389404]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 8.0, 10.0, 9.0, 10.0, 11.0, 11.0, 15.0, 14.0, 19.0, 21.0, 28.0, 29.0, 17.0, 20.0, 41.0, 31.0, 31.0, 34.0, 42.0, 38.0, 37.0, 37.0, 46.0, 43.0, 43.0, 47.0, 34.0, 26.0, 26.0, 24.0, 30.0, 16.0, 21.0, 22.0, 16.0, 19.0, 17.0, 7.0, 9.0, 8.0, 11.0, 3.0, 4.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.297093391418457, -5.1462554931640625, -4.995417594909668, -4.844579696655273, -4.693741798400879, -4.542904376983643, -4.392066478729248, -4.2412285804748535, -4.090390682220459, -3.9395527839660645, -3.78871488571167, -3.6378772258758545, -3.48703932762146, -3.3362014293670654, -3.18536376953125, -3.0345258712768555, -2.883687973022461, -2.7328500747680664, -2.582012176513672, -2.4311745166778564, -2.280336618423462, -2.1294987201690674, -1.9786609411239624, -1.8278231620788574, -1.676985263824463, -1.5261473655700684, -1.3753095865249634, -1.2244718074798584, -1.0736339092254639, -0.9227960705757141, -0.7719582319259644, -0.6211204528808594, -0.47028207778930664, -0.3194442391395569, -0.16860640048980713, -0.017768561840057373, 0.13306927680969238, 0.28390711545944214, 0.4347449541091919, 0.5855827331542969, 0.7364206314086914, 0.8872584700584412, 1.038096308708191, 1.188934087753296, 1.3397719860076904, 1.490609884262085, 1.64144766330719, 1.792285442352295, 1.9431233406066895, 2.093961238861084, 2.2447991371154785, 2.395636796951294, 2.5464746952056885, 2.697312593460083, 2.8481502532958984, 2.998988151550293, 3.1498260498046875, 3.300663948059082, 3.4515018463134766, 3.602339506149292, 3.7531774044036865, 3.904015302658081, 4.0548529624938965, 4.205690860748291, 4.3565287590026855]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 11.0, 15.0, 18.0, 28.0, 39.0, 74.0, 93.0, 152.0, 209.0, 323.0, 470.0, 810.0, 1182.0, 1835.0, 2754.0, 4417.0, 7080.0, 10926.0, 18128.0, 30426.0, 51431.0, 88034.0, 153743.0, 260088.0, 413547.0, 574077.0, 664365.0, 626413.0, 487053.0, 324856.0, 196912.0, 113116.0, 65557.0, 37685.0, 22536.0, 13357.0, 8333.0, 5270.0, 3172.0, 1925.0, 1307.0, 867.0, 569.0, 358.0, 243.0, 159.0, 121.0, 75.0, 48.0, 27.0, 17.0, 23.0, 8.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.333984375, -3.2254638671875, -3.116943359375, -3.0084228515625, -2.89990234375, -2.7913818359375, -2.682861328125, -2.5743408203125, -2.4658203125, -2.3572998046875, -2.248779296875, -2.1402587890625, -2.03173828125, -1.9232177734375, -1.814697265625, -1.7061767578125, -1.59765625, -1.4891357421875, -1.380615234375, -1.2720947265625, -1.16357421875, -1.0550537109375, -0.946533203125, -0.8380126953125, -0.7294921875, -0.6209716796875, -0.512451171875, -0.4039306640625, -0.29541015625, -0.1868896484375, -0.078369140625, 0.0301513671875, 0.138671875, 0.2471923828125, 0.355712890625, 0.4642333984375, 0.57275390625, 0.6812744140625, 0.789794921875, 0.8983154296875, 1.0068359375, 1.1153564453125, 1.223876953125, 1.3323974609375, 1.44091796875, 1.5494384765625, 1.657958984375, 1.7664794921875, 1.875, 1.9835205078125, 2.092041015625, 2.2005615234375, 2.30908203125, 2.4176025390625, 2.526123046875, 2.6346435546875, 2.7431640625, 2.8516845703125, 2.960205078125, 3.0687255859375, 3.17724609375, 3.2857666015625, 3.394287109375, 3.5028076171875, 3.611328125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 5.0, 6.0, 5.0, 10.0, 8.0, 10.0, 16.0, 12.0, 17.0, 23.0, 17.0, 18.0, 28.0, 19.0, 31.0, 27.0, 31.0, 38.0, 29.0, 34.0, 48.0, 46.0, 35.0, 39.0, 44.0, 39.0, 57.0, 31.0, 25.0, 39.0, 25.0, 19.0, 22.0, 26.0, 20.0, 28.0, 9.0, 20.0, 11.0, 9.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 3.0, 6.0, 1.0, 2.0], "bins": [-4.91015625, -4.77490234375, -4.6396484375, -4.50439453125, -4.369140625, -4.23388671875, -4.0986328125, -3.96337890625, -3.828125, -3.69287109375, -3.5576171875, -3.42236328125, -3.287109375, -3.15185546875, -3.0166015625, -2.88134765625, -2.74609375, -2.61083984375, -2.4755859375, -2.34033203125, -2.205078125, -2.06982421875, -1.9345703125, -1.79931640625, -1.6640625, -1.52880859375, -1.3935546875, -1.25830078125, -1.123046875, -0.98779296875, -0.8525390625, -0.71728515625, -0.58203125, -0.44677734375, -0.3115234375, -0.17626953125, -0.041015625, 0.09423828125, 0.2294921875, 0.36474609375, 0.5, 0.63525390625, 0.7705078125, 0.90576171875, 1.041015625, 1.17626953125, 1.3115234375, 1.44677734375, 1.58203125, 1.71728515625, 1.8525390625, 1.98779296875, 2.123046875, 2.25830078125, 2.3935546875, 2.52880859375, 2.6640625, 2.79931640625, 2.9345703125, 3.06982421875, 3.205078125, 3.34033203125, 3.4755859375, 3.61083984375, 3.74609375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 7.0, 14.0, 16.0, 21.0, 47.0, 70.0, 100.0, 138.0, 279.0, 415.0, 707.0, 1211.0, 1958.0, 3388.0, 5953.0, 10591.0, 18642.0, 34205.0, 61187.0, 109536.0, 193523.0, 327550.0, 508321.0, 675302.0, 710119.0, 582112.0, 395828.0, 240508.0, 137640.0, 77583.0, 43046.0, 23555.0, 13165.0, 7448.0, 4165.0, 2427.0, 1393.0, 805.0, 487.0, 325.0, 184.0, 114.0, 77.0, 48.0, 36.0, 15.0, 9.0, 8.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.40625, -4.2650146484375, -4.123779296875, -3.9825439453125, -3.84130859375, -3.7000732421875, -3.558837890625, -3.4176025390625, -3.2763671875, -3.1351318359375, -2.993896484375, -2.8526611328125, -2.71142578125, -2.5701904296875, -2.428955078125, -2.2877197265625, -2.146484375, -2.0052490234375, -1.864013671875, -1.7227783203125, -1.58154296875, -1.4403076171875, -1.299072265625, -1.1578369140625, -1.0166015625, -0.8753662109375, -0.734130859375, -0.5928955078125, -0.45166015625, -0.3104248046875, -0.169189453125, -0.0279541015625, 0.11328125, 0.2545166015625, 0.395751953125, 0.5369873046875, 0.67822265625, 0.8194580078125, 0.960693359375, 1.1019287109375, 1.2431640625, 1.3843994140625, 1.525634765625, 1.6668701171875, 1.80810546875, 1.9493408203125, 2.090576171875, 2.2318115234375, 2.373046875, 2.5142822265625, 2.655517578125, 2.7967529296875, 2.93798828125, 3.0792236328125, 3.220458984375, 3.3616943359375, 3.5029296875, 3.6441650390625, 3.785400390625, 3.9266357421875, 4.06787109375, 4.2091064453125, 4.350341796875, 4.4915771484375, 4.6328125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 6.0, 5.0, 8.0, 15.0, 11.0, 28.0, 33.0, 43.0, 64.0, 75.0, 99.0, 109.0, 147.0, 153.0, 196.0, 225.0, 238.0, 230.0, 289.0, 255.0, 285.0, 264.0, 228.0, 201.0, 155.0, 140.0, 135.0, 106.0, 70.0, 73.0, 43.0, 38.0, 35.0, 22.0, 18.0, 8.0, 8.0, 5.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5, -2.4311676025390625, -2.362335205078125, -2.2935028076171875, -2.22467041015625, -2.1558380126953125, -2.087005615234375, -2.0181732177734375, -1.9493408203125, -1.8805084228515625, -1.811676025390625, -1.7428436279296875, -1.67401123046875, -1.6051788330078125, -1.536346435546875, -1.4675140380859375, -1.398681640625, -1.3298492431640625, -1.261016845703125, -1.1921844482421875, -1.12335205078125, -1.0545196533203125, -0.985687255859375, -0.9168548583984375, -0.8480224609375, -0.7791900634765625, -0.710357666015625, -0.6415252685546875, -0.57269287109375, -0.5038604736328125, -0.435028076171875, -0.3661956787109375, -0.29736328125, -0.2285308837890625, -0.159698486328125, -0.0908660888671875, -0.02203369140625, 0.0467987060546875, 0.115631103515625, 0.1844635009765625, 0.2532958984375, 0.3221282958984375, 0.390960693359375, 0.4597930908203125, 0.52862548828125, 0.5974578857421875, 0.666290283203125, 0.7351226806640625, 0.803955078125, 0.8727874755859375, 0.941619873046875, 1.0104522705078125, 1.07928466796875, 1.1481170654296875, 1.216949462890625, 1.2857818603515625, 1.3546142578125, 1.4234466552734375, 1.492279052734375, 1.5611114501953125, 1.62994384765625, 1.6987762451171875, 1.767608642578125, 1.8364410400390625, 1.9052734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 7.0, 2.0, 10.0, 9.0, 7.0, 13.0, 12.0, 16.0, 10.0, 19.0, 23.0, 13.0, 34.0, 29.0, 29.0, 46.0, 46.0, 37.0, 43.0, 48.0, 30.0, 55.0, 48.0, 42.0, 43.0, 47.0, 37.0, 31.0, 36.0, 24.0, 21.0, 18.0, 19.0, 6.0, 16.0, 8.0, 14.0, 11.0, 10.0, 3.0, 6.0, 5.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.257075786590576, -4.127053260803223, -3.9970312118530273, -3.867008924484253, -3.7369866371154785, -3.606964111328125, -3.4769418239593506, -3.346919536590576, -3.2168972492218018, -3.0868749618530273, -2.956852674484253, -2.8268303871154785, -2.696807861328125, -2.5667858123779297, -2.436763286590576, -2.3067409992218018, -2.1767187118530273, -2.046696424484253, -1.9166741371154785, -1.7866517305374146, -1.6566294431686401, -1.5266071557998657, -1.3965847492218018, -1.2665624618530273, -1.136540174484253, -1.0065178871154785, -0.8764955401420593, -0.7464731931686401, -0.6164509057998657, -0.4864286184310913, -0.3564062714576721, -0.22638392448425293, -0.09636211395263672, 0.03366020321846008, 0.16368252038955688, 0.2937048375606537, 0.4237271547317505, 0.5537494421005249, 0.6837717890739441, 0.8137941360473633, 0.9438164234161377, 1.073838710784912, 1.2038609981536865, 1.3338834047317505, 1.463905692100525, 1.5939279794692993, 1.7239503860473633, 1.8539726734161377, 1.983994960784912, 2.1140172481536865, 2.244039535522461, 2.3740618228912354, 2.5040841102600098, 2.6341066360473633, 2.7641289234161377, 2.894151210784912, 3.0241734981536865, 3.154195785522461, 3.2842180728912354, 3.4142403602600098, 3.5442628860473633, 3.6742849349975586, 3.804307460784912, 3.9343297481536865, 4.064352035522461]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 5.0, 13.0, 19.0, 17.0, 17.0, 15.0, 13.0, 24.0, 18.0, 33.0, 29.0, 31.0, 39.0, 31.0, 36.0, 31.0, 49.0, 33.0, 46.0, 45.0, 46.0, 39.0, 41.0, 39.0, 26.0, 30.0, 25.0, 24.0, 31.0, 16.0, 20.0, 9.0, 16.0, 17.0, 12.0, 11.0, 7.0, 8.0, 8.0, 3.0, 10.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.991561412811279, -4.837640285491943, -4.683719635009766, -4.52979850769043, -4.375877857208252, -4.221956729888916, -4.068036079406738, -3.9141149520874023, -3.7601940631866455, -3.6062731742858887, -3.452352285385132, -3.298431396484375, -3.144510269165039, -2.9905896186828613, -2.8366684913635254, -2.6827476024627686, -2.5288267135620117, -2.374905824661255, -2.220984935760498, -2.067064046859741, -1.9131430387496948, -1.759222149848938, -1.6053011417388916, -1.4513802528381348, -1.297459363937378, -1.143538475036621, -0.9896175265312195, -0.8356965780258179, -0.681775689125061, -0.5278548002243042, -0.3739338517189026, -0.22001290321350098, -0.06609249114990234, 0.08782842755317688, 0.2417493462562561, 0.3956702649593353, 0.5495911836624146, 0.7035120725631714, 0.857433021068573, 1.0113539695739746, 1.1652748584747314, 1.3191957473754883, 1.4731166362762451, 1.6270376443862915, 1.7809585332870483, 1.9348794221878052, 2.0888004302978516, 2.2427213191986084, 2.3966422080993652, 2.550563097000122, 2.704483985900879, 2.8584048748016357, 3.0123257637023926, 3.1662468910217285, 3.3201677799224854, 3.474088668823242, 3.628009557723999, 3.781930446624756, 3.9358513355255127, 4.0897722244262695, 4.2436933517456055, 4.397614002227783, 4.551535129547119, 4.705455780029297, 4.859376907348633]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 10.0, 14.0, 12.0, 24.0, 48.0, 72.0, 102.0, 164.0, 226.0, 297.0, 579.0, 861.0, 1464.0, 2441.0, 4224.0, 6932.0, 12041.0, 20775.0, 35963.0, 61427.0, 101338.0, 151015.0, 183919.0, 167209.0, 118391.0, 74073.0, 43843.0, 25325.0, 14693.0, 8535.0, 4827.0, 3006.0, 1793.0, 1074.0, 626.0, 415.0, 269.0, 168.0, 101.0, 88.0, 53.0, 36.0, 29.0, 29.0, 6.0, 3.0, 8.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.86328125, -0.83514404296875, -0.8070068359375, -0.77886962890625, -0.750732421875, -0.72259521484375, -0.6944580078125, -0.66632080078125, -0.63818359375, -0.61004638671875, -0.5819091796875, -0.55377197265625, -0.525634765625, -0.49749755859375, -0.4693603515625, -0.44122314453125, -0.4130859375, -0.38494873046875, -0.3568115234375, -0.32867431640625, -0.300537109375, -0.27239990234375, -0.2442626953125, -0.21612548828125, -0.18798828125, -0.15985107421875, -0.1317138671875, -0.10357666015625, -0.075439453125, -0.04730224609375, -0.0191650390625, 0.00897216796875, 0.037109375, 0.06524658203125, 0.0933837890625, 0.12152099609375, 0.149658203125, 0.17779541015625, 0.2059326171875, 0.23406982421875, 0.26220703125, 0.29034423828125, 0.3184814453125, 0.34661865234375, 0.374755859375, 0.40289306640625, 0.4310302734375, 0.45916748046875, 0.4873046875, 0.51544189453125, 0.5435791015625, 0.57171630859375, 0.599853515625, 0.62799072265625, 0.6561279296875, 0.68426513671875, 0.71240234375, 0.74053955078125, 0.7686767578125, 0.79681396484375, 0.824951171875, 0.85308837890625, 0.8812255859375, 0.90936279296875, 0.9375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 5.0, 12.0, 7.0, 13.0, 18.0, 15.0, 13.0, 12.0, 15.0, 18.0, 23.0, 20.0, 24.0, 36.0, 34.0, 25.0, 32.0, 35.0, 44.0, 37.0, 53.0, 40.0, 43.0, 39.0, 33.0, 41.0, 31.0, 24.0, 30.0, 28.0, 23.0, 30.0, 21.0, 18.0, 12.0, 8.0, 12.0, 12.0, 11.0, 8.0, 10.0, 7.0, 4.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 4.0], "bins": [-5.28125, -5.130615234375, -4.97998046875, -4.829345703125, -4.6787109375, -4.528076171875, -4.37744140625, -4.226806640625, -4.076171875, -3.925537109375, -3.77490234375, -3.624267578125, -3.4736328125, -3.322998046875, -3.17236328125, -3.021728515625, -2.87109375, -2.720458984375, -2.56982421875, -2.419189453125, -2.2685546875, -2.117919921875, -1.96728515625, -1.816650390625, -1.666015625, -1.515380859375, -1.36474609375, -1.214111328125, -1.0634765625, -0.912841796875, -0.76220703125, -0.611572265625, -0.4609375, -0.310302734375, -0.15966796875, -0.009033203125, 0.1416015625, 0.292236328125, 0.44287109375, 0.593505859375, 0.744140625, 0.894775390625, 1.04541015625, 1.196044921875, 1.3466796875, 1.497314453125, 1.64794921875, 1.798583984375, 1.94921875, 2.099853515625, 2.25048828125, 2.401123046875, 2.5517578125, 2.702392578125, 2.85302734375, 3.003662109375, 3.154296875, 3.304931640625, 3.45556640625, 3.606201171875, 3.7568359375, 3.907470703125, 4.05810546875, 4.208740234375, 4.359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 6.0, 5.0, 9.0, 11.0, 25.0, 34.0, 45.0, 65.0, 107.0, 195.0, 403.0, 1079.0, 3538.0, 13488.0, 70755.0, 907455.0, 38815.0, 8674.0, 2321.0, 784.0, 301.0, 177.0, 77.0, 51.0, 32.0, 22.0, 20.0, 6.0, 8.0, 3.0, 7.0, 3.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.83203125, -4.67791748046875, -4.5238037109375, -4.36968994140625, -4.215576171875, -4.06146240234375, -3.9073486328125, -3.75323486328125, -3.59912109375, -3.44500732421875, -3.2908935546875, -3.13677978515625, -2.982666015625, -2.82855224609375, -2.6744384765625, -2.52032470703125, -2.3662109375, -2.21209716796875, -2.0579833984375, -1.90386962890625, -1.749755859375, -1.59564208984375, -1.4415283203125, -1.28741455078125, -1.13330078125, -0.97918701171875, -0.8250732421875, -0.67095947265625, -0.516845703125, -0.36273193359375, -0.2086181640625, -0.05450439453125, 0.099609375, 0.25372314453125, 0.4078369140625, 0.56195068359375, 0.716064453125, 0.87017822265625, 1.0242919921875, 1.17840576171875, 1.33251953125, 1.48663330078125, 1.6407470703125, 1.79486083984375, 1.948974609375, 2.10308837890625, 2.2572021484375, 2.41131591796875, 2.5654296875, 2.71954345703125, 2.8736572265625, 3.02777099609375, 3.181884765625, 3.33599853515625, 3.4901123046875, 3.64422607421875, 3.79833984375, 3.95245361328125, 4.1065673828125, 4.26068115234375, 4.414794921875, 4.56890869140625, 4.7230224609375, 4.87713623046875, 5.03125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 10.0, 15.0, 9.0, 12.0, 18.0, 15.0, 18.0, 19.0, 24.0, 33.0, 39.0, 45.0, 42.0, 31.0, 40.0, 48.0, 50.0, 51.0, 43.0, 51.0, 46.0, 39.0, 46.0, 38.0, 36.0, 18.0, 23.0, 19.0, 17.0, 21.0, 15.0, 12.0, 11.0, 12.0, 13.0, 6.0, 5.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.44921875, -4.326141357421875, -4.20306396484375, -4.079986572265625, -3.9569091796875, -3.833831787109375, -3.71075439453125, -3.587677001953125, -3.464599609375, -3.341522216796875, -3.21844482421875, -3.095367431640625, -2.9722900390625, -2.849212646484375, -2.72613525390625, -2.603057861328125, -2.47998046875, -2.356903076171875, -2.23382568359375, -2.110748291015625, -1.9876708984375, -1.864593505859375, -1.74151611328125, -1.618438720703125, -1.495361328125, -1.372283935546875, -1.24920654296875, -1.126129150390625, -1.0030517578125, -0.879974365234375, -0.75689697265625, -0.633819580078125, -0.5107421875, -0.387664794921875, -0.26458740234375, -0.141510009765625, -0.0184326171875, 0.104644775390625, 0.22772216796875, 0.350799560546875, 0.473876953125, 0.596954345703125, 0.72003173828125, 0.843109130859375, 0.9661865234375, 1.089263916015625, 1.21234130859375, 1.335418701171875, 1.45849609375, 1.581573486328125, 1.70465087890625, 1.827728271484375, 1.9508056640625, 2.073883056640625, 2.19696044921875, 2.320037841796875, 2.443115234375, 2.566192626953125, 2.68927001953125, 2.812347412109375, 2.9354248046875, 3.058502197265625, 3.18157958984375, 3.304656982421875, 3.427734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 11.0, 14.0, 27.0, 29.0, 41.0, 79.0, 81.0, 154.0, 216.0, 373.0, 632.0, 1117.0, 2038.0, 4109.0, 8060.0, 16323.0, 36772.0, 641405.0, 278331.0, 30299.0, 14080.0, 6760.0, 3437.0, 1762.0, 941.0, 546.0, 296.0, 189.0, 137.0, 71.0, 68.0, 42.0, 23.0, 24.0, 16.0, 11.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.231689453125, -0.22418975830078125, -0.2166900634765625, -0.20919036865234375, -0.201690673828125, -0.19419097900390625, -0.1866912841796875, -0.17919158935546875, -0.17169189453125, -0.16419219970703125, -0.1566925048828125, -0.14919281005859375, -0.141693115234375, -0.13419342041015625, -0.1266937255859375, -0.11919403076171875, -0.1116943359375, -0.10419464111328125, -0.0966949462890625, -0.08919525146484375, -0.081695556640625, -0.07419586181640625, -0.0666961669921875, -0.05919647216796875, -0.05169677734375, -0.04419708251953125, -0.0366973876953125, -0.02919769287109375, -0.021697998046875, -0.01419830322265625, -0.0066986083984375, 0.00080108642578125, 0.00830078125, 0.01580047607421875, 0.0233001708984375, 0.03079986572265625, 0.038299560546875, 0.04579925537109375, 0.0532989501953125, 0.06079864501953125, 0.06829833984375, 0.07579803466796875, 0.0832977294921875, 0.09079742431640625, 0.098297119140625, 0.10579681396484375, 0.1132965087890625, 0.12079620361328125, 0.1282958984375, 0.13579559326171875, 0.1432952880859375, 0.15079498291015625, 0.158294677734375, 0.16579437255859375, 0.1732940673828125, 0.18079376220703125, 0.18829345703125, 0.19579315185546875, 0.2032928466796875, 0.21079254150390625, 0.218292236328125, 0.22579193115234375, 0.2332916259765625, 0.24079132080078125, 0.248291015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 13.0, 5.0, 10.0, 8.0, 12.0, 21.0, 14.0, 33.0, 22.0, 30.0, 41.0, 61.0, 50.0, 43.0, 56.0, 54.0, 68.0, 42.0, 40.0, 53.0, 55.0, 53.0, 39.0, 23.0, 26.0, 22.0, 23.0, 22.0, 10.0, 12.0, 12.0, 5.0, 6.0, 3.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1265277862548828e-05, -1.0919757187366486e-05, -1.0574236512184143e-05, -1.02287158370018e-05, -9.883195161819458e-06, -9.537674486637115e-06, -9.192153811454773e-06, -8.84663313627243e-06, -8.501112461090088e-06, -8.155591785907745e-06, -7.810071110725403e-06, -7.46455043554306e-06, -7.119029760360718e-06, -6.773509085178375e-06, -6.427988409996033e-06, -6.08246773481369e-06, -5.736947059631348e-06, -5.391426384449005e-06, -5.045905709266663e-06, -4.70038503408432e-06, -4.3548643589019775e-06, -4.009343683719635e-06, -3.6638230085372925e-06, -3.31830233335495e-06, -2.9727816581726074e-06, -2.627260982990265e-06, -2.2817403078079224e-06, -1.93621963262558e-06, -1.5906989574432373e-06, -1.2451782822608948e-06, -8.996576070785522e-07, -5.541369318962097e-07, -2.086162567138672e-07, 1.3690441846847534e-07, 4.824250936508179e-07, 8.279457688331604e-07, 1.173466444015503e-06, 1.5189871191978455e-06, 1.864507794380188e-06, 2.2100284695625305e-06, 2.555549144744873e-06, 2.9010698199272156e-06, 3.246590495109558e-06, 3.5921111702919006e-06, 3.937631845474243e-06, 4.283152520656586e-06, 4.628673195838928e-06, 4.974193871021271e-06, 5.319714546203613e-06, 5.665235221385956e-06, 6.010755896568298e-06, 6.356276571750641e-06, 6.701797246932983e-06, 7.047317922115326e-06, 7.3928385972976685e-06, 7.738359272480011e-06, 8.083879947662354e-06, 8.429400622844696e-06, 8.774921298027039e-06, 9.120441973209381e-06, 9.465962648391724e-06, 9.811483323574066e-06, 1.0157003998756409e-05, 1.0502524673938751e-05, 1.0848045349121094e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 12.0, 18.0, 25.0, 29.0, 26.0, 58.0, 100.0, 160.0, 196.0, 360.0, 547.0, 840.0, 1272.0, 2039.0, 3269.0, 5509.0, 8626.0, 13740.0, 22174.0, 35029.0, 54799.0, 82978.0, 119491.0, 152072.0, 156051.0, 129183.0, 92205.0, 60974.0, 39823.0, 25024.0, 15768.0, 9846.0, 6096.0, 3916.0, 2368.0, 1453.0, 923.0, 504.0, 377.0, 261.0, 140.0, 81.0, 74.0, 37.0, 23.0, 27.0, 17.0, 9.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.159912109375, -0.15477561950683594, -0.14963912963867188, -0.1445026397705078, -0.13936614990234375, -0.1342296600341797, -0.12909317016601562, -0.12395668029785156, -0.1188201904296875, -0.11368370056152344, -0.10854721069335938, -0.10341072082519531, -0.09827423095703125, -0.09313774108886719, -0.08800125122070312, -0.08286476135253906, -0.077728271484375, -0.07259178161621094, -0.06745529174804688, -0.06231880187988281, -0.05718231201171875, -0.05204582214355469, -0.046909332275390625, -0.04177284240722656, -0.0366363525390625, -0.03149986267089844, -0.026363372802734375, -0.021226882934570312, -0.01609039306640625, -0.010953903198242188, -0.005817413330078125, -0.0006809234619140625, 0.00445556640625, 0.009592056274414062, 0.014728546142578125, 0.019865036010742188, 0.02500152587890625, 0.030138015747070312, 0.035274505615234375, 0.04041099548339844, 0.0455474853515625, 0.05068397521972656, 0.055820465087890625, 0.06095695495605469, 0.06609344482421875, 0.07122993469238281, 0.07636642456054688, 0.08150291442871094, 0.086639404296875, 0.09177589416503906, 0.09691238403320312, 0.10204887390136719, 0.10718536376953125, 0.11232185363769531, 0.11745834350585938, 0.12259483337402344, 0.1277313232421875, 0.13286781311035156, 0.13800430297851562, 0.1431407928466797, 0.14827728271484375, 0.1534137725830078, 0.15855026245117188, 0.16368675231933594, 0.1688232421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 6.0, 3.0, 10.0, 4.0, 16.0, 11.0, 11.0, 17.0, 12.0, 21.0, 31.0, 36.0, 34.0, 44.0, 37.0, 33.0, 59.0, 48.0, 69.0, 52.0, 45.0, 59.0, 49.0, 46.0, 41.0, 22.0, 24.0, 31.0, 23.0, 11.0, 7.0, 16.0, 10.0, 13.0, 13.0, 3.0, 6.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.06591796875, -0.06386280059814453, -0.06180763244628906, -0.059752464294433594, -0.057697296142578125, -0.055642127990722656, -0.05358695983886719, -0.05153179168701172, -0.04947662353515625, -0.04742145538330078, -0.04536628723144531, -0.043311119079589844, -0.041255950927734375, -0.039200782775878906, -0.03714561462402344, -0.03509044647216797, -0.0330352783203125, -0.03098011016845703, -0.028924942016601562, -0.026869773864746094, -0.024814605712890625, -0.022759437561035156, -0.020704269409179688, -0.01864910125732422, -0.01659393310546875, -0.014538764953613281, -0.012483596801757812, -0.010428428649902344, -0.008373260498046875, -0.006318092346191406, -0.0042629241943359375, -0.0022077560424804688, -0.000152587890625, 0.0019025802612304688, 0.0039577484130859375, 0.006012916564941406, 0.008068084716796875, 0.010123252868652344, 0.012178421020507812, 0.014233589172363281, 0.01628875732421875, 0.01834392547607422, 0.020399093627929688, 0.022454261779785156, 0.024509429931640625, 0.026564598083496094, 0.028619766235351562, 0.03067493438720703, 0.0327301025390625, 0.03478527069091797, 0.03684043884277344, 0.038895606994628906, 0.040950775146484375, 0.043005943298339844, 0.04506111145019531, 0.04711627960205078, 0.04917144775390625, 0.05122661590576172, 0.05328178405761719, 0.055336952209472656, 0.057392120361328125, 0.059447288513183594, 0.06150245666503906, 0.06355762481689453, 0.06561279296875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 8.0, 5.0, 4.0, 9.0, 8.0, 11.0, 15.0, 16.0, 10.0, 15.0, 21.0, 19.0, 31.0, 31.0, 30.0, 46.0, 36.0, 44.0, 40.0, 53.0, 30.0, 42.0, 58.0, 45.0, 46.0, 45.0, 32.0, 39.0, 34.0, 27.0, 21.0, 21.0, 15.0, 11.0, 12.0, 14.0, 6.0, 10.0, 12.0, 7.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.430865287780762, -4.29975700378418, -4.168649196624756, -4.037540912628174, -3.906432867050171, -3.775324821472168, -3.644216537475586, -3.513108491897583, -3.38200044631958, -3.250892400741577, -3.119784116744995, -2.988676071166992, -2.8575680255889893, -2.7264599800109863, -2.5953516960144043, -2.4642436504364014, -2.3331353664398193, -2.2020273208618164, -2.0709190368652344, -1.9398109912872314, -1.8087029457092285, -1.677594780921936, -1.5464866161346436, -1.4153785705566406, -1.2842704057693481, -1.1531622409820557, -1.0220541954040527, -0.8909460306167603, -0.7598379254341125, -0.6287298202514648, -0.49762165546417236, -0.36651355028152466, -0.23540568351745605, -0.10429756343364716, 0.026810556650161743, 0.15791869163513184, 0.28902679681777954, 0.42013490200042725, 0.5512430667877197, 0.6823511719703674, 0.8134592771530151, 0.9445673823356628, 1.0756754875183105, 1.206783652305603, 1.3378918170928955, 1.4689998626708984, 1.600108027458191, 1.7312161922454834, 1.8623242378234863, 1.9934324026107788, 2.1245405673980713, 2.255648612976074, 2.386756658554077, 2.51786470413208, 2.648972988128662, 2.780081033706665, 2.911189079284668, 3.042297124862671, 3.173405408859253, 3.304513454437256, 3.435621500015259, 3.5667295455932617, 3.6978378295898438, 3.8289458751678467, 3.9600541591644287]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 10.0, 5.0, 11.0, 21.0, 15.0, 16.0, 16.0, 14.0, 24.0, 20.0, 28.0, 32.0, 31.0, 38.0, 30.0, 37.0, 35.0, 44.0, 32.0, 49.0, 44.0, 46.0, 37.0, 44.0, 39.0, 26.0, 30.0, 24.0, 22.0, 31.0, 16.0, 21.0, 12.0, 13.0, 19.0, 11.0, 11.0, 7.0, 10.0, 8.0, 4.0, 8.0, 1.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.994941711425781, -4.841762065887451, -4.688582897186279, -4.535403251647949, -4.382224082946777, -4.229044437408447, -4.075865268707275, -3.9226856231689453, -3.7695062160491943, -3.6163268089294434, -3.4631474018096924, -3.3099679946899414, -3.1567883491516113, -3.0036091804504395, -2.8504295349121094, -2.6972501277923584, -2.5440707206726074, -2.3908913135528564, -2.2377119064331055, -2.0845324993133545, -1.931352972984314, -1.778173565864563, -1.6249940395355225, -1.4718146324157715, -1.3186352252960205, -1.1654558181762695, -1.0122764110565186, -0.859096884727478, -0.705917477607727, -0.5527380704879761, -0.3995586037635803, -0.24637913703918457, -0.09319925308227539, 0.059980183839797974, 0.21315962076187134, 0.3663390576839447, 0.5195184946060181, 0.672697901725769, 0.8258773684501648, 0.9790568351745605, 1.1322362422943115, 1.2854156494140625, 1.4385950565338135, 1.591774582862854, 1.744953989982605, 1.898133397102356, 2.0513129234313965, 2.2044923305511475, 2.3576717376708984, 2.5108511447906494, 2.6640305519104004, 2.8172099590301514, 2.9703893661499023, 3.1235690116882324, 3.2767484188079834, 3.4299278259277344, 3.5831072330474854, 3.7362866401672363, 3.8894660472869873, 4.042645454406738, 4.195825099945068, 4.34900426864624, 4.50218391418457, 4.655363082885742, 4.808542728424072]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 10.0, 12.0, 9.0, 18.0, 24.0, 54.0, 98.0, 148.0, 209.0, 325.0, 498.0, 811.0, 1156.0, 1918.0, 2938.0, 4373.0, 6679.0, 10024.0, 14977.0, 21687.0, 30680.0, 42384.0, 57595.0, 73085.0, 88073.0, 99906.0, 104913.0, 102025.0, 92124.0, 77106.0, 61112.0, 46218.0, 33750.0, 23726.0, 16903.0, 11367.0, 7568.0, 4887.0, 3180.0, 2180.0, 1304.0, 903.0, 578.0, 391.0, 211.0, 141.0, 118.0, 65.0, 38.0, 34.0, 12.0, 11.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.548828125, -2.46826171875, -2.3876953125, -2.30712890625, -2.2265625, -2.14599609375, -2.0654296875, -1.98486328125, -1.904296875, -1.82373046875, -1.7431640625, -1.66259765625, -1.58203125, -1.50146484375, -1.4208984375, -1.34033203125, -1.259765625, -1.17919921875, -1.0986328125, -1.01806640625, -0.9375, -0.85693359375, -0.7763671875, -0.69580078125, -0.615234375, -0.53466796875, -0.4541015625, -0.37353515625, -0.29296875, -0.21240234375, -0.1318359375, -0.05126953125, 0.029296875, 0.10986328125, 0.1904296875, 0.27099609375, 0.3515625, 0.43212890625, 0.5126953125, 0.59326171875, 0.673828125, 0.75439453125, 0.8349609375, 0.91552734375, 0.99609375, 1.07666015625, 1.1572265625, 1.23779296875, 1.318359375, 1.39892578125, 1.4794921875, 1.56005859375, 1.640625, 1.72119140625, 1.8017578125, 1.88232421875, 1.962890625, 2.04345703125, 2.1240234375, 2.20458984375, 2.28515625, 2.36572265625, 2.4462890625, 2.52685546875, 2.607421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 10.0, 12.0, 10.0, 11.0, 9.0, 24.0, 22.0, 20.0, 17.0, 16.0, 36.0, 29.0, 34.0, 41.0, 42.0, 45.0, 44.0, 41.0, 36.0, 59.0, 41.0, 31.0, 39.0, 38.0, 23.0, 38.0, 24.0, 33.0, 26.0, 19.0, 14.0, 14.0, 18.0, 11.0, 17.0, 13.0, 9.0, 8.0, 6.0, 10.0, 1.0, 0.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9375, -4.77923583984375, -4.6209716796875, -4.46270751953125, -4.304443359375, -4.14617919921875, -3.9879150390625, -3.82965087890625, -3.67138671875, -3.51312255859375, -3.3548583984375, -3.19659423828125, -3.038330078125, -2.88006591796875, -2.7218017578125, -2.56353759765625, -2.4052734375, -2.24700927734375, -2.0887451171875, -1.93048095703125, -1.772216796875, -1.61395263671875, -1.4556884765625, -1.29742431640625, -1.13916015625, -0.98089599609375, -0.8226318359375, -0.66436767578125, -0.506103515625, -0.34783935546875, -0.1895751953125, -0.03131103515625, 0.126953125, 0.28521728515625, 0.4434814453125, 0.60174560546875, 0.760009765625, 0.91827392578125, 1.0765380859375, 1.23480224609375, 1.39306640625, 1.55133056640625, 1.7095947265625, 1.86785888671875, 2.026123046875, 2.18438720703125, 2.3426513671875, 2.50091552734375, 2.6591796875, 2.81744384765625, 2.9757080078125, 3.13397216796875, 3.292236328125, 3.45050048828125, 3.6087646484375, 3.76702880859375, 3.92529296875, 4.08355712890625, 4.2418212890625, 4.40008544921875, 4.558349609375, 4.71661376953125, 4.8748779296875, 5.03314208984375, 5.19140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 11.0, 7.0, 17.0, 42.0, 37.0, 83.0, 110.0, 159.0, 290.0, 438.0, 713.0, 1058.0, 1698.0, 2731.0, 4147.0, 6593.0, 9995.0, 15201.0, 23157.0, 33912.0, 48423.0, 65581.0, 84940.0, 101119.0, 112317.0, 112583.0, 103953.0, 88692.0, 69465.0, 51690.0, 36608.0, 25231.0, 16685.0, 11086.0, 7110.0, 4638.0, 2922.0, 1883.0, 1226.0, 749.0, 446.0, 301.0, 203.0, 107.0, 80.0, 38.0, 37.0, 21.0, 13.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.7568359375, -2.662109375, -2.5673828125, -2.47265625, -2.3779296875, -2.283203125, -2.1884765625, -2.09375, -1.9990234375, -1.904296875, -1.8095703125, -1.71484375, -1.6201171875, -1.525390625, -1.4306640625, -1.3359375, -1.2412109375, -1.146484375, -1.0517578125, -0.95703125, -0.8623046875, -0.767578125, -0.6728515625, -0.578125, -0.4833984375, -0.388671875, -0.2939453125, -0.19921875, -0.1044921875, -0.009765625, 0.0849609375, 0.1796875, 0.2744140625, 0.369140625, 0.4638671875, 0.55859375, 0.6533203125, 0.748046875, 0.8427734375, 0.9375, 1.0322265625, 1.126953125, 1.2216796875, 1.31640625, 1.4111328125, 1.505859375, 1.6005859375, 1.6953125, 1.7900390625, 1.884765625, 1.9794921875, 2.07421875, 2.1689453125, 2.263671875, 2.3583984375, 2.453125, 2.5478515625, 2.642578125, 2.7373046875, 2.83203125, 2.9267578125, 3.021484375, 3.1162109375, 3.2109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 5.0, 3.0, 5.0, 4.0, 10.0, 12.0, 7.0, 11.0, 24.0, 16.0, 24.0, 21.0, 19.0, 27.0, 26.0, 29.0, 45.0, 33.0, 35.0, 34.0, 34.0, 44.0, 46.0, 48.0, 43.0, 40.0, 43.0, 24.0, 39.0, 37.0, 31.0, 26.0, 19.0, 19.0, 19.0, 21.0, 18.0, 15.0, 10.0, 7.0, 5.0, 9.0, 7.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4609375, -3.357574462890625, -3.25421142578125, -3.150848388671875, -3.0474853515625, -2.944122314453125, -2.84075927734375, -2.737396240234375, -2.634033203125, -2.530670166015625, -2.42730712890625, -2.323944091796875, -2.2205810546875, -2.117218017578125, -2.01385498046875, -1.910491943359375, -1.80712890625, -1.703765869140625, -1.60040283203125, -1.497039794921875, -1.3936767578125, -1.290313720703125, -1.18695068359375, -1.083587646484375, -0.980224609375, -0.876861572265625, -0.77349853515625, -0.670135498046875, -0.5667724609375, -0.463409423828125, -0.36004638671875, -0.256683349609375, -0.1533203125, -0.049957275390625, 0.05340576171875, 0.156768798828125, 0.2601318359375, 0.363494873046875, 0.46685791015625, 0.570220947265625, 0.673583984375, 0.776947021484375, 0.88031005859375, 0.983673095703125, 1.0870361328125, 1.190399169921875, 1.29376220703125, 1.397125244140625, 1.50048828125, 1.603851318359375, 1.70721435546875, 1.810577392578125, 1.9139404296875, 2.017303466796875, 2.12066650390625, 2.224029541015625, 2.327392578125, 2.430755615234375, 2.53411865234375, 2.637481689453125, 2.7408447265625, 2.844207763671875, 2.94757080078125, 3.050933837890625, 3.154296875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 9.0, 19.0, 23.0, 52.0, 73.0, 109.0, 158.0, 234.0, 373.0, 585.0, 999.0, 1512.0, 2574.0, 4028.0, 6601.0, 10375.0, 16489.0, 25194.0, 37713.0, 54411.0, 74534.0, 96371.0, 113604.0, 121458.0, 117329.0, 102120.0, 81171.0, 59726.0, 42153.0, 28168.0, 18555.0, 11918.0, 7500.0, 4667.0, 2930.0, 1789.0, 1044.0, 733.0, 454.0, 294.0, 173.0, 109.0, 80.0, 55.0, 42.0, 13.0, 14.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.091796875, -1.058349609375, -1.02490234375, -0.991455078125, -0.9580078125, -0.924560546875, -0.89111328125, -0.857666015625, -0.82421875, -0.790771484375, -0.75732421875, -0.723876953125, -0.6904296875, -0.656982421875, -0.62353515625, -0.590087890625, -0.556640625, -0.523193359375, -0.48974609375, -0.456298828125, -0.4228515625, -0.389404296875, -0.35595703125, -0.322509765625, -0.2890625, -0.255615234375, -0.22216796875, -0.188720703125, -0.1552734375, -0.121826171875, -0.08837890625, -0.054931640625, -0.021484375, 0.011962890625, 0.04541015625, 0.078857421875, 0.1123046875, 0.145751953125, 0.17919921875, 0.212646484375, 0.24609375, 0.279541015625, 0.31298828125, 0.346435546875, 0.3798828125, 0.413330078125, 0.44677734375, 0.480224609375, 0.513671875, 0.547119140625, 0.58056640625, 0.614013671875, 0.6474609375, 0.680908203125, 0.71435546875, 0.747802734375, 0.78125, 0.814697265625, 0.84814453125, 0.881591796875, 0.9150390625, 0.948486328125, 0.98193359375, 1.015380859375, 1.048828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 6.0, 8.0, 1.0, 16.0, 12.0, 12.0, 14.0, 27.0, 28.0, 34.0, 32.0, 30.0, 37.0, 37.0, 42.0, 50.0, 63.0, 59.0, 50.0, 55.0, 47.0, 48.0, 43.0, 56.0, 29.0, 38.0, 24.0, 21.0, 13.0, 20.0, 11.0, 13.0, 8.0, 4.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001373291015625, -0.00013284571468830109, -0.00012836232781410217, -0.00012387894093990326, -0.00011939555406570435, -0.00011491216719150543, -0.00011042878031730652, -0.0001059453934431076, -0.00010146200656890869, -9.697861969470978e-05, -9.249523282051086e-05, -8.801184594631195e-05, -8.352845907211304e-05, -7.904507219791412e-05, -7.456168532371521e-05, -7.00782984495163e-05, -6.559491157531738e-05, -6.111152470111847e-05, -5.6628137826919556e-05, -5.214475095272064e-05, -4.766136407852173e-05, -4.3177977204322815e-05, -3.86945903301239e-05, -3.421120345592499e-05, -2.9727816581726074e-05, -2.524442970752716e-05, -2.0761042833328247e-05, -1.6277655959129333e-05, -1.179426908493042e-05, -7.310882210731506e-06, -2.8274953365325928e-06, 1.6558915376663208e-06, 6.139278411865234e-06, 1.0622665286064148e-05, 1.5106052160263062e-05, 1.9589439034461975e-05, 2.407282590866089e-05, 2.8556212782859802e-05, 3.3039599657058716e-05, 3.752298653125763e-05, 4.200637340545654e-05, 4.6489760279655457e-05, 5.097314715385437e-05, 5.5456534028053284e-05, 5.99399209022522e-05, 6.442330777645111e-05, 6.890669465065002e-05, 7.339008152484894e-05, 7.787346839904785e-05, 8.235685527324677e-05, 8.684024214744568e-05, 9.132362902164459e-05, 9.58070158958435e-05, 0.00010029040277004242, 0.00010477378964424133, 0.00010925717651844025, 0.00011374056339263916, 0.00011822395026683807, 0.000122707337141037, 0.0001271907240152359, 0.00013167411088943481, 0.00013615749776363373, 0.00014064088463783264, 0.00014512427151203156, 0.00014960765838623047]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 20.0, 28.0, 34.0, 57.0, 68.0, 114.0, 184.0, 280.0, 433.0, 640.0, 973.0, 1406.0, 2219.0, 3449.0, 5153.0, 7898.0, 11885.0, 17723.0, 26066.0, 37325.0, 51696.0, 68184.0, 85347.0, 99418.0, 108138.0, 107279.0, 99014.0, 84194.0, 66783.0, 50494.0, 36036.0, 25201.0, 17234.0, 11582.0, 7497.0, 5012.0, 3161.0, 2182.0, 1409.0, 926.0, 572.0, 441.0, 258.0, 183.0, 106.0, 93.0, 55.0, 36.0, 24.0, 17.0, 10.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.99365234375, -0.9615554809570312, -0.9294586181640625, -0.8973617553710938, -0.865264892578125, -0.8331680297851562, -0.8010711669921875, -0.7689743041992188, -0.73687744140625, -0.7047805786132812, -0.6726837158203125, -0.6405868530273438, -0.608489990234375, -0.5763931274414062, -0.5442962646484375, -0.5121994018554688, -0.4801025390625, -0.44800567626953125, -0.4159088134765625, -0.38381195068359375, -0.351715087890625, -0.31961822509765625, -0.2875213623046875, -0.25542449951171875, -0.22332763671875, -0.19123077392578125, -0.1591339111328125, -0.12703704833984375, -0.094940185546875, -0.06284332275390625, -0.0307464599609375, 0.00135040283203125, 0.033447265625, 0.06554412841796875, 0.0976409912109375, 0.12973785400390625, 0.161834716796875, 0.19393157958984375, 0.2260284423828125, 0.25812530517578125, 0.29022216796875, 0.32231903076171875, 0.3544158935546875, 0.38651275634765625, 0.418609619140625, 0.45070648193359375, 0.4828033447265625, 0.5149002075195312, 0.5469970703125, 0.5790939331054688, 0.6111907958984375, 0.6432876586914062, 0.675384521484375, 0.7074813842773438, 0.7395782470703125, 0.7716751098632812, 0.80377197265625, 0.8358688354492188, 0.8679656982421875, 0.9000625610351562, 0.932159423828125, 0.9642562866210938, 0.9963531494140625, 1.0284500122070312, 1.060546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 8.0, 10.0, 11.0, 16.0, 15.0, 12.0, 29.0, 24.0, 26.0, 28.0, 31.0, 38.0, 35.0, 29.0, 46.0, 24.0, 37.0, 39.0, 33.0, 30.0, 40.0, 35.0, 30.0, 32.0, 24.0, 32.0, 25.0, 30.0, 35.0, 25.0, 26.0, 24.0, 19.0, 13.0, 23.0, 9.0, 12.0, 11.0, 11.0, 8.0, 6.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335205078125, -0.3221893310546875, -0.309173583984375, -0.2961578369140625, -0.28314208984375, -0.2701263427734375, -0.257110595703125, -0.2440948486328125, -0.2310791015625, -0.2180633544921875, -0.205047607421875, -0.1920318603515625, -0.17901611328125, -0.1660003662109375, -0.152984619140625, -0.1399688720703125, -0.126953125, -0.1139373779296875, -0.100921630859375, -0.0879058837890625, -0.07489013671875, -0.0618743896484375, -0.048858642578125, -0.0358428955078125, -0.0228271484375, -0.0098114013671875, 0.003204345703125, 0.0162200927734375, 0.02923583984375, 0.0422515869140625, 0.055267333984375, 0.0682830810546875, 0.081298828125, 0.0943145751953125, 0.107330322265625, 0.1203460693359375, 0.13336181640625, 0.1463775634765625, 0.159393310546875, 0.1724090576171875, 0.1854248046875, 0.1984405517578125, 0.211456298828125, 0.2244720458984375, 0.23748779296875, 0.2505035400390625, 0.263519287109375, 0.2765350341796875, 0.28955078125, 0.3025665283203125, 0.315582275390625, 0.3285980224609375, 0.34161376953125, 0.3546295166015625, 0.367645263671875, 0.3806610107421875, 0.3936767578125, 0.4066925048828125, 0.419708251953125, 0.4327239990234375, 0.44573974609375, 0.4587554931640625, 0.471771240234375, 0.4847869873046875, 0.497802734375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 6.0, 7.0, 2.0, 13.0, 6.0, 9.0, 10.0, 14.0, 11.0, 8.0, 19.0, 24.0, 29.0, 25.0, 39.0, 35.0, 32.0, 36.0, 36.0, 43.0, 30.0, 48.0, 52.0, 45.0, 45.0, 48.0, 36.0, 38.0, 29.0, 23.0, 32.0, 31.0, 20.0, 15.0, 13.0, 12.0, 15.0, 11.0, 11.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.211418628692627, -4.087204933166504, -3.962991714477539, -3.838778257369995, -3.714564800262451, -3.590351104736328, -3.4661378860473633, -3.3419241905212402, -3.2177107334136963, -3.0934972763061523, -2.9692838191986084, -2.8450703620910645, -2.7208569049835205, -2.5966434478759766, -2.4724297523498535, -2.3482162952423096, -2.2240028381347656, -2.0997893810272217, -1.9755759239196777, -1.8513624668121338, -1.7271488904953003, -1.6029354333877563, -1.4787219762802124, -1.354508399963379, -1.230295181274414, -1.1060817241668701, -0.9818682074546814, -0.8576547503471375, -0.7334412336349487, -0.6092277765274048, -0.48501431941986084, -0.3608008027076721, -0.2365872859954834, -0.11237380653619766, 0.011839672923088074, 0.1360531449317932, 0.26026663184165955, 0.3844801187515259, 0.5086935758590698, 0.6329070925712585, 0.7571205496788025, 0.8813340067863464, 1.0055475234985352, 1.129760980606079, 1.253974437713623, 1.378187894821167, 1.502401351928711, 1.6266149282455444, 1.7508283853530884, 1.8750418424606323, 1.9992552995681763, 2.1234688758850098, 2.2476823329925537, 2.3718957901000977, 2.4961092472076416, 2.6203227043151855, 2.7445361614227295, 2.8687496185302734, 2.9929630756378174, 3.1171765327453613, 3.2413899898529053, 3.365603446960449, 3.4898171424865723, 3.614030599594116, 3.73824405670166]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 0.0, 2.0, 6.0, 6.0, 4.0, 8.0, 8.0, 9.0, 20.0, 13.0, 20.0, 23.0, 18.0, 21.0, 27.0, 30.0, 39.0, 38.0, 38.0, 41.0, 47.0, 42.0, 32.0, 36.0, 46.0, 36.0, 34.0, 33.0, 32.0, 25.0, 29.0, 31.0, 26.0, 37.0, 28.0, 15.0, 15.0, 19.0, 12.0, 8.0, 10.0, 10.0, 14.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.886139392852783, -4.7204108238220215, -4.55468225479126, -4.388953685760498, -4.2232255935668945, -4.057497024536133, -3.891768455505371, -3.7260398864746094, -3.5603113174438477, -3.394582748413086, -3.228854179382324, -3.0631258487701416, -2.89739727973938, -2.731668710708618, -2.5659403800964355, -2.400211811065674, -2.234483242034912, -2.0687546730041504, -1.9030262231826782, -1.737297773361206, -1.5715692043304443, -1.4058406352996826, -1.2401121854782104, -1.0743837356567383, -0.9086551666259766, -0.7429266571998596, -0.5771981477737427, -0.41146963834762573, -0.2457411289215088, -0.08001261949539185, 0.0857158899307251, 0.25144433975219727, 0.417172908782959, 0.5829014182090759, 0.7486299276351929, 0.9143584370613098, 1.0800869464874268, 1.2458155155181885, 1.4115439653396606, 1.5772724151611328, 1.7430009841918945, 1.9087295532226562, 2.074458122253418, 2.2401864528656006, 2.4059150218963623, 2.571643590927124, 2.7373719215393066, 2.9031004905700684, 3.06882905960083, 3.234557628631592, 3.4002861976623535, 3.566014528274536, 3.731743097305298, 3.8974716663360596, 4.063199996948242, 4.228928565979004, 4.394657135009766, 4.560385704040527, 4.726114273071289, 4.891842842102051, 5.0575714111328125, 5.223299503326416, 5.389028072357178, 5.5547566413879395, 5.720485210418701]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 6.0, 14.0, 15.0, 29.0, 56.0, 44.0, 100.0, 156.0, 231.0, 364.0, 559.0, 1013.0, 1584.0, 2643.0, 4375.0, 7435.0, 13046.0, 22944.0, 41423.0, 77867.0, 146401.0, 271616.0, 464650.0, 671563.0, 767077.0, 664969.0, 455144.0, 265978.0, 142978.0, 75869.0, 40972.0, 22605.0, 12598.0, 7133.0, 4163.0, 2536.0, 1492.0, 917.0, 583.0, 395.0, 260.0, 169.0, 90.0, 66.0, 51.0, 40.0, 19.0, 21.0, 9.0, 6.0, 6.0, 1.0, 1.0, 3.0, 2.0], "bins": [-4.41015625, -4.2784423828125, -4.146728515625, -4.0150146484375, -3.88330078125, -3.7515869140625, -3.619873046875, -3.4881591796875, -3.3564453125, -3.2247314453125, -3.093017578125, -2.9613037109375, -2.82958984375, -2.6978759765625, -2.566162109375, -2.4344482421875, -2.302734375, -2.1710205078125, -2.039306640625, -1.9075927734375, -1.77587890625, -1.6441650390625, -1.512451171875, -1.3807373046875, -1.2490234375, -1.1173095703125, -0.985595703125, -0.8538818359375, -0.72216796875, -0.5904541015625, -0.458740234375, -0.3270263671875, -0.1953125, -0.0635986328125, 0.068115234375, 0.1998291015625, 0.33154296875, 0.4632568359375, 0.594970703125, 0.7266845703125, 0.8583984375, 0.9901123046875, 1.121826171875, 1.2535400390625, 1.38525390625, 1.5169677734375, 1.648681640625, 1.7803955078125, 1.912109375, 2.0438232421875, 2.175537109375, 2.3072509765625, 2.43896484375, 2.5706787109375, 2.702392578125, 2.8341064453125, 2.9658203125, 3.0975341796875, 3.229248046875, 3.3609619140625, 3.49267578125, 3.6243896484375, 3.756103515625, 3.8878173828125, 4.01953125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 7.0, 5.0, 6.0, 4.0, 11.0, 7.0, 14.0, 13.0, 17.0, 20.0, 17.0, 20.0, 20.0, 33.0, 26.0, 36.0, 38.0, 42.0, 32.0, 39.0, 45.0, 40.0, 44.0, 42.0, 35.0, 33.0, 39.0, 27.0, 25.0, 29.0, 29.0, 27.0, 24.0, 31.0, 18.0, 19.0, 14.0, 10.0, 16.0, 9.0, 16.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.220458984375, -4.07763671875, -3.934814453125, -3.7919921875, -3.649169921875, -3.50634765625, -3.363525390625, -3.220703125, -3.077880859375, -2.93505859375, -2.792236328125, -2.6494140625, -2.506591796875, -2.36376953125, -2.220947265625, -2.078125, -1.935302734375, -1.79248046875, -1.649658203125, -1.5068359375, -1.364013671875, -1.22119140625, -1.078369140625, -0.935546875, -0.792724609375, -0.64990234375, -0.507080078125, -0.3642578125, -0.221435546875, -0.07861328125, 0.064208984375, 0.20703125, 0.349853515625, 0.49267578125, 0.635498046875, 0.7783203125, 0.921142578125, 1.06396484375, 1.206787109375, 1.349609375, 1.492431640625, 1.63525390625, 1.778076171875, 1.9208984375, 2.063720703125, 2.20654296875, 2.349365234375, 2.4921875, 2.635009765625, 2.77783203125, 2.920654296875, 3.0634765625, 3.206298828125, 3.34912109375, 3.491943359375, 3.634765625, 3.777587890625, 3.92041015625, 4.063232421875, 4.2060546875, 4.348876953125, 4.49169921875, 4.634521484375, 4.77734375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 9.0, 6.0, 6.0, 28.0, 28.0, 39.0, 53.0, 94.0, 161.0, 219.0, 341.0, 617.0, 927.0, 1485.0, 2374.0, 3965.0, 6505.0, 11066.0, 18524.0, 32292.0, 55153.0, 93860.0, 158103.0, 259578.0, 397627.0, 546680.0, 637726.0, 613161.0, 488528.0, 338536.0, 213973.0, 129186.0, 75600.0, 44538.0, 25678.0, 14908.0, 9064.0, 5235.0, 3268.0, 2041.0, 1112.0, 706.0, 489.0, 314.0, 164.0, 109.0, 82.0, 45.0, 36.0, 18.0, 16.0, 15.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3046875, -4.1693115234375, -4.033935546875, -3.8985595703125, -3.76318359375, -3.6278076171875, -3.492431640625, -3.3570556640625, -3.2216796875, -3.0863037109375, -2.950927734375, -2.8155517578125, -2.68017578125, -2.5447998046875, -2.409423828125, -2.2740478515625, -2.138671875, -2.0032958984375, -1.867919921875, -1.7325439453125, -1.59716796875, -1.4617919921875, -1.326416015625, -1.1910400390625, -1.0556640625, -0.9202880859375, -0.784912109375, -0.6495361328125, -0.51416015625, -0.3787841796875, -0.243408203125, -0.1080322265625, 0.02734375, 0.1627197265625, 0.298095703125, 0.4334716796875, 0.56884765625, 0.7042236328125, 0.839599609375, 0.9749755859375, 1.1103515625, 1.2457275390625, 1.381103515625, 1.5164794921875, 1.65185546875, 1.7872314453125, 1.922607421875, 2.0579833984375, 2.193359375, 2.3287353515625, 2.464111328125, 2.5994873046875, 2.73486328125, 2.8702392578125, 3.005615234375, 3.1409912109375, 3.2763671875, 3.4117431640625, 3.547119140625, 3.6824951171875, 3.81787109375, 3.9532470703125, 4.088623046875, 4.2239990234375, 4.359375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 4.0, 7.0, 8.0, 9.0, 14.0, 17.0, 19.0, 29.0, 29.0, 42.0, 53.0, 50.0, 51.0, 69.0, 101.0, 111.0, 107.0, 130.0, 166.0, 174.0, 167.0, 187.0, 181.0, 220.0, 210.0, 184.0, 168.0, 180.0, 174.0, 154.0, 169.0, 142.0, 99.0, 89.0, 105.0, 87.0, 72.0, 53.0, 35.0, 46.0, 34.0, 22.0, 25.0, 21.0, 17.0, 9.0, 15.0, 6.0, 7.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.775390625, -1.721405029296875, -1.66741943359375, -1.613433837890625, -1.5594482421875, -1.505462646484375, -1.45147705078125, -1.397491455078125, -1.343505859375, -1.289520263671875, -1.23553466796875, -1.181549072265625, -1.1275634765625, -1.073577880859375, -1.01959228515625, -0.965606689453125, -0.91162109375, -0.857635498046875, -0.80364990234375, -0.749664306640625, -0.6956787109375, -0.641693115234375, -0.58770751953125, -0.533721923828125, -0.479736328125, -0.425750732421875, -0.37176513671875, -0.317779541015625, -0.2637939453125, -0.209808349609375, -0.15582275390625, -0.101837158203125, -0.0478515625, 0.006134033203125, 0.06011962890625, 0.114105224609375, 0.1680908203125, 0.222076416015625, 0.27606201171875, 0.330047607421875, 0.384033203125, 0.438018798828125, 0.49200439453125, 0.545989990234375, 0.5999755859375, 0.653961181640625, 0.70794677734375, 0.761932373046875, 0.81591796875, 0.869903564453125, 0.92388916015625, 0.977874755859375, 1.0318603515625, 1.085845947265625, 1.13983154296875, 1.193817138671875, 1.247802734375, 1.301788330078125, 1.35577392578125, 1.409759521484375, 1.4637451171875, 1.517730712890625, 1.57171630859375, 1.625701904296875, 1.6796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 8.0, 15.0, 9.0, 16.0, 13.0, 24.0, 27.0, 31.0, 28.0, 41.0, 40.0, 46.0, 48.0, 47.0, 46.0, 52.0, 48.0, 62.0, 47.0, 49.0, 44.0, 42.0, 29.0, 32.0, 18.0, 23.0, 23.0, 21.0, 9.0, 8.0, 8.0, 8.0, 5.0, 3.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.787500858306885, -4.627196311950684, -4.466892242431641, -4.3065876960754395, -4.146283149719238, -3.985978603363037, -3.825674295425415, -3.665369987487793, -3.505065441131592, -3.3447608947753906, -3.1844565868377686, -3.0241522789001465, -2.8638477325439453, -2.703543186187744, -2.543238878250122, -2.3829345703125, -2.222630023956299, -2.0623254776000977, -1.9020211696624756, -1.741716742515564, -1.5814123153686523, -1.4211078882217407, -1.260803461074829, -1.1004990339279175, -0.9401946067810059, -0.7798901796340942, -0.6195857524871826, -0.459281325340271, -0.2989768981933594, -0.13867247104644775, 0.021631956100463867, 0.1819363832473755, 0.3422412872314453, 0.5025457143783569, 0.6628501415252686, 0.8231545686721802, 0.9834589958190918, 1.1437634229660034, 1.304067850112915, 1.4643722772598267, 1.6246767044067383, 1.78498113155365, 1.9452855587005615, 2.1055898666381836, 2.2658944129943848, 2.426198959350586, 2.586503267288208, 2.74680757522583, 2.9071121215820312, 3.0674166679382324, 3.2277209758758545, 3.3880252838134766, 3.5483298301696777, 3.708634376525879, 3.868938684463501, 4.029242992401123, 4.189547538757324, 4.349852085113525, 4.510156631469727, 4.6704607009887695, 4.830765247344971, 4.991069793701172, 5.151373863220215, 5.311678409576416, 5.471982955932617]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 5.0, 9.0, 10.0, 3.0, 4.0, 13.0, 16.0, 34.0, 31.0, 23.0, 35.0, 28.0, 39.0, 37.0, 52.0, 42.0, 43.0, 47.0, 51.0, 38.0, 43.0, 42.0, 35.0, 28.0, 37.0, 27.0, 32.0, 27.0, 30.0, 22.0, 23.0, 17.0, 16.0, 12.0, 13.0, 9.0, 11.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.982348918914795, -5.798638343811035, -5.614927291870117, -5.431216716766357, -5.247506141662598, -5.06379508972168, -4.88008451461792, -4.69637393951416, -4.512662887573242, -4.328952312469482, -4.1452412605285645, -3.9615306854248047, -3.777820110321045, -3.594109296798706, -3.410398483276367, -3.2266879081726074, -3.0429773330688477, -2.859266519546509, -2.675555944442749, -2.49184513092041, -2.3081345558166504, -2.1244237422943115, -1.9407129287719727, -1.7570022344589233, -1.573291540145874, -1.3895808458328247, -1.2058701515197754, -1.0221593379974365, -0.8384486436843872, -0.6547379493713379, -0.471027135848999, -0.2873164415359497, -0.10360527038574219, 0.08010545372962952, 0.2638161778450012, 0.4475269317626953, 0.6312376260757446, 0.814948320388794, 0.9986591339111328, 1.1823698282241821, 1.3660805225372314, 1.5497912168502808, 1.73350191116333, 1.917212724685669, 2.100923538208008, 2.2846341133117676, 2.4683449268341064, 2.6520557403564453, 2.835766315460205, 3.019477128982544, 3.2031877040863037, 3.3868985176086426, 3.5706090927124023, 3.754319906234741, 3.93803071975708, 4.12174129486084, 4.305452346801758, 4.489162921905518, 4.6728739738464355, 4.856584548950195, 5.040295124053955, 5.224005699157715, 5.407716751098633, 5.591427326202393, 5.775137901306152]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 15.0, 21.0, 29.0, 41.0, 62.0, 96.0, 148.0, 246.0, 448.0, 619.0, 951.0, 1487.0, 2409.0, 3992.0, 6603.0, 11166.0, 19546.0, 34337.0, 59875.0, 100610.0, 153598.0, 189697.0, 171134.0, 118753.0, 72659.0, 41716.0, 24019.0, 13913.0, 7999.0, 4674.0, 2930.0, 1738.0, 1068.0, 670.0, 473.0, 274.0, 184.0, 127.0, 79.0, 41.0, 39.0, 33.0, 17.0, 4.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80517578125, -0.777099609375, -0.7490234375, -0.720947265625, -0.69287109375, -0.664794921875, -0.63671875, -0.608642578125, -0.58056640625, -0.552490234375, -0.5244140625, -0.496337890625, -0.46826171875, -0.440185546875, -0.412109375, -0.384033203125, -0.35595703125, -0.327880859375, -0.2998046875, -0.271728515625, -0.24365234375, -0.215576171875, -0.1875, -0.159423828125, -0.13134765625, -0.103271484375, -0.0751953125, -0.047119140625, -0.01904296875, 0.009033203125, 0.037109375, 0.065185546875, 0.09326171875, 0.121337890625, 0.1494140625, 0.177490234375, 0.20556640625, 0.233642578125, 0.26171875, 0.289794921875, 0.31787109375, 0.345947265625, 0.3740234375, 0.402099609375, 0.43017578125, 0.458251953125, 0.486328125, 0.514404296875, 0.54248046875, 0.570556640625, 0.5986328125, 0.626708984375, 0.65478515625, 0.682861328125, 0.7109375, 0.739013671875, 0.76708984375, 0.795166015625, 0.8232421875, 0.851318359375, 0.87939453125, 0.907470703125, 0.935546875, 0.963623046875, 0.99169921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 11.0, 9.0, 14.0, 20.0, 23.0, 29.0, 39.0, 30.0, 37.0, 35.0, 38.0, 33.0, 46.0, 39.0, 42.0, 46.0, 38.0, 40.0, 40.0, 30.0, 33.0, 31.0, 34.0, 33.0, 35.0, 25.0, 20.0, 25.0, 18.0, 19.0, 16.0, 10.0, 5.0, 8.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-6.59375, -6.41064453125, -6.2275390625, -6.04443359375, -5.861328125, -5.67822265625, -5.4951171875, -5.31201171875, -5.12890625, -4.94580078125, -4.7626953125, -4.57958984375, -4.396484375, -4.21337890625, -4.0302734375, -3.84716796875, -3.6640625, -3.48095703125, -3.2978515625, -3.11474609375, -2.931640625, -2.74853515625, -2.5654296875, -2.38232421875, -2.19921875, -2.01611328125, -1.8330078125, -1.64990234375, -1.466796875, -1.28369140625, -1.1005859375, -0.91748046875, -0.734375, -0.55126953125, -0.3681640625, -0.18505859375, -0.001953125, 0.18115234375, 0.3642578125, 0.54736328125, 0.73046875, 0.91357421875, 1.0966796875, 1.27978515625, 1.462890625, 1.64599609375, 1.8291015625, 2.01220703125, 2.1953125, 2.37841796875, 2.5615234375, 2.74462890625, 2.927734375, 3.11083984375, 3.2939453125, 3.47705078125, 3.66015625, 3.84326171875, 4.0263671875, 4.20947265625, 4.392578125, 4.57568359375, 4.7587890625, 4.94189453125, 5.125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 17.0, 31.0, 38.0, 58.0, 113.0, 143.0, 249.0, 446.0, 741.0, 1177.0, 2059.0, 3750.0, 6572.0, 12164.0, 23677.0, 77075.0, 706183.0, 151261.0, 30079.0, 14458.0, 7897.0, 4294.0, 2524.0, 1385.0, 816.0, 537.0, 318.0, 192.0, 99.0, 61.0, 53.0, 25.0, 26.0, 8.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.85546875, -1.801910400390625, -1.74835205078125, -1.694793701171875, -1.6412353515625, -1.587677001953125, -1.53411865234375, -1.480560302734375, -1.427001953125, -1.373443603515625, -1.31988525390625, -1.266326904296875, -1.2127685546875, -1.159210205078125, -1.10565185546875, -1.052093505859375, -0.99853515625, -0.944976806640625, -0.89141845703125, -0.837860107421875, -0.7843017578125, -0.730743408203125, -0.67718505859375, -0.623626708984375, -0.570068359375, -0.516510009765625, -0.46295166015625, -0.409393310546875, -0.3558349609375, -0.302276611328125, -0.24871826171875, -0.195159912109375, -0.1416015625, -0.088043212890625, -0.03448486328125, 0.019073486328125, 0.0726318359375, 0.126190185546875, 0.17974853515625, 0.233306884765625, 0.286865234375, 0.340423583984375, 0.39398193359375, 0.447540283203125, 0.5010986328125, 0.554656982421875, 0.60821533203125, 0.661773681640625, 0.71533203125, 0.768890380859375, 0.82244873046875, 0.876007080078125, 0.9295654296875, 0.983123779296875, 1.03668212890625, 1.090240478515625, 1.143798828125, 1.197357177734375, 1.25091552734375, 1.304473876953125, 1.3580322265625, 1.411590576171875, 1.46514892578125, 1.518707275390625, 1.572265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 4.0, 3.0, 14.0, 11.0, 9.0, 13.0, 22.0, 17.0, 25.0, 23.0, 22.0, 30.0, 38.0, 32.0, 40.0, 42.0, 37.0, 41.0, 41.0, 42.0, 47.0, 47.0, 36.0, 22.0, 38.0, 38.0, 41.0, 24.0, 26.0, 24.0, 28.0, 14.0, 17.0, 12.0, 14.0, 10.0, 12.0, 9.0, 10.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.078125, -3.9554443359375, -3.832763671875, -3.7100830078125, -3.58740234375, -3.4647216796875, -3.342041015625, -3.2193603515625, -3.0966796875, -2.9739990234375, -2.851318359375, -2.7286376953125, -2.60595703125, -2.4832763671875, -2.360595703125, -2.2379150390625, -2.115234375, -1.9925537109375, -1.869873046875, -1.7471923828125, -1.62451171875, -1.5018310546875, -1.379150390625, -1.2564697265625, -1.1337890625, -1.0111083984375, -0.888427734375, -0.7657470703125, -0.64306640625, -0.5203857421875, -0.397705078125, -0.2750244140625, -0.15234375, -0.0296630859375, 0.093017578125, 0.2156982421875, 0.33837890625, 0.4610595703125, 0.583740234375, 0.7064208984375, 0.8291015625, 0.9517822265625, 1.074462890625, 1.1971435546875, 1.31982421875, 1.4425048828125, 1.565185546875, 1.6878662109375, 1.810546875, 1.9332275390625, 2.055908203125, 2.1785888671875, 2.30126953125, 2.4239501953125, 2.546630859375, 2.6693115234375, 2.7919921875, 2.9146728515625, 3.037353515625, 3.1600341796875, 3.28271484375, 3.4053955078125, 3.528076171875, 3.6507568359375, 3.7734375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 5.0, 10.0, 16.0, 21.0, 23.0, 35.0, 51.0, 73.0, 133.0, 204.0, 270.0, 398.0, 580.0, 917.0, 1555.0, 2330.0, 3970.0, 6586.0, 11236.0, 19670.0, 41903.0, 676485.0, 213563.0, 29618.0, 15753.0, 8891.0, 5399.0, 3261.0, 1991.0, 1178.0, 832.0, 484.0, 344.0, 224.0, 168.0, 117.0, 83.0, 54.0, 41.0, 24.0, 16.0, 17.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1898193359375, -0.18345260620117188, -0.17708587646484375, -0.17071914672851562, -0.1643524169921875, -0.15798568725585938, -0.15161895751953125, -0.14525222778320312, -0.138885498046875, -0.13251876831054688, -0.12615203857421875, -0.11978530883789062, -0.1134185791015625, -0.10705184936523438, -0.10068511962890625, -0.09431838989257812, -0.08795166015625, -0.08158493041992188, -0.07521820068359375, -0.06885147094726562, -0.0624847412109375, -0.056118011474609375, -0.04975128173828125, -0.043384552001953125, -0.037017822265625, -0.030651092529296875, -0.02428436279296875, -0.017917633056640625, -0.0115509033203125, -0.005184173583984375, 0.00118255615234375, 0.007549285888671875, 0.013916015625, 0.020282745361328125, 0.02664947509765625, 0.033016204833984375, 0.0393829345703125, 0.045749664306640625, 0.05211639404296875, 0.058483123779296875, 0.064849853515625, 0.07121658325195312, 0.07758331298828125, 0.08395004272460938, 0.0903167724609375, 0.09668350219726562, 0.10305023193359375, 0.10941696166992188, 0.11578369140625, 0.12215042114257812, 0.12851715087890625, 0.13488388061523438, 0.1412506103515625, 0.14761734008789062, 0.15398406982421875, 0.16035079956054688, 0.166717529296875, 0.17308425903320312, 0.17945098876953125, 0.18581771850585938, 0.1921844482421875, 0.19855117797851562, 0.20491790771484375, 0.21128463745117188, 0.2176513671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 4.0, 6.0, 15.0, 12.0, 11.0, 20.0, 18.0, 22.0, 24.0, 34.0, 51.0, 40.0, 35.0, 46.0, 48.0, 51.0, 50.0, 39.0, 59.0, 47.0, 48.0, 50.0, 36.0, 37.0, 26.0, 28.0, 29.0, 20.0, 19.0, 10.0, 8.0, 6.0, 7.0, 11.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.298324584960938e-06, -8.99285078048706e-06, -8.687376976013184e-06, -8.381903171539307e-06, -8.07642936706543e-06, -7.770955562591553e-06, -7.465481758117676e-06, -7.160007953643799e-06, -6.854534149169922e-06, -6.549060344696045e-06, -6.243586540222168e-06, -5.938112735748291e-06, -5.632638931274414e-06, -5.327165126800537e-06, -5.02169132232666e-06, -4.716217517852783e-06, -4.410743713378906e-06, -4.105269908905029e-06, -3.7997961044311523e-06, -3.4943222999572754e-06, -3.1888484954833984e-06, -2.8833746910095215e-06, -2.5779008865356445e-06, -2.2724270820617676e-06, -1.9669532775878906e-06, -1.6614794731140137e-06, -1.3560056686401367e-06, -1.0505318641662598e-06, -7.450580596923828e-07, -4.3958425521850586e-07, -1.341104507446289e-07, 1.7136335372924805e-07, 4.76837158203125e-07, 7.82310962677002e-07, 1.087784767150879e-06, 1.3932585716247559e-06, 1.6987323760986328e-06, 2.0042061805725098e-06, 2.3096799850463867e-06, 2.6151537895202637e-06, 2.9206275939941406e-06, 3.2261013984680176e-06, 3.5315752029418945e-06, 3.8370490074157715e-06, 4.1425228118896484e-06, 4.447996616363525e-06, 4.753470420837402e-06, 5.058944225311279e-06, 5.364418029785156e-06, 5.669891834259033e-06, 5.97536563873291e-06, 6.280839443206787e-06, 6.586313247680664e-06, 6.891787052154541e-06, 7.197260856628418e-06, 7.502734661102295e-06, 7.808208465576172e-06, 8.113682270050049e-06, 8.419156074523926e-06, 8.724629878997803e-06, 9.03010368347168e-06, 9.335577487945557e-06, 9.641051292419434e-06, 9.94652509689331e-06, 1.0251998901367188e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 10.0, 9.0, 16.0, 22.0, 35.0, 52.0, 90.0, 114.0, 132.0, 229.0, 324.0, 446.0, 617.0, 898.0, 1289.0, 1804.0, 2598.0, 3649.0, 5330.0, 7812.0, 11569.0, 17610.0, 25970.0, 39432.0, 58444.0, 84308.0, 116010.0, 139483.0, 141002.0, 118133.0, 86907.0, 60467.0, 40735.0, 26902.0, 17800.0, 12076.0, 8146.0, 5497.0, 3741.0, 2562.0, 1900.0, 1292.0, 929.0, 657.0, 443.0, 304.0, 257.0, 153.0, 107.0, 69.0, 51.0, 40.0, 37.0, 26.0, 7.0, 8.0, 5.0, 7.0], "bins": [-0.146728515625, -0.14241790771484375, -0.1381072998046875, -0.13379669189453125, -0.129486083984375, -0.12517547607421875, -0.1208648681640625, -0.11655426025390625, -0.11224365234375, -0.10793304443359375, -0.1036224365234375, -0.09931182861328125, -0.095001220703125, -0.09069061279296875, -0.0863800048828125, -0.08206939697265625, -0.0777587890625, -0.07344818115234375, -0.0691375732421875, -0.06482696533203125, -0.060516357421875, -0.05620574951171875, -0.0518951416015625, -0.04758453369140625, -0.04327392578125, -0.03896331787109375, -0.0346527099609375, -0.03034210205078125, -0.026031494140625, -0.02172088623046875, -0.0174102783203125, -0.01309967041015625, -0.0087890625, -0.00447845458984375, -0.0001678466796875, 0.00414276123046875, 0.008453369140625, 0.01276397705078125, 0.0170745849609375, 0.02138519287109375, 0.02569580078125, 0.03000640869140625, 0.0343170166015625, 0.03862762451171875, 0.042938232421875, 0.04724884033203125, 0.0515594482421875, 0.05587005615234375, 0.0601806640625, 0.06449127197265625, 0.0688018798828125, 0.07311248779296875, 0.077423095703125, 0.08173370361328125, 0.0860443115234375, 0.09035491943359375, 0.09466552734375, 0.09897613525390625, 0.1032867431640625, 0.10759735107421875, 0.111907958984375, 0.11621856689453125, 0.1205291748046875, 0.12483978271484375, 0.129150390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 10.0, 6.0, 12.0, 17.0, 27.0, 18.0, 30.0, 28.0, 41.0, 36.0, 49.0, 45.0, 46.0, 44.0, 49.0, 57.0, 47.0, 48.0, 51.0, 53.0, 34.0, 41.0, 34.0, 33.0, 21.0, 20.0, 17.0, 17.0, 9.0, 11.0, 14.0, 6.0, 5.0, 0.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06768798828125, -0.06573677062988281, -0.06378555297851562, -0.06183433532714844, -0.05988311767578125, -0.05793190002441406, -0.055980682373046875, -0.05402946472167969, -0.0520782470703125, -0.05012702941894531, -0.048175811767578125, -0.04622459411621094, -0.04427337646484375, -0.04232215881347656, -0.040370941162109375, -0.03841972351074219, -0.036468505859375, -0.03451728820800781, -0.032566070556640625, -0.030614852905273438, -0.02866363525390625, -0.026712417602539062, -0.024761199951171875, -0.022809982299804688, -0.0208587646484375, -0.018907546997070312, -0.016956329345703125, -0.015005111694335938, -0.01305389404296875, -0.011102676391601562, -0.009151458740234375, -0.0072002410888671875, -0.0052490234375, -0.0032978057861328125, -0.001346588134765625, 0.0006046295166015625, 0.00255584716796875, 0.0045070648193359375, 0.006458282470703125, 0.008409500122070312, 0.0103607177734375, 0.012311935424804688, 0.014263153076171875, 0.016214370727539062, 0.01816558837890625, 0.020116806030273438, 0.022068023681640625, 0.024019241333007812, 0.025970458984375, 0.027921676635742188, 0.029872894287109375, 0.03182411193847656, 0.03377532958984375, 0.03572654724121094, 0.037677764892578125, 0.03962898254394531, 0.0415802001953125, 0.04353141784667969, 0.045482635498046875, 0.04743385314941406, 0.04938507080078125, 0.05133628845214844, 0.053287506103515625, 0.05523872375488281, 0.05718994140625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 3.0, 11.0, 11.0, 14.0, 16.0, 14.0, 22.0, 25.0, 36.0, 32.0, 37.0, 38.0, 41.0, 54.0, 50.0, 47.0, 46.0, 50.0, 53.0, 64.0, 34.0, 46.0, 38.0, 33.0, 28.0, 20.0, 22.0, 20.0, 20.0, 12.0, 7.0, 10.0, 7.0, 6.0, 3.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.613295555114746, -4.457451820373535, -4.301608085632324, -4.145764350891113, -3.9899206161499023, -3.8340768814086914, -3.6782329082489014, -3.5223891735076904, -3.3665454387664795, -3.2107017040252686, -3.0548579692840576, -2.8990142345428467, -2.7431702613830566, -2.5873265266418457, -2.4314827919006348, -2.275639057159424, -2.119795322418213, -1.963951587677002, -1.808107852935791, -1.6522639989852905, -1.4964202642440796, -1.3405765295028687, -1.1847326755523682, -1.0288889408111572, -0.8730452060699463, -0.7172014713287354, -0.5613576769828796, -0.4055139124393463, -0.249670147895813, -0.09382641315460205, 0.06201738119125366, 0.21786117553710938, 0.3737044334411621, 0.529548168182373, 0.6853919625282288, 0.8412357568740845, 0.9970794916152954, 1.1529232263565063, 1.3087670803070068, 1.4646108150482178, 1.6204545497894287, 1.7762982845306396, 1.9321420192718506, 2.0879857540130615, 2.2438297271728516, 2.3996734619140625, 2.5555171966552734, 2.7113609313964844, 2.8672046661376953, 3.0230484008789062, 3.178892135620117, 3.334735870361328, 3.490579605102539, 3.64642333984375, 3.80226731300354, 3.958111047744751, 4.113954544067383, 4.269798278808594, 4.425642013549805, 4.581485748291016, 4.737329483032227, 4.8931732177734375, 5.049016952514648, 5.204860687255859, 5.3607048988342285]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 7.0, 5.0, 10.0, 7.0, 3.0, 5.0, 11.0, 23.0, 31.0, 32.0, 27.0, 30.0, 25.0, 46.0, 38.0, 47.0, 48.0, 45.0, 47.0, 46.0, 38.0, 46.0, 40.0, 31.0, 31.0, 37.0, 28.0, 29.0, 28.0, 34.0, 20.0, 22.0, 14.0, 16.0, 11.0, 12.0, 12.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.998411655426025, -5.814550876617432, -5.630690097808838, -5.446829319000244, -5.26296854019165, -5.079107761383057, -4.895246982574463, -4.711386203765869, -4.527525424957275, -4.343664646148682, -4.159803867340088, -3.975943088531494, -3.7920823097229004, -3.6082215309143066, -3.424360752105713, -3.240499973297119, -3.0566389560699463, -2.8727781772613525, -2.688917398452759, -2.505056619644165, -2.3211958408355713, -2.1373350620269775, -1.9534741640090942, -1.7696133852005005, -1.5857526063919067, -1.401891827583313, -1.2180310487747192, -1.034170150756836, -0.850309431552887, -0.6664486527442932, -0.4825878143310547, -0.29872703552246094, -0.11486625671386719, 0.06899453699588776, 0.2528553307056427, 0.43671613931655884, 0.6205769181251526, 0.8044376969337463, 0.9882985353469849, 1.1721593141555786, 1.3560200929641724, 1.5398808717727661, 1.7237416505813599, 1.9076025485992432, 2.091463327407837, 2.2753241062164307, 2.4591848850250244, 2.643045663833618, 2.826906442642212, 3.0107672214508057, 3.1946280002593994, 3.378488779067993, 3.562349557876587, 3.7462103366851807, 3.9300713539123535, 4.113932132720947, 4.297792911529541, 4.481653690338135, 4.6655144691467285, 4.849375247955322, 5.033236026763916, 5.21709680557251, 5.4009575843811035, 5.584818363189697, 5.768679141998291]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 12.0, 14.0, 36.0, 45.0, 66.0, 117.0, 189.0, 321.0, 516.0, 811.0, 1317.0, 2128.0, 3390.0, 5477.0, 8649.0, 13850.0, 21512.0, 32186.0, 46758.0, 64613.0, 85173.0, 103567.0, 114880.0, 116384.0, 108058.0, 91187.0, 70984.0, 52156.0, 36318.0, 24676.0, 15948.0, 10293.0, 6364.0, 4167.0, 2400.0, 1474.0, 983.0, 571.0, 360.0, 236.0, 139.0, 94.0, 43.0, 32.0, 26.0, 11.0, 12.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.832550048828125, -2.73541259765625, -2.638275146484375, -2.5411376953125, -2.444000244140625, -2.34686279296875, -2.249725341796875, -2.152587890625, -2.055450439453125, -1.95831298828125, -1.861175537109375, -1.7640380859375, -1.666900634765625, -1.56976318359375, -1.472625732421875, -1.37548828125, -1.278350830078125, -1.18121337890625, -1.084075927734375, -0.9869384765625, -0.889801025390625, -0.79266357421875, -0.695526123046875, -0.598388671875, -0.501251220703125, -0.40411376953125, -0.306976318359375, -0.2098388671875, -0.112701416015625, -0.01556396484375, 0.081573486328125, 0.1787109375, 0.275848388671875, 0.37298583984375, 0.470123291015625, 0.5672607421875, 0.664398193359375, 0.76153564453125, 0.858673095703125, 0.955810546875, 1.052947998046875, 1.15008544921875, 1.247222900390625, 1.3443603515625, 1.441497802734375, 1.53863525390625, 1.635772705078125, 1.73291015625, 1.830047607421875, 1.92718505859375, 2.024322509765625, 2.1214599609375, 2.218597412109375, 2.31573486328125, 2.412872314453125, 2.510009765625, 2.607147216796875, 2.70428466796875, 2.801422119140625, 2.8985595703125, 2.995697021484375, 3.09283447265625, 3.189971923828125, 3.287109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 6.0, 1.0, 5.0, 1.0, 8.0, 8.0, 10.0, 13.0, 13.0, 28.0, 23.0, 27.0, 39.0, 35.0, 39.0, 37.0, 61.0, 51.0, 57.0, 43.0, 46.0, 34.0, 43.0, 35.0, 40.0, 37.0, 30.0, 24.0, 35.0, 39.0, 26.0, 21.0, 13.0, 19.0, 9.0, 14.0, 7.0, 6.0, 7.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.29296875, -6.09942626953125, -5.9058837890625, -5.71234130859375, -5.518798828125, -5.32525634765625, -5.1317138671875, -4.93817138671875, -4.74462890625, -4.55108642578125, -4.3575439453125, -4.16400146484375, -3.970458984375, -3.77691650390625, -3.5833740234375, -3.38983154296875, -3.1962890625, -3.00274658203125, -2.8092041015625, -2.61566162109375, -2.422119140625, -2.22857666015625, -2.0350341796875, -1.84149169921875, -1.64794921875, -1.45440673828125, -1.2608642578125, -1.06732177734375, -0.873779296875, -0.68023681640625, -0.4866943359375, -0.29315185546875, -0.099609375, 0.09393310546875, 0.2874755859375, 0.48101806640625, 0.674560546875, 0.86810302734375, 1.0616455078125, 1.25518798828125, 1.44873046875, 1.64227294921875, 1.8358154296875, 2.02935791015625, 2.222900390625, 2.41644287109375, 2.6099853515625, 2.80352783203125, 2.9970703125, 3.19061279296875, 3.3841552734375, 3.57769775390625, 3.771240234375, 3.96478271484375, 4.1583251953125, 4.35186767578125, 4.54541015625, 4.73895263671875, 4.9324951171875, 5.12603759765625, 5.319580078125, 5.51312255859375, 5.7066650390625, 5.90020751953125, 6.09375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 6.0, 6.0, 3.0, 14.0, 14.0, 31.0, 45.0, 88.0, 114.0, 189.0, 266.0, 419.0, 690.0, 1100.0, 1577.0, 2634.0, 4267.0, 6595.0, 10029.0, 15383.0, 23439.0, 34453.0, 48786.0, 66471.0, 85399.0, 103262.0, 113359.0, 114161.0, 104300.0, 87635.0, 68400.0, 50503.0, 35459.0, 24459.0, 15702.0, 10694.0, 6772.0, 4305.0, 2744.0, 1739.0, 1147.0, 714.0, 434.0, 265.0, 177.0, 133.0, 64.0, 34.0, 27.0, 20.0, 13.0, 5.0, 4.0, 4.0, 2.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.078125, -2.975677490234375, -2.87322998046875, -2.770782470703125, -2.6683349609375, -2.565887451171875, -2.46343994140625, -2.360992431640625, -2.258544921875, -2.156097412109375, -2.05364990234375, -1.951202392578125, -1.8487548828125, -1.746307373046875, -1.64385986328125, -1.541412353515625, -1.43896484375, -1.336517333984375, -1.23406982421875, -1.131622314453125, -1.0291748046875, -0.926727294921875, -0.82427978515625, -0.721832275390625, -0.619384765625, -0.516937255859375, -0.41448974609375, -0.312042236328125, -0.2095947265625, -0.107147216796875, -0.00469970703125, 0.097747802734375, 0.2001953125, 0.302642822265625, 0.40509033203125, 0.507537841796875, 0.6099853515625, 0.712432861328125, 0.81488037109375, 0.917327880859375, 1.019775390625, 1.122222900390625, 1.22467041015625, 1.327117919921875, 1.4295654296875, 1.532012939453125, 1.63446044921875, 1.736907958984375, 1.83935546875, 1.941802978515625, 2.04425048828125, 2.146697998046875, 2.2491455078125, 2.351593017578125, 2.45404052734375, 2.556488037109375, 2.658935546875, 2.761383056640625, 2.86383056640625, 2.966278076171875, 3.0687255859375, 3.171173095703125, 3.27362060546875, 3.376068115234375, 3.478515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 10.0, 13.0, 21.0, 18.0, 19.0, 20.0, 24.0, 43.0, 39.0, 34.0, 47.0, 56.0, 50.0, 42.0, 50.0, 53.0, 60.0, 41.0, 52.0, 45.0, 40.0, 34.0, 44.0, 20.0, 25.0, 10.0, 20.0, 11.0, 7.0, 12.0, 3.0, 9.0, 4.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.96441650390625, -3.8233642578125, -3.68231201171875, -3.541259765625, -3.40020751953125, -3.2591552734375, -3.11810302734375, -2.97705078125, -2.83599853515625, -2.6949462890625, -2.55389404296875, -2.412841796875, -2.27178955078125, -2.1307373046875, -1.98968505859375, -1.8486328125, -1.70758056640625, -1.5665283203125, -1.42547607421875, -1.284423828125, -1.14337158203125, -1.0023193359375, -0.86126708984375, -0.72021484375, -0.57916259765625, -0.4381103515625, -0.29705810546875, -0.156005859375, -0.01495361328125, 0.1260986328125, 0.26715087890625, 0.408203125, 0.54925537109375, 0.6903076171875, 0.83135986328125, 0.972412109375, 1.11346435546875, 1.2545166015625, 1.39556884765625, 1.53662109375, 1.67767333984375, 1.8187255859375, 1.95977783203125, 2.100830078125, 2.24188232421875, 2.3829345703125, 2.52398681640625, 2.6650390625, 2.80609130859375, 2.9471435546875, 3.08819580078125, 3.229248046875, 3.37030029296875, 3.5113525390625, 3.65240478515625, 3.79345703125, 3.93450927734375, 4.0755615234375, 4.21661376953125, 4.357666015625, 4.49871826171875, 4.6397705078125, 4.78082275390625, 4.921875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 15.0, 14.0, 29.0, 49.0, 62.0, 99.0, 136.0, 263.0, 400.0, 625.0, 1041.0, 1565.0, 2462.0, 3863.0, 6217.0, 9499.0, 14888.0, 22526.0, 33206.0, 47191.0, 64511.0, 84030.0, 100417.0, 111050.0, 113072.0, 105347.0, 90400.0, 70974.0, 52938.0, 37610.0, 25823.0, 17331.0, 11090.0, 7307.0, 4623.0, 2860.0, 1847.0, 1136.0, 715.0, 476.0, 290.0, 209.0, 104.0, 100.0, 50.0, 30.0, 20.0, 20.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0888671875, -1.0539398193359375, -1.019012451171875, -0.9840850830078125, -0.94915771484375, -0.9142303466796875, -0.879302978515625, -0.8443756103515625, -0.8094482421875, -0.7745208740234375, -0.739593505859375, -0.7046661376953125, -0.66973876953125, -0.6348114013671875, -0.599884033203125, -0.5649566650390625, -0.530029296875, -0.4951019287109375, -0.460174560546875, -0.4252471923828125, -0.39031982421875, -0.3553924560546875, -0.320465087890625, -0.2855377197265625, -0.2506103515625, -0.2156829833984375, -0.180755615234375, -0.1458282470703125, -0.11090087890625, -0.0759735107421875, -0.041046142578125, -0.0061187744140625, 0.02880859375, 0.0637359619140625, 0.098663330078125, 0.1335906982421875, 0.16851806640625, 0.2034454345703125, 0.238372802734375, 0.2733001708984375, 0.3082275390625, 0.3431549072265625, 0.378082275390625, 0.4130096435546875, 0.44793701171875, 0.4828643798828125, 0.517791748046875, 0.5527191162109375, 0.587646484375, 0.6225738525390625, 0.657501220703125, 0.6924285888671875, 0.72735595703125, 0.7622833251953125, 0.797210693359375, 0.8321380615234375, 0.8670654296875, 0.9019927978515625, 0.936920166015625, 0.9718475341796875, 1.00677490234375, 1.0417022705078125, 1.076629638671875, 1.1115570068359375, 1.146484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 3.0, 6.0, 5.0, 9.0, 12.0, 13.0, 22.0, 15.0, 24.0, 35.0, 21.0, 37.0, 38.0, 45.0, 55.0, 59.0, 52.0, 77.0, 59.0, 58.0, 53.0, 55.0, 46.0, 30.0, 27.0, 32.0, 28.0, 28.0, 19.0, 13.0, 9.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014841556549072266, -0.0001430865377187729, -0.00013775750994682312, -0.00013242848217487335, -0.00012709945440292358, -0.00012177042663097382, -0.00011644139885902405, -0.00011111237108707428, -0.00010578334331512451, -0.00010045431554317474, -9.512528777122498e-05, -8.979625999927521e-05, -8.446723222732544e-05, -7.913820445537567e-05, -7.38091766834259e-05, -6.848014891147614e-05, -6.315112113952637e-05, -5.78220933675766e-05, -5.249306559562683e-05, -4.716403782367706e-05, -4.1835010051727295e-05, -3.650598227977753e-05, -3.117695450782776e-05, -2.584792673587799e-05, -2.0518898963928223e-05, -1.5189871191978455e-05, -9.860843420028687e-06, -4.5318156480789185e-06, 7.972121238708496e-07, 6.126239895820618e-06, 1.1455267667770386e-05, 1.6784295439720154e-05, 2.2113323211669922e-05, 2.744235098361969e-05, 3.277137875556946e-05, 3.8100406527519226e-05, 4.3429434299468994e-05, 4.875846207141876e-05, 5.408748984336853e-05, 5.94165176153183e-05, 6.474554538726807e-05, 7.007457315921783e-05, 7.54036009311676e-05, 8.073262870311737e-05, 8.606165647506714e-05, 9.13906842470169e-05, 9.671971201896667e-05, 0.00010204873979091644, 0.00010737776756286621, 0.00011270679533481598, 0.00011803582310676575, 0.00012336485087871552, 0.00012869387865066528, 0.00013402290642261505, 0.00013935193419456482, 0.0001446809619665146, 0.00015000998973846436, 0.00015533901751041412, 0.0001606680452823639, 0.00016599707305431366, 0.00017132610082626343, 0.0001766551285982132, 0.00018198415637016296, 0.00018731318414211273, 0.0001926422119140625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 5.0, 2.0, 11.0, 9.0, 19.0, 26.0, 47.0, 53.0, 83.0, 141.0, 191.0, 324.0, 481.0, 727.0, 1253.0, 1904.0, 2837.0, 4490.0, 6844.0, 9932.0, 15183.0, 22071.0, 31514.0, 43382.0, 57376.0, 73517.0, 87850.0, 99073.0, 104291.0, 100916.0, 91160.0, 77165.0, 61382.0, 46780.0, 34099.0, 24184.0, 16589.0, 11200.0, 7421.0, 4884.0, 3106.0, 2121.0, 1359.0, 899.0, 584.0, 408.0, 235.0, 170.0, 102.0, 61.0, 43.0, 24.0, 14.0, 10.0, 8.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0166015625, -0.9822845458984375, -0.947967529296875, -0.9136505126953125, -0.87933349609375, -0.8450164794921875, -0.810699462890625, -0.7763824462890625, -0.7420654296875, -0.7077484130859375, -0.673431396484375, -0.6391143798828125, -0.60479736328125, -0.5704803466796875, -0.536163330078125, -0.5018463134765625, -0.467529296875, -0.4332122802734375, -0.398895263671875, -0.3645782470703125, -0.33026123046875, -0.2959442138671875, -0.261627197265625, -0.2273101806640625, -0.1929931640625, -0.1586761474609375, -0.124359130859375, -0.0900421142578125, -0.05572509765625, -0.0214080810546875, 0.012908935546875, 0.0472259521484375, 0.08154296875, 0.1158599853515625, 0.150177001953125, 0.1844940185546875, 0.21881103515625, 0.2531280517578125, 0.287445068359375, 0.3217620849609375, 0.3560791015625, 0.3903961181640625, 0.424713134765625, 0.4590301513671875, 0.49334716796875, 0.5276641845703125, 0.561981201171875, 0.5962982177734375, 0.630615234375, 0.6649322509765625, 0.699249267578125, 0.7335662841796875, 0.76788330078125, 0.8022003173828125, 0.836517333984375, 0.8708343505859375, 0.9051513671875, 0.9394683837890625, 0.973785400390625, 1.0081024169921875, 1.04241943359375, 1.0767364501953125, 1.111053466796875, 1.1453704833984375, 1.1796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 7.0, 14.0, 10.0, 13.0, 15.0, 22.0, 27.0, 33.0, 26.0, 32.0, 40.0, 45.0, 45.0, 47.0, 59.0, 66.0, 54.0, 52.0, 47.0, 49.0, 36.0, 46.0, 37.0, 32.0, 30.0, 24.0, 19.0, 11.0, 9.0, 5.0, 5.0, 8.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7109375, -0.6904678344726562, -0.6699981689453125, -0.6495285034179688, -0.629058837890625, -0.6085891723632812, -0.5881195068359375, -0.5676498413085938, -0.54718017578125, -0.5267105102539062, -0.5062408447265625, -0.48577117919921875, -0.465301513671875, -0.44483184814453125, -0.4243621826171875, -0.40389251708984375, -0.3834228515625, -0.36295318603515625, -0.3424835205078125, -0.32201385498046875, -0.301544189453125, -0.28107452392578125, -0.2606048583984375, -0.24013519287109375, -0.21966552734375, -0.19919586181640625, -0.1787261962890625, -0.15825653076171875, -0.137786865234375, -0.11731719970703125, -0.0968475341796875, -0.07637786865234375, -0.055908203125, -0.03543853759765625, -0.0149688720703125, 0.00550079345703125, 0.025970458984375, 0.04644012451171875, 0.0669097900390625, 0.08737945556640625, 0.10784912109375, 0.12831878662109375, 0.1487884521484375, 0.16925811767578125, 0.189727783203125, 0.21019744873046875, 0.2306671142578125, 0.25113677978515625, 0.2716064453125, 0.29207611083984375, 0.3125457763671875, 0.33301544189453125, 0.353485107421875, 0.37395477294921875, 0.3944244384765625, 0.41489410400390625, 0.43536376953125, 0.45583343505859375, 0.4763031005859375, 0.49677276611328125, 0.517242431640625, 0.5377120971679688, 0.5581817626953125, 0.5786514282226562, 0.59912109375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 10.0, 12.0, 7.0, 17.0, 13.0, 18.0, 10.0, 26.0, 25.0, 36.0, 36.0, 41.0, 35.0, 49.0, 44.0, 44.0, 48.0, 49.0, 56.0, 49.0, 46.0, 51.0, 41.0, 34.0, 29.0, 30.0, 22.0, 26.0, 18.0, 13.0, 14.0, 9.0, 14.0, 4.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.663265228271484, -4.5053791999816895, -4.347492694854736, -4.189606666564941, -4.031720161437988, -3.8738341331481934, -3.7159481048583984, -3.5580618381500244, -3.4001755714416504, -3.2422893047332764, -3.0844030380249023, -2.9265170097351074, -2.7686307430267334, -2.6107444763183594, -2.4528584480285645, -2.2949721813201904, -2.1370859146118164, -1.9791996479034424, -1.821313500404358, -1.6634273529052734, -1.5055410861968994, -1.3476548194885254, -1.189768671989441, -1.0318825244903564, -0.8739962577819824, -0.7161100506782532, -0.5582238435745239, -0.4003376364707947, -0.24245142936706543, -0.08456522226333618, 0.07332098484039307, 0.23120713233947754, 0.38909339904785156, 0.5469796061515808, 0.7048658132553101, 0.8627520203590393, 1.0206382274627686, 1.1785244941711426, 1.336410641670227, 1.4942967891693115, 1.6521830558776855, 1.8100693225860596, 1.967955470085144, 2.1258416175842285, 2.2837278842926025, 2.4416141510009766, 2.5995001792907715, 2.7573864459991455, 2.9152727127075195, 3.0731589794158936, 3.2310452461242676, 3.3889312744140625, 3.5468175411224365, 3.7047038078308105, 3.8625898361206055, 4.020476341247559, 4.1783623695373535, 4.336248397827148, 4.494134902954102, 4.6520209312438965, 4.809906959533691, 4.9677934646606445, 5.1256794929504395, 5.283565521240234, 5.4414520263671875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 7.0, 7.0, 4.0, 7.0, 12.0, 21.0, 21.0, 19.0, 35.0, 30.0, 35.0, 35.0, 34.0, 43.0, 51.0, 46.0, 46.0, 57.0, 42.0, 54.0, 37.0, 38.0, 38.0, 38.0, 26.0, 19.0, 30.0, 23.0, 21.0, 24.0, 19.0, 18.0, 12.0, 6.0, 15.0, 7.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.522763729095459, -7.3078436851501465, -7.092923641204834, -6.8780035972595215, -6.663083076477051, -6.448163032531738, -6.233242988586426, -6.018322944641113, -5.803402900695801, -5.588482856750488, -5.373562812805176, -5.158642768859863, -4.943722724914551, -4.728802680969238, -4.513882160186768, -4.298962116241455, -4.084042072296143, -3.86912202835083, -3.6542019844055176, -3.439281702041626, -3.2243616580963135, -3.009441614151001, -2.7945213317871094, -2.579601287841797, -2.3646812438964844, -2.149761199951172, -1.9348410367965698, -1.7199208736419678, -1.5050008296966553, -1.2900807857513428, -1.0751606225967407, -0.8602404594421387, -0.6453204154968262, -0.4304003119468689, -0.21548020839691162, -0.0005601048469543457, 0.21435999870300293, 0.42928004264831543, 0.6442002058029175, 0.8591203689575195, 1.074040412902832, 1.2889604568481445, 1.5038806200027466, 1.7188007831573486, 1.9337208271026611, 2.1486408710479736, 2.3635611534118652, 2.5784811973571777, 2.7934012413024902, 3.0083212852478027, 3.2232413291931152, 3.438161611557007, 3.6530816555023193, 3.868001699447632, 4.082921981811523, 4.297842025756836, 4.512762069702148, 4.727682113647461, 4.942602157592773, 5.157522201538086, 5.372442245483398, 5.587362289428711, 5.802282810211182, 6.017202854156494, 6.232122898101807]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 4.0, 11.0, 16.0, 15.0, 22.0, 30.0, 52.0, 84.0, 127.0, 175.0, 267.0, 423.0, 629.0, 960.0, 1563.0, 2572.0, 4202.0, 6892.0, 11993.0, 20759.0, 37336.0, 67667.0, 125172.0, 230329.0, 398189.0, 603574.0, 742895.0, 701437.0, 517770.0, 319039.0, 178729.0, 97720.0, 53246.0, 29498.0, 16679.0, 9715.0, 5567.0, 3378.0, 1997.0, 1305.0, 750.0, 516.0, 332.0, 208.0, 129.0, 96.0, 75.0, 47.0, 32.0, 26.0, 17.0, 13.0, 8.0, 7.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1484375, -3.9991455078125, -3.849853515625, -3.7005615234375, -3.55126953125, -3.4019775390625, -3.252685546875, -3.1033935546875, -2.9541015625, -2.8048095703125, -2.655517578125, -2.5062255859375, -2.35693359375, -2.2076416015625, -2.058349609375, -1.9090576171875, -1.759765625, -1.6104736328125, -1.461181640625, -1.3118896484375, -1.16259765625, -1.0133056640625, -0.864013671875, -0.7147216796875, -0.5654296875, -0.4161376953125, -0.266845703125, -0.1175537109375, 0.03173828125, 0.1810302734375, 0.330322265625, 0.4796142578125, 0.62890625, 0.7781982421875, 0.927490234375, 1.0767822265625, 1.22607421875, 1.3753662109375, 1.524658203125, 1.6739501953125, 1.8232421875, 1.9725341796875, 2.121826171875, 2.2711181640625, 2.42041015625, 2.5697021484375, 2.718994140625, 2.8682861328125, 3.017578125, 3.1668701171875, 3.316162109375, 3.4654541015625, 3.61474609375, 3.7640380859375, 3.913330078125, 4.0626220703125, 4.2119140625, 4.3612060546875, 4.510498046875, 4.6597900390625, 4.80908203125, 4.9583740234375, 5.107666015625, 5.2569580078125, 5.40625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 15.0, 11.0, 19.0, 21.0, 20.0, 30.0, 36.0, 41.0, 47.0, 39.0, 35.0, 51.0, 47.0, 52.0, 57.0, 48.0, 40.0, 55.0, 35.0, 34.0, 35.0, 23.0, 21.0, 36.0, 21.0, 23.0, 17.0, 13.0, 13.0, 10.0, 4.0, 14.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.171875, -6.9678955078125, -6.763916015625, -6.5599365234375, -6.35595703125, -6.1519775390625, -5.947998046875, -5.7440185546875, -5.5400390625, -5.3360595703125, -5.132080078125, -4.9281005859375, -4.72412109375, -4.5201416015625, -4.316162109375, -4.1121826171875, -3.908203125, -3.7042236328125, -3.500244140625, -3.2962646484375, -3.09228515625, -2.8883056640625, -2.684326171875, -2.4803466796875, -2.2763671875, -2.0723876953125, -1.868408203125, -1.6644287109375, -1.46044921875, -1.2564697265625, -1.052490234375, -0.8485107421875, -0.64453125, -0.4405517578125, -0.236572265625, -0.0325927734375, 0.17138671875, 0.3753662109375, 0.579345703125, 0.7833251953125, 0.9873046875, 1.1912841796875, 1.395263671875, 1.5992431640625, 1.80322265625, 2.0072021484375, 2.211181640625, 2.4151611328125, 2.619140625, 2.8231201171875, 3.027099609375, 3.2310791015625, 3.43505859375, 3.6390380859375, 3.843017578125, 4.0469970703125, 4.2509765625, 4.4549560546875, 4.658935546875, 4.8629150390625, 5.06689453125, 5.2708740234375, 5.474853515625, 5.6788330078125, 5.8828125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 7.0, 2.0, 4.0, 5.0, 15.0, 13.0, 10.0, 47.0, 49.0, 77.0, 126.0, 250.0, 284.0, 453.0, 698.0, 1077.0, 1831.0, 3015.0, 4887.0, 8072.0, 13724.0, 23186.0, 39076.0, 67237.0, 115111.0, 191306.0, 308110.0, 451469.0, 585244.0, 636566.0, 571270.0, 434049.0, 292843.0, 181521.0, 107800.0, 63286.0, 37123.0, 21566.0, 12750.0, 7742.0, 4747.0, 2897.0, 1776.0, 1097.0, 679.0, 453.0, 256.0, 177.0, 122.0, 74.0, 45.0, 22.0, 18.0, 18.0, 9.0, 5.0], "bins": [-5.8046875, -5.649658203125, -5.49462890625, -5.339599609375, -5.1845703125, -5.029541015625, -4.87451171875, -4.719482421875, -4.564453125, -4.409423828125, -4.25439453125, -4.099365234375, -3.9443359375, -3.789306640625, -3.63427734375, -3.479248046875, -3.32421875, -3.169189453125, -3.01416015625, -2.859130859375, -2.7041015625, -2.549072265625, -2.39404296875, -2.239013671875, -2.083984375, -1.928955078125, -1.77392578125, -1.618896484375, -1.4638671875, -1.308837890625, -1.15380859375, -0.998779296875, -0.84375, -0.688720703125, -0.53369140625, -0.378662109375, -0.2236328125, -0.068603515625, 0.08642578125, 0.241455078125, 0.396484375, 0.551513671875, 0.70654296875, 0.861572265625, 1.0166015625, 1.171630859375, 1.32666015625, 1.481689453125, 1.63671875, 1.791748046875, 1.94677734375, 2.101806640625, 2.2568359375, 2.411865234375, 2.56689453125, 2.721923828125, 2.876953125, 3.031982421875, 3.18701171875, 3.342041015625, 3.4970703125, 3.652099609375, 3.80712890625, 3.962158203125, 4.1171875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 7.0, 11.0, 7.0, 17.0, 24.0, 24.0, 43.0, 44.0, 55.0, 76.0, 84.0, 71.0, 125.0, 132.0, 161.0, 159.0, 183.0, 193.0, 236.0, 235.0, 237.0, 223.0, 219.0, 209.0, 186.0, 152.0, 169.0, 131.0, 89.0, 103.0, 102.0, 69.0, 60.0, 58.0, 37.0, 41.0, 31.0, 19.0, 12.0, 13.0, 7.0, 8.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.751953125, -2.67779541015625, -2.6036376953125, -2.52947998046875, -2.455322265625, -2.38116455078125, -2.3070068359375, -2.23284912109375, -2.15869140625, -2.08453369140625, -2.0103759765625, -1.93621826171875, -1.862060546875, -1.78790283203125, -1.7137451171875, -1.63958740234375, -1.5654296875, -1.49127197265625, -1.4171142578125, -1.34295654296875, -1.268798828125, -1.19464111328125, -1.1204833984375, -1.04632568359375, -0.97216796875, -0.89801025390625, -0.8238525390625, -0.74969482421875, -0.675537109375, -0.60137939453125, -0.5272216796875, -0.45306396484375, -0.37890625, -0.30474853515625, -0.2305908203125, -0.15643310546875, -0.082275390625, -0.00811767578125, 0.0660400390625, 0.14019775390625, 0.21435546875, 0.28851318359375, 0.3626708984375, 0.43682861328125, 0.510986328125, 0.58514404296875, 0.6593017578125, 0.73345947265625, 0.8076171875, 0.88177490234375, 0.9559326171875, 1.03009033203125, 1.104248046875, 1.17840576171875, 1.2525634765625, 1.32672119140625, 1.40087890625, 1.47503662109375, 1.5491943359375, 1.62335205078125, 1.697509765625, 1.77166748046875, 1.8458251953125, 1.91998291015625, 1.994140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 6.0, 10.0, 11.0, 4.0, 17.0, 17.0, 27.0, 18.0, 28.0, 26.0, 31.0, 44.0, 34.0, 40.0, 37.0, 49.0, 50.0, 58.0, 37.0, 48.0, 37.0, 51.0, 46.0, 33.0, 34.0, 30.0, 26.0, 25.0, 22.0, 21.0, 14.0, 12.0, 16.0, 4.0, 9.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.513049125671387, -4.347337245941162, -4.181625843048096, -4.015913963317871, -3.8502025604248047, -3.68449068069458, -3.5187790393829346, -3.353067398071289, -3.1873557567596436, -3.021644115447998, -2.8559324741363525, -2.690220832824707, -2.5245089530944824, -2.358797550201416, -2.1930856704711914, -2.027374029159546, -1.8616623878479004, -1.6959507465362549, -1.5302391052246094, -1.3645273447036743, -1.1988157033920288, -1.0331040620803833, -0.867392361164093, -0.7016806602478027, -0.5359690189361572, -0.37025734782218933, -0.20454567670822144, -0.03883400559425354, 0.12687766551971436, 0.29258930683135986, 0.45830100774765015, 0.6240127086639404, 0.7897238731384277, 0.9554355144500732, 1.1211471557617188, 1.2868589162826538, 1.4525705575942993, 1.6182821989059448, 1.7839939594268799, 1.9497056007385254, 2.115417242050171, 2.2811288833618164, 2.446840524673462, 2.6125521659851074, 2.778264045715332, 2.9439754486083984, 3.109687328338623, 3.2753989696502686, 3.441110610961914, 3.6068222522735596, 3.772533893585205, 3.9382455348968506, 4.103957176208496, 4.269669055938721, 4.435380458831787, 4.601092338562012, 4.766803741455078, 4.932515621185303, 5.098227024078369, 5.263938903808594, 5.42965030670166, 5.595362186431885, 5.761073589324951, 5.926785469055176, 6.0924973487854]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 5.0, 3.0, 5.0, 9.0, 6.0, 16.0, 17.0, 10.0, 28.0, 23.0, 25.0, 36.0, 32.0, 30.0, 40.0, 44.0, 36.0, 39.0, 50.0, 49.0, 44.0, 47.0, 49.0, 43.0, 38.0, 33.0, 37.0, 14.0, 28.0, 20.0, 26.0, 29.0, 16.0, 13.0, 10.0, 8.0, 7.0, 10.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.271803379058838, -7.044003963470459, -6.816204071044922, -6.588404655456543, -6.360605239868164, -6.132805347442627, -5.905005931854248, -5.677206039428711, -5.449406623840332, -5.221607208251953, -4.993807315826416, -4.766007900238037, -4.5382080078125, -4.310408592224121, -4.082609176635742, -3.854809522628784, -3.627009868621826, -3.399210214614868, -3.17141056060791, -2.9436111450195312, -2.7158114910125732, -2.4880118370056152, -2.2602124214172363, -2.0324127674102783, -1.8046131134033203, -1.5768134593963623, -1.3490139245986938, -1.1212143898010254, -0.8934147357940674, -0.6656150817871094, -0.4378155469894409, -0.21001601219177246, 0.01778411865234375, 0.24558371305465698, 0.4733833074569702, 0.7011829018592834, 0.9289824962615967, 1.1567821502685547, 1.3845816850662231, 1.6123812198638916, 1.8401808738708496, 2.0679805278778076, 2.2957801818847656, 2.5235795974731445, 2.7513792514801025, 2.9791789054870605, 3.2069783210754395, 3.4347779750823975, 3.6625776290893555, 3.8903772830963135, 4.1181769371032715, 4.34597635269165, 4.5737762451171875, 4.801575660705566, 5.029375076293945, 5.257174491882324, 5.484974384307861, 5.71277379989624, 5.940573692321777, 6.168373107910156, 6.396172523498535, 6.623972415924072, 6.851771831512451, 7.079571723937988, 7.307371139526367]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 6.0, 13.0, 16.0, 40.0, 50.0, 71.0, 96.0, 154.0, 216.0, 331.0, 496.0, 788.0, 1188.0, 1738.0, 2822.0, 4463.0, 7184.0, 11660.0, 19592.0, 32623.0, 56466.0, 95577.0, 149943.0, 193222.0, 173837.0, 118761.0, 71812.0, 42094.0, 24727.0, 14693.0, 8775.0, 5448.0, 3385.0, 2169.0, 1415.0, 904.0, 594.0, 389.0, 273.0, 170.0, 99.0, 87.0, 71.0, 33.0, 20.0, 19.0, 10.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1162109375, -1.0798797607421875, -1.043548583984375, -1.0072174072265625, -0.97088623046875, -0.9345550537109375, -0.898223876953125, -0.8618927001953125, -0.8255615234375, -0.7892303466796875, -0.752899169921875, -0.7165679931640625, -0.68023681640625, -0.6439056396484375, -0.607574462890625, -0.5712432861328125, -0.534912109375, -0.4985809326171875, -0.462249755859375, -0.4259185791015625, -0.38958740234375, -0.3532562255859375, -0.316925048828125, -0.2805938720703125, -0.2442626953125, -0.2079315185546875, -0.171600341796875, -0.1352691650390625, -0.09893798828125, -0.0626068115234375, -0.026275634765625, 0.0100555419921875, 0.04638671875, 0.0827178955078125, 0.119049072265625, 0.1553802490234375, 0.19171142578125, 0.2280426025390625, 0.264373779296875, 0.3007049560546875, 0.3370361328125, 0.3733673095703125, 0.409698486328125, 0.4460296630859375, 0.48236083984375, 0.5186920166015625, 0.555023193359375, 0.5913543701171875, 0.627685546875, 0.6640167236328125, 0.700347900390625, 0.7366790771484375, 0.77301025390625, 0.8093414306640625, 0.845672607421875, 0.8820037841796875, 0.9183349609375, 0.9546661376953125, 0.990997314453125, 1.0273284912109375, 1.06365966796875, 1.0999908447265625, 1.136322021484375, 1.1726531982421875, 1.208984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 9.0, 14.0, 19.0, 26.0, 18.0, 27.0, 28.0, 40.0, 34.0, 40.0, 53.0, 38.0, 47.0, 41.0, 39.0, 54.0, 49.0, 37.0, 34.0, 33.0, 51.0, 27.0, 26.0, 22.0, 22.0, 32.0, 19.0, 15.0, 14.0, 9.0, 16.0, 8.0, 4.0, 2.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.234375, -6.998779296875, -6.76318359375, -6.527587890625, -6.2919921875, -6.056396484375, -5.82080078125, -5.585205078125, -5.349609375, -5.114013671875, -4.87841796875, -4.642822265625, -4.4072265625, -4.171630859375, -3.93603515625, -3.700439453125, -3.46484375, -3.229248046875, -2.99365234375, -2.758056640625, -2.5224609375, -2.286865234375, -2.05126953125, -1.815673828125, -1.580078125, -1.344482421875, -1.10888671875, -0.873291015625, -0.6376953125, -0.402099609375, -0.16650390625, 0.069091796875, 0.3046875, 0.540283203125, 0.77587890625, 1.011474609375, 1.2470703125, 1.482666015625, 1.71826171875, 1.953857421875, 2.189453125, 2.425048828125, 2.66064453125, 2.896240234375, 3.1318359375, 3.367431640625, 3.60302734375, 3.838623046875, 4.07421875, 4.309814453125, 4.54541015625, 4.781005859375, 5.0166015625, 5.252197265625, 5.48779296875, 5.723388671875, 5.958984375, 6.194580078125, 6.43017578125, 6.665771484375, 6.9013671875, 7.136962890625, 7.37255859375, 7.608154296875, 7.84375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 10.0, 7.0, 15.0, 26.0, 40.0, 66.0, 104.0, 168.0, 255.0, 407.0, 694.0, 1145.0, 1930.0, 3187.0, 5642.0, 10637.0, 20601.0, 57632.0, 622355.0, 252290.0, 35620.0, 16017.0, 8317.0, 4675.0, 2661.0, 1577.0, 947.0, 561.0, 368.0, 212.0, 143.0, 88.0, 63.0, 45.0, 13.0, 7.0, 10.0, 8.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.318359375, -2.253631591796875, -2.18890380859375, -2.124176025390625, -2.0594482421875, -1.994720458984375, -1.92999267578125, -1.865264892578125, -1.800537109375, -1.735809326171875, -1.67108154296875, -1.606353759765625, -1.5416259765625, -1.476898193359375, -1.41217041015625, -1.347442626953125, -1.28271484375, -1.217987060546875, -1.15325927734375, -1.088531494140625, -1.0238037109375, -0.959075927734375, -0.89434814453125, -0.829620361328125, -0.764892578125, -0.700164794921875, -0.63543701171875, -0.570709228515625, -0.5059814453125, -0.441253662109375, -0.37652587890625, -0.311798095703125, -0.2470703125, -0.182342529296875, -0.11761474609375, -0.052886962890625, 0.0118408203125, 0.076568603515625, 0.14129638671875, 0.206024169921875, 0.270751953125, 0.335479736328125, 0.40020751953125, 0.464935302734375, 0.5296630859375, 0.594390869140625, 0.65911865234375, 0.723846435546875, 0.78857421875, 0.853302001953125, 0.91802978515625, 0.982757568359375, 1.0474853515625, 1.112213134765625, 1.17694091796875, 1.241668701171875, 1.306396484375, 1.371124267578125, 1.43585205078125, 1.500579833984375, 1.5653076171875, 1.630035400390625, 1.69476318359375, 1.759490966796875, 1.82421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 5.0, 7.0, 8.0, 11.0, 7.0, 16.0, 11.0, 19.0, 14.0, 21.0, 19.0, 13.0, 23.0, 32.0, 30.0, 33.0, 31.0, 39.0, 39.0, 30.0, 37.0, 40.0, 48.0, 41.0, 41.0, 34.0, 41.0, 33.0, 31.0, 22.0, 33.0, 21.0, 26.0, 23.0, 13.0, 14.0, 18.0, 13.0, 15.0, 9.0, 14.0, 6.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-4.56640625, -4.42413330078125, -4.2818603515625, -4.13958740234375, -3.997314453125, -3.85504150390625, -3.7127685546875, -3.57049560546875, -3.42822265625, -3.28594970703125, -3.1436767578125, -3.00140380859375, -2.859130859375, -2.71685791015625, -2.5745849609375, -2.43231201171875, -2.2900390625, -2.14776611328125, -2.0054931640625, -1.86322021484375, -1.720947265625, -1.57867431640625, -1.4364013671875, -1.29412841796875, -1.15185546875, -1.00958251953125, -0.8673095703125, -0.72503662109375, -0.582763671875, -0.44049072265625, -0.2982177734375, -0.15594482421875, -0.013671875, 0.12860107421875, 0.2708740234375, 0.41314697265625, 0.555419921875, 0.69769287109375, 0.8399658203125, 0.98223876953125, 1.12451171875, 1.26678466796875, 1.4090576171875, 1.55133056640625, 1.693603515625, 1.83587646484375, 1.9781494140625, 2.12042236328125, 2.2626953125, 2.40496826171875, 2.5472412109375, 2.68951416015625, 2.831787109375, 2.97406005859375, 3.1163330078125, 3.25860595703125, 3.40087890625, 3.54315185546875, 3.6854248046875, 3.82769775390625, 3.969970703125, 4.11224365234375, 4.2545166015625, 4.39678955078125, 4.5390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 11.0, 4.0, 10.0, 16.0, 21.0, 24.0, 36.0, 38.0, 64.0, 75.0, 113.0, 156.0, 225.0, 327.0, 504.0, 763.0, 1160.0, 1745.0, 2790.0, 4634.0, 7996.0, 13927.0, 26038.0, 98710.0, 781721.0, 54350.0, 22158.0, 12198.0, 6998.0, 4310.0, 2489.0, 1672.0, 1031.0, 653.0, 413.0, 337.0, 221.0, 184.0, 113.0, 90.0, 71.0, 38.0, 32.0, 28.0, 13.0, 7.0, 14.0, 11.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.263427734375, -0.2550315856933594, -0.24663543701171875, -0.23823928833007812, -0.2298431396484375, -0.22144699096679688, -0.21305084228515625, -0.20465469360351562, -0.196258544921875, -0.18786239624023438, -0.17946624755859375, -0.17107009887695312, -0.1626739501953125, -0.15427780151367188, -0.14588165283203125, -0.13748550415039062, -0.12908935546875, -0.12069320678710938, -0.11229705810546875, -0.10390090942382812, -0.0955047607421875, -0.08710861206054688, -0.07871246337890625, -0.07031631469726562, -0.061920166015625, -0.053524017333984375, -0.04512786865234375, -0.036731719970703125, -0.0283355712890625, -0.019939422607421875, -0.01154327392578125, -0.003147125244140625, 0.0052490234375, 0.013645172119140625, 0.02204132080078125, 0.030437469482421875, 0.0388336181640625, 0.047229766845703125, 0.05562591552734375, 0.06402206420898438, 0.072418212890625, 0.08081436157226562, 0.08921051025390625, 0.09760665893554688, 0.1060028076171875, 0.11439895629882812, 0.12279510498046875, 0.13119125366210938, 0.13958740234375, 0.14798355102539062, 0.15637969970703125, 0.16477584838867188, 0.1731719970703125, 0.18156814575195312, 0.18996429443359375, 0.19836044311523438, 0.206756591796875, 0.21515274047851562, 0.22354888916015625, 0.23194503784179688, 0.2403411865234375, 0.24873733520507812, 0.25713348388671875, 0.2655296325683594, 0.27392578125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 7.0, 4.0, 7.0, 11.0, 14.0, 19.0, 15.0, 17.0, 32.0, 34.0, 34.0, 26.0, 28.0, 44.0, 36.0, 52.0, 47.0, 43.0, 47.0, 42.0, 46.0, 54.0, 35.0, 29.0, 36.0, 30.0, 42.0, 29.0, 23.0, 10.0, 14.0, 12.0, 18.0, 8.0, 7.0, 14.0, 10.0, 2.0, 7.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.106231689453125e-06, -7.797963917255402e-06, -7.489696145057678e-06, -7.181428372859955e-06, -6.8731606006622314e-06, -6.564892828464508e-06, -6.256625056266785e-06, -5.948357284069061e-06, -5.640089511871338e-06, -5.3318217396736145e-06, -5.023553967475891e-06, -4.715286195278168e-06, -4.407018423080444e-06, -4.098750650882721e-06, -3.7904828786849976e-06, -3.482215106487274e-06, -3.1739473342895508e-06, -2.8656795620918274e-06, -2.557411789894104e-06, -2.2491440176963806e-06, -1.9408762454986572e-06, -1.6326084733009338e-06, -1.3243407011032104e-06, -1.016072928905487e-06, -7.078051567077637e-07, -3.995373845100403e-07, -9.12696123123169e-08, 2.169981598854065e-07, 5.252659320831299e-07, 8.335337042808533e-07, 1.1418014764785767e-06, 1.4500692486763e-06, 1.7583370208740234e-06, 2.066604793071747e-06, 2.3748725652694702e-06, 2.6831403374671936e-06, 2.991408109664917e-06, 3.2996758818626404e-06, 3.6079436540603638e-06, 3.916211426258087e-06, 4.2244791984558105e-06, 4.532746970653534e-06, 4.841014742851257e-06, 5.149282515048981e-06, 5.457550287246704e-06, 5.7658180594444275e-06, 6.074085831642151e-06, 6.382353603839874e-06, 6.690621376037598e-06, 6.998889148235321e-06, 7.3071569204330444e-06, 7.615424692630768e-06, 7.923692464828491e-06, 8.231960237026215e-06, 8.540228009223938e-06, 8.848495781421661e-06, 9.156763553619385e-06, 9.465031325817108e-06, 9.773299098014832e-06, 1.0081566870212555e-05, 1.0389834642410278e-05, 1.0698102414608002e-05, 1.1006370186805725e-05, 1.1314637959003448e-05, 1.1622905731201172e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 3.0, 7.0, 11.0, 13.0, 11.0, 20.0, 21.0, 39.0, 46.0, 79.0, 104.0, 150.0, 253.0, 342.0, 470.0, 708.0, 1102.0, 1766.0, 2750.0, 4293.0, 6834.0, 11189.0, 18099.0, 30011.0, 49979.0, 84560.0, 137604.0, 194611.0, 185303.0, 125906.0, 75867.0, 45162.0, 27283.0, 16456.0, 10101.0, 6238.0, 3843.0, 2505.0, 1586.0, 1123.0, 715.0, 433.0, 307.0, 189.0, 131.0, 106.0, 67.0, 47.0, 44.0, 21.0, 20.0, 14.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0], "bins": [-0.235107421875, -0.2277374267578125, -0.220367431640625, -0.2129974365234375, -0.20562744140625, -0.1982574462890625, -0.190887451171875, -0.1835174560546875, -0.1761474609375, -0.1687774658203125, -0.161407470703125, -0.1540374755859375, -0.14666748046875, -0.1392974853515625, -0.131927490234375, -0.1245574951171875, -0.1171875, -0.1098175048828125, -0.102447509765625, -0.0950775146484375, -0.08770751953125, -0.0803375244140625, -0.072967529296875, -0.0655975341796875, -0.0582275390625, -0.0508575439453125, -0.043487548828125, -0.0361175537109375, -0.02874755859375, -0.0213775634765625, -0.014007568359375, -0.0066375732421875, 0.000732421875, 0.0081024169921875, 0.015472412109375, 0.0228424072265625, 0.03021240234375, 0.0375823974609375, 0.044952392578125, 0.0523223876953125, 0.0596923828125, 0.0670623779296875, 0.074432373046875, 0.0818023681640625, 0.08917236328125, 0.0965423583984375, 0.103912353515625, 0.1112823486328125, 0.11865234375, 0.1260223388671875, 0.133392333984375, 0.1407623291015625, 0.14813232421875, 0.1555023193359375, 0.162872314453125, 0.1702423095703125, 0.1776123046875, 0.1849822998046875, 0.192352294921875, 0.1997222900390625, 0.20709228515625, 0.2144622802734375, 0.221832275390625, 0.2292022705078125, 0.236572265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 14.0, 16.0, 16.0, 23.0, 54.0, 59.0, 69.0, 94.0, 117.0, 106.0, 100.0, 77.0, 65.0, 39.0, 35.0, 32.0, 24.0, 16.0, 11.0, 5.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.115966796875, -0.11168861389160156, -0.10741043090820312, -0.10313224792480469, -0.09885406494140625, -0.09457588195800781, -0.09029769897460938, -0.08601951599121094, -0.0817413330078125, -0.07746315002441406, -0.07318496704101562, -0.06890678405761719, -0.06462860107421875, -0.06035041809082031, -0.056072235107421875, -0.05179405212402344, -0.047515869140625, -0.04323768615722656, -0.038959503173828125, -0.03468132019042969, -0.03040313720703125, -0.026124954223632812, -0.021846771240234375, -0.017568588256835938, -0.0132904052734375, -0.009012222290039062, -0.004734039306640625, -0.0004558563232421875, 0.00382232666015625, 0.008100509643554688, 0.012378692626953125, 0.016656875610351562, 0.02093505859375, 0.025213241577148438, 0.029491424560546875, 0.03376960754394531, 0.03804779052734375, 0.04232597351074219, 0.046604156494140625, 0.05088233947753906, 0.0551605224609375, 0.05943870544433594, 0.06371688842773438, 0.06799507141113281, 0.07227325439453125, 0.07655143737792969, 0.08082962036132812, 0.08510780334472656, 0.089385986328125, 0.09366416931152344, 0.09794235229492188, 0.10222053527832031, 0.10649871826171875, 0.11077690124511719, 0.11505508422851562, 0.11933326721191406, 0.1236114501953125, 0.12788963317871094, 0.13216781616210938, 0.1364459991455078, 0.14072418212890625, 0.1450023651123047, 0.14928054809570312, 0.15355873107910156, 0.1578369140625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 8.0, 10.0, 9.0, 6.0, 19.0, 23.0, 20.0, 28.0, 25.0, 32.0, 40.0, 36.0, 39.0, 45.0, 44.0, 50.0, 55.0, 39.0, 46.0, 45.0, 44.0, 41.0, 38.0, 33.0, 31.0, 39.0, 19.0, 25.0, 18.0, 21.0, 9.0, 12.0, 9.0, 6.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.552606582641602, -4.386341094970703, -4.2200751304626465, -4.053809642791748, -3.8875439167022705, -3.721278190612793, -3.5550127029418945, -3.388746976852417, -3.2224812507629395, -3.056215524673462, -2.8899500370025635, -2.723684310913086, -2.5574185848236084, -2.391152858734131, -2.2248873710632324, -2.058621644973755, -1.8923561573028564, -1.7260905504226685, -1.559824824333191, -1.393559217453003, -1.2272934913635254, -1.0610278844833374, -0.8947622776031494, -0.7284965515136719, -0.5622309446334839, -0.3959652781486511, -0.22969964146614075, -0.06343400478363037, 0.10283166170120239, 0.26909732818603516, 0.43536293506622314, 0.6016286611557007, 0.7678942680358887, 0.9341599345207214, 1.1004256010055542, 1.2666912078857422, 1.4329569339752197, 1.5992225408554077, 1.7654881477355957, 1.9317538738250732, 2.098019599914551, 2.2642853260040283, 2.4305508136749268, 2.5968165397644043, 2.763082265853882, 2.9293479919433594, 3.095613479614258, 3.2618792057037354, 3.428144693374634, 3.5944104194641113, 3.7606759071350098, 3.9269416332244873, 4.093207359313965, 4.259472846984863, 4.425738334655762, 4.592004299163818, 4.758269786834717, 4.924535274505615, 5.090801239013672, 5.25706672668457, 5.423332214355469, 5.589598178863525, 5.755863666534424, 5.9221296310424805, 6.088395118713379]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 6.0, 2.0, 6.0, 8.0, 6.0, 14.0, 19.0, 12.0, 26.0, 21.0, 24.0, 39.0, 28.0, 32.0, 40.0, 40.0, 40.0, 37.0, 51.0, 49.0, 42.0, 46.0, 50.0, 43.0, 40.0, 32.0, 35.0, 19.0, 25.0, 24.0, 23.0, 27.0, 20.0, 13.0, 10.0, 7.0, 6.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.203718662261963, -6.977792739868164, -6.751866817474365, -6.525940895080566, -6.300014972686768, -6.074089050292969, -5.848163604736328, -5.622237205505371, -5.3963117599487305, -5.170385837554932, -4.944459915161133, -4.718533992767334, -4.492608070373535, -4.266682147979736, -4.0407562255859375, -3.8148305416107178, -3.58890438079834, -3.362978458404541, -3.137052536010742, -2.9111266136169434, -2.6852006912231445, -2.4592747688293457, -2.233349084854126, -2.007423162460327, -1.7814972400665283, -1.5555713176727295, -1.3296453952789307, -1.1037195920944214, -0.8777936697006226, -0.6518677473068237, -0.42594194412231445, -0.20001602172851562, 0.025909423828125, 0.25183531641960144, 0.4777612090110779, 0.7036870718002319, 0.9296129941940308, 1.1555389165878296, 1.3814647197723389, 1.6073906421661377, 1.8333165645599365, 2.0592424869537354, 2.285168409347534, 2.511094093322754, 2.7370200157165527, 2.9629459381103516, 3.1888718605041504, 3.414797782897949, 3.640723705291748, 3.866649627685547, 4.092575550079346, 4.3185014724731445, 4.544427394866943, 4.770353317260742, 4.996278762817383, 5.22220516204834, 5.4481306076049805, 5.674056529998779, 5.899982452392578, 6.125908374786377, 6.351834297180176, 6.577760219573975, 6.803686141967773, 7.029611587524414, 7.255537986755371]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 5.0, 10.0, 28.0, 30.0, 41.0, 65.0, 86.0, 126.0, 188.0, 292.0, 506.0, 816.0, 1226.0, 1899.0, 3188.0, 5195.0, 8434.0, 13601.0, 22024.0, 34937.0, 53872.0, 78468.0, 105831.0, 128032.0, 136268.0, 127407.0, 104307.0, 77270.0, 53417.0, 34277.0, 21910.0, 13407.0, 7970.0, 5144.0, 3034.0, 1816.0, 1256.0, 816.0, 471.0, 319.0, 189.0, 110.0, 85.0, 50.0, 44.0, 27.0, 21.0, 15.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-4.73046875, -4.58917236328125, -4.4478759765625, -4.30657958984375, -4.165283203125, -4.02398681640625, -3.8826904296875, -3.74139404296875, -3.60009765625, -3.45880126953125, -3.3175048828125, -3.17620849609375, -3.034912109375, -2.89361572265625, -2.7523193359375, -2.61102294921875, -2.4697265625, -2.32843017578125, -2.1871337890625, -2.04583740234375, -1.904541015625, -1.76324462890625, -1.6219482421875, -1.48065185546875, -1.33935546875, -1.19805908203125, -1.0567626953125, -0.91546630859375, -0.774169921875, -0.63287353515625, -0.4915771484375, -0.35028076171875, -0.208984375, -0.06768798828125, 0.0736083984375, 0.21490478515625, 0.356201171875, 0.49749755859375, 0.6387939453125, 0.78009033203125, 0.92138671875, 1.06268310546875, 1.2039794921875, 1.34527587890625, 1.486572265625, 1.62786865234375, 1.7691650390625, 1.91046142578125, 2.0517578125, 2.19305419921875, 2.3343505859375, 2.47564697265625, 2.616943359375, 2.75823974609375, 2.8995361328125, 3.04083251953125, 3.18212890625, 3.32342529296875, 3.4647216796875, 3.60601806640625, 3.747314453125, 3.88861083984375, 4.0299072265625, 4.17120361328125, 4.3125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 3.0, 10.0, 6.0, 15.0, 11.0, 18.0, 18.0, 18.0, 31.0, 23.0, 36.0, 44.0, 41.0, 39.0, 39.0, 38.0, 51.0, 52.0, 45.0, 48.0, 39.0, 32.0, 39.0, 35.0, 47.0, 25.0, 33.0, 18.0, 23.0, 24.0, 17.0, 20.0, 13.0, 9.0, 6.0, 3.0, 3.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.18359375, -6.9656982421875, -6.747802734375, -6.5299072265625, -6.31201171875, -6.0941162109375, -5.876220703125, -5.6583251953125, -5.4404296875, -5.2225341796875, -5.004638671875, -4.7867431640625, -4.56884765625, -4.3509521484375, -4.133056640625, -3.9151611328125, -3.697265625, -3.4793701171875, -3.261474609375, -3.0435791015625, -2.82568359375, -2.6077880859375, -2.389892578125, -2.1719970703125, -1.9541015625, -1.7362060546875, -1.518310546875, -1.3004150390625, -1.08251953125, -0.8646240234375, -0.646728515625, -0.4288330078125, -0.2109375, 0.0069580078125, 0.224853515625, 0.4427490234375, 0.66064453125, 0.8785400390625, 1.096435546875, 1.3143310546875, 1.5322265625, 1.7501220703125, 1.968017578125, 2.1859130859375, 2.40380859375, 2.6217041015625, 2.839599609375, 3.0574951171875, 3.275390625, 3.4932861328125, 3.711181640625, 3.9290771484375, 4.14697265625, 4.3648681640625, 4.582763671875, 4.8006591796875, 5.0185546875, 5.2364501953125, 5.454345703125, 5.6722412109375, 5.89013671875, 6.1080322265625, 6.325927734375, 6.5438232421875, 6.76171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 3.0, 4.0, 3.0, 8.0, 26.0, 32.0, 34.0, 60.0, 99.0, 188.0, 253.0, 459.0, 782.0, 1316.0, 2162.0, 3655.0, 6537.0, 10852.0, 18488.0, 31457.0, 51085.0, 78829.0, 111706.0, 139948.0, 149407.0, 137053.0, 107695.0, 75822.0, 48134.0, 29681.0, 17830.0, 10210.0, 6081.0, 3522.0, 1995.0, 1228.0, 736.0, 465.0, 262.0, 154.0, 104.0, 59.0, 52.0, 25.0, 16.0, 10.0, 5.0, 11.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-6.078125, -5.90167236328125, -5.7252197265625, -5.54876708984375, -5.372314453125, -5.19586181640625, -5.0194091796875, -4.84295654296875, -4.66650390625, -4.49005126953125, -4.3135986328125, -4.13714599609375, -3.960693359375, -3.78424072265625, -3.6077880859375, -3.43133544921875, -3.2548828125, -3.07843017578125, -2.9019775390625, -2.72552490234375, -2.549072265625, -2.37261962890625, -2.1961669921875, -2.01971435546875, -1.84326171875, -1.66680908203125, -1.4903564453125, -1.31390380859375, -1.137451171875, -0.96099853515625, -0.7845458984375, -0.60809326171875, -0.431640625, -0.25518798828125, -0.0787353515625, 0.09771728515625, 0.274169921875, 0.45062255859375, 0.6270751953125, 0.80352783203125, 0.97998046875, 1.15643310546875, 1.3328857421875, 1.50933837890625, 1.685791015625, 1.86224365234375, 2.0386962890625, 2.21514892578125, 2.3916015625, 2.56805419921875, 2.7445068359375, 2.92095947265625, 3.097412109375, 3.27386474609375, 3.4503173828125, 3.62677001953125, 3.80322265625, 3.97967529296875, 4.1561279296875, 4.33258056640625, 4.509033203125, 4.68548583984375, 4.8619384765625, 5.03839111328125, 5.21484375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 10.0, 6.0, 4.0, 5.0, 11.0, 13.0, 16.0, 9.0, 19.0, 24.0, 20.0, 38.0, 29.0, 27.0, 25.0, 35.0, 38.0, 32.0, 24.0, 34.0, 45.0, 40.0, 40.0, 46.0, 38.0, 39.0, 39.0, 34.0, 33.0, 34.0, 28.0, 26.0, 20.0, 20.0, 9.0, 13.0, 16.0, 8.0, 17.0, 11.0, 5.0, 5.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.2890625, -4.15283203125, -4.0166015625, -3.88037109375, -3.744140625, -3.60791015625, -3.4716796875, -3.33544921875, -3.19921875, -3.06298828125, -2.9267578125, -2.79052734375, -2.654296875, -2.51806640625, -2.3818359375, -2.24560546875, -2.109375, -1.97314453125, -1.8369140625, -1.70068359375, -1.564453125, -1.42822265625, -1.2919921875, -1.15576171875, -1.01953125, -0.88330078125, -0.7470703125, -0.61083984375, -0.474609375, -0.33837890625, -0.2021484375, -0.06591796875, 0.0703125, 0.20654296875, 0.3427734375, 0.47900390625, 0.615234375, 0.75146484375, 0.8876953125, 1.02392578125, 1.16015625, 1.29638671875, 1.4326171875, 1.56884765625, 1.705078125, 1.84130859375, 1.9775390625, 2.11376953125, 2.25, 2.38623046875, 2.5224609375, 2.65869140625, 2.794921875, 2.93115234375, 3.0673828125, 3.20361328125, 3.33984375, 3.47607421875, 3.6123046875, 3.74853515625, 3.884765625, 4.02099609375, 4.1572265625, 4.29345703125, 4.4296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 12.0, 16.0, 27.0, 41.0, 62.0, 89.0, 167.0, 259.0, 409.0, 720.0, 1215.0, 1929.0, 3308.0, 5545.0, 9212.0, 15607.0, 26057.0, 42704.0, 66850.0, 97427.0, 128525.0, 146831.0, 142442.0, 119715.0, 88093.0, 58887.0, 36786.0, 22513.0, 13486.0, 7919.0, 4683.0, 2840.0, 1633.0, 1036.0, 596.0, 377.0, 212.0, 127.0, 80.0, 49.0, 27.0, 29.0, 8.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.966796875, -1.89862060546875, -1.8304443359375, -1.76226806640625, -1.694091796875, -1.62591552734375, -1.5577392578125, -1.48956298828125, -1.42138671875, -1.35321044921875, -1.2850341796875, -1.21685791015625, -1.148681640625, -1.08050537109375, -1.0123291015625, -0.94415283203125, -0.8759765625, -0.80780029296875, -0.7396240234375, -0.67144775390625, -0.603271484375, -0.53509521484375, -0.4669189453125, -0.39874267578125, -0.33056640625, -0.26239013671875, -0.1942138671875, -0.12603759765625, -0.057861328125, 0.01031494140625, 0.0784912109375, 0.14666748046875, 0.21484375, 0.28302001953125, 0.3511962890625, 0.41937255859375, 0.487548828125, 0.55572509765625, 0.6239013671875, 0.69207763671875, 0.76025390625, 0.82843017578125, 0.8966064453125, 0.96478271484375, 1.032958984375, 1.10113525390625, 1.1693115234375, 1.23748779296875, 1.3056640625, 1.37384033203125, 1.4420166015625, 1.51019287109375, 1.578369140625, 1.64654541015625, 1.7147216796875, 1.78289794921875, 1.85107421875, 1.91925048828125, 1.9874267578125, 2.05560302734375, 2.123779296875, 2.19195556640625, 2.2601318359375, 2.32830810546875, 2.396484375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 7.0, 9.0, 14.0, 20.0, 20.0, 27.0, 26.0, 30.0, 35.0, 40.0, 58.0, 57.0, 68.0, 68.0, 62.0, 59.0, 60.0, 65.0, 57.0, 41.0, 31.0, 45.0, 26.0, 18.0, 15.0, 8.0, 8.0, 8.0, 6.0, 6.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024771690368652344, -0.00023872032761573792, -0.0002297237515449524, -0.00022072717547416687, -0.00021173059940338135, -0.00020273402333259583, -0.0001937374472618103, -0.00018474087119102478, -0.00017574429512023926, -0.00016674771904945374, -0.0001577511429786682, -0.0001487545669078827, -0.00013975799083709717, -0.00013076141476631165, -0.00012176483869552612, -0.0001127682626247406, -0.00010377168655395508, -9.477511048316956e-05, -8.577853441238403e-05, -7.678195834159851e-05, -6.778538227081299e-05, -5.8788806200027466e-05, -4.979223012924194e-05, -4.079565405845642e-05, -3.17990779876709e-05, -2.2802501916885376e-05, -1.3805925846099854e-05, -4.809349775314331e-06, 4.187226295471191e-06, 1.3183802366256714e-05, 2.2180378437042236e-05, 3.117695450782776e-05, 4.017353057861328e-05, 4.9170106649398804e-05, 5.8166682720184326e-05, 6.716325879096985e-05, 7.615983486175537e-05, 8.51564109325409e-05, 9.415298700332642e-05, 0.00010314956307411194, 0.00011214613914489746, 0.00012114271521568298, 0.0001301392912864685, 0.00013913586735725403, 0.00014813244342803955, 0.00015712901949882507, 0.0001661255955696106, 0.00017512217164039612, 0.00018411874771118164, 0.00019311532378196716, 0.00020211189985275269, 0.0002111084759235382, 0.00022010505199432373, 0.00022910162806510925, 0.00023809820413589478, 0.0002470947802066803, 0.0002560913562774658, 0.00026508793234825134, 0.00027408450841903687, 0.0002830810844898224, 0.0002920776605606079, 0.00030107423663139343, 0.00031007081270217896, 0.0003190673887729645, 0.00032806396484375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 11.0, 11.0, 19.0, 32.0, 45.0, 54.0, 109.0, 206.0, 357.0, 585.0, 1017.0, 1741.0, 3121.0, 5268.0, 9330.0, 16277.0, 27889.0, 46145.0, 72167.0, 103453.0, 134564.0, 149579.0, 141522.0, 115969.0, 83825.0, 54775.0, 33698.0, 19885.0, 11643.0, 6524.0, 3760.0, 2073.0, 1188.0, 661.0, 418.0, 240.0, 148.0, 87.0, 68.0, 39.0, 22.0, 15.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052734375, -1.981170654296875, -1.90960693359375, -1.838043212890625, -1.7664794921875, -1.694915771484375, -1.62335205078125, -1.551788330078125, -1.480224609375, -1.408660888671875, -1.33709716796875, -1.265533447265625, -1.1939697265625, -1.122406005859375, -1.05084228515625, -0.979278564453125, -0.90771484375, -0.836151123046875, -0.76458740234375, -0.693023681640625, -0.6214599609375, -0.549896240234375, -0.47833251953125, -0.406768798828125, -0.335205078125, -0.263641357421875, -0.19207763671875, -0.120513916015625, -0.0489501953125, 0.022613525390625, 0.09417724609375, 0.165740966796875, 0.2373046875, 0.308868408203125, 0.38043212890625, 0.451995849609375, 0.5235595703125, 0.595123291015625, 0.66668701171875, 0.738250732421875, 0.809814453125, 0.881378173828125, 0.95294189453125, 1.024505615234375, 1.0960693359375, 1.167633056640625, 1.23919677734375, 1.310760498046875, 1.38232421875, 1.453887939453125, 1.52545166015625, 1.597015380859375, 1.6685791015625, 1.740142822265625, 1.81170654296875, 1.883270263671875, 1.954833984375, 2.026397705078125, 2.09796142578125, 2.169525146484375, 2.2410888671875, 2.312652587890625, 2.38421630859375, 2.455780029296875, 2.52734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 5.0, 11.0, 9.0, 19.0, 16.0, 18.0, 18.0, 20.0, 26.0, 29.0, 32.0, 42.0, 31.0, 55.0, 63.0, 35.0, 57.0, 45.0, 38.0, 53.0, 33.0, 45.0, 36.0, 45.0, 33.0, 20.0, 23.0, 19.0, 18.0, 16.0, 18.0, 11.0, 14.0, 4.0, 9.0, 6.0, 1.0, 6.0, 5.0, 1.0, 6.0, 2.0, 3.0], "bins": [-0.9111328125, -0.88726806640625, -0.8634033203125, -0.83953857421875, -0.815673828125, -0.79180908203125, -0.7679443359375, -0.74407958984375, -0.72021484375, -0.69635009765625, -0.6724853515625, -0.64862060546875, -0.624755859375, -0.60089111328125, -0.5770263671875, -0.55316162109375, -0.529296875, -0.50543212890625, -0.4815673828125, -0.45770263671875, -0.433837890625, -0.40997314453125, -0.3861083984375, -0.36224365234375, -0.33837890625, -0.31451416015625, -0.2906494140625, -0.26678466796875, -0.242919921875, -0.21905517578125, -0.1951904296875, -0.17132568359375, -0.1474609375, -0.12359619140625, -0.0997314453125, -0.07586669921875, -0.052001953125, -0.02813720703125, -0.0042724609375, 0.01959228515625, 0.04345703125, 0.06732177734375, 0.0911865234375, 0.11505126953125, 0.138916015625, 0.16278076171875, 0.1866455078125, 0.21051025390625, 0.234375, 0.25823974609375, 0.2821044921875, 0.30596923828125, 0.329833984375, 0.35369873046875, 0.3775634765625, 0.40142822265625, 0.42529296875, 0.44915771484375, 0.4730224609375, 0.49688720703125, 0.520751953125, 0.54461669921875, 0.5684814453125, 0.59234619140625, 0.6162109375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 2.0, 6.0, 8.0, 8.0, 16.0, 10.0, 23.0, 16.0, 25.0, 32.0, 36.0, 37.0, 36.0, 31.0, 56.0, 60.0, 51.0, 43.0, 55.0, 60.0, 45.0, 58.0, 49.0, 39.0, 28.0, 34.0, 33.0, 21.0, 22.0, 14.0, 13.0, 12.0, 4.0, 8.0, 7.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.410310745239258, -4.211811542510986, -4.013312339782715, -3.8148136138916016, -3.61631441116333, -3.4178152084350586, -3.219316244125366, -3.020817279815674, -2.8223180770874023, -2.623818874359131, -2.4253199100494385, -2.226820945739746, -2.0283217430114746, -1.8298226594924927, -1.6313235759735107, -1.4328244924545288, -1.2343254089355469, -1.035826325416565, -0.837327241897583, -0.6388281583786011, -0.44032907485961914, -0.2418299913406372, -0.04333090782165527, 0.15516817569732666, 0.3536672592163086, 0.5521663427352905, 0.7506654262542725, 0.9491645097732544, 1.1476635932922363, 1.3461626768112183, 1.5446617603302002, 1.7431608438491821, 1.941659927368164, 2.1401591300964355, 2.338658094406128, 2.5371570587158203, 2.735656261444092, 2.9341554641723633, 3.1326544284820557, 3.331153392791748, 3.5296525955200195, 3.728151798248291, 3.9266507625579834, 4.125149726867676, 4.323648929595947, 4.522148132324219, 4.720646858215332, 4.9191460609436035, 5.117645263671875, 5.3161444664001465, 5.514643669128418, 5.713142395019531, 5.911641597747803, 6.110140800476074, 6.3086395263671875, 6.507138729095459, 6.7056379318237305, 6.904137134552002, 7.102636337280273, 7.301135063171387, 7.499634265899658, 7.69813346862793, 7.896632194519043, 8.095131874084473, 8.293630599975586]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 5.0, 9.0, 6.0, 12.0, 16.0, 6.0, 11.0, 11.0, 21.0, 21.0, 30.0, 33.0, 30.0, 37.0, 38.0, 36.0, 41.0, 38.0, 42.0, 33.0, 35.0, 43.0, 44.0, 33.0, 34.0, 39.0, 31.0, 26.0, 45.0, 31.0, 27.0, 24.0, 24.0, 18.0, 14.0, 12.0, 7.0, 8.0, 7.0, 9.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.914901256561279, -7.664599418640137, -7.414297103881836, -7.163995265960693, -6.913692951202393, -6.66339111328125, -6.413088798522949, -6.162786960601807, -5.912485122680664, -5.6621832847595215, -5.411880970001221, -5.161579132080078, -4.911276817321777, -4.660974979400635, -4.410673141479492, -4.160370826721191, -3.9100685119628906, -3.659766435623169, -3.4094643592834473, -3.1591625213623047, -2.908860206604004, -2.6585583686828613, -2.4082562923431396, -2.157954216003418, -1.9076521396636963, -1.6573500633239746, -1.407047986984253, -1.1567460298538208, -0.9064439535140991, -0.6561418771743774, -0.4058399200439453, -0.15553784370422363, 0.09476375579833984, 0.34506580233573914, 0.5953678488731384, 0.8456698656082153, 1.095971941947937, 1.3462740182876587, 1.5965759754180908, 1.8468780517578125, 2.097180128097534, 2.347482204437256, 2.5977842807769775, 2.848086357116699, 3.098388195037842, 3.3486905097961426, 3.598992347717285, 3.849294424057007, 4.0995965003967285, 4.349898338317871, 4.600200653076172, 4.8505024909973145, 5.100804805755615, 5.351106643676758, 5.601408958435059, 5.851710796356201, 6.102012634277344, 6.352314472198486, 6.602616786956787, 6.85291862487793, 7.1032209396362305, 7.353522777557373, 7.603824615478516, 7.854126930236816, 8.104429244995117]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 4.0, 11.0, 12.0, 13.0, 24.0, 29.0, 38.0, 46.0, 59.0, 90.0, 113.0, 139.0, 226.0, 325.0, 483.0, 768.0, 1251.0, 2230.0, 3843.0, 5943.0, 1023647.0, 4556.0, 2664.0, 1382.0, 872.0, 554.0, 395.0, 234.0, 161.0, 125.0, 93.0, 70.0, 49.0, 42.0, 27.0, 25.0, 14.0, 13.0, 8.0, 7.0, 4.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.40509796142578, -71.55941772460938, -68.7137451171875, -65.8680648803711, -63.02238464355469, -60.17670822143555, -57.331031799316406, -54.4853515625, -51.63967514038086, -48.79399871826172, -45.94831848144531, -43.10264205932617, -40.25696563720703, -37.411285400390625, -34.565608978271484, -31.71993064880371, -28.874252319335938, -26.028573989868164, -23.18289566040039, -20.33721923828125, -17.491540908813477, -14.645862579345703, -11.800186157226562, -8.954507827758789, -6.108829498291016, -3.2631516456604004, -0.41747379302978516, 2.428203582763672, 5.273881912231445, 8.119560241699219, 10.96523666381836, 13.810914993286133, 16.656585693359375, 19.50226402282715, 22.347942352294922, 25.193618774414062, 28.039297103881836, 30.88497543334961, 33.73065185546875, 36.576332092285156, 39.4220085144043, 42.26768493652344, 45.113365173339844, 47.959041595458984, 50.804718017578125, 53.65039825439453, 56.49607467651367, 59.34175109863281, 62.18743133544922, 65.03311157226562, 67.8787841796875, 70.7244644165039, 73.57014465332031, 76.41581726074219, 79.2614974975586, 82.107177734375, 84.95285034179688, 87.79853057861328, 90.64420318603516, 93.48988342285156, 96.33556365966797, 99.18124389648438, 102.02691650390625, 104.87259674072266, 107.71827697753906]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 15.0, 17.0, 27.0, 44.0, 65.0, 76.0, 128.0, 162.0, 206.0, 303.0, 363.0, 528.0, 778.0, 981.0, 1367.0, 1836.0, 2764.0, 4291.0, 8054.0, 36259.0, 51379072.0, 15791.0, 6206.0, 3548.0, 2332.0, 1638.0, 1150.0, 926.0, 654.0, 500.0, 356.0, 274.0, 215.0, 127.0, 92.0, 71.0, 42.0, 31.0, 22.0, 13.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.5169448852539, -116.89854431152344, -113.2801513671875, -109.66175079345703, -106.04335021972656, -102.42495727539062, -98.80655670166016, -95.18815612792969, -91.56976318359375, -87.95136260986328, -84.33296966552734, -80.71456909179688, -77.0961685180664, -73.47776794433594, -69.859375, -66.24097442626953, -62.62257385253906, -59.00417709350586, -55.38577651977539, -51.76737976074219, -48.14897918701172, -44.530582427978516, -40.91218566894531, -37.293785095214844, -33.67538833618164, -30.056989669799805, -26.43859100341797, -22.820194244384766, -19.20179557800293, -15.583396911621094, -11.96500015258789, -8.346601486206055, -4.72821044921875, -1.1098122596740723, 2.5085859298706055, 6.126983642578125, 9.745382308959961, 13.363780975341797, 16.982177734375, 20.600576400756836, 24.218975067138672, 27.837373733520508, 31.455772399902344, 35.07416915893555, 38.69256591796875, 42.31096649169922, 45.92936325073242, 49.547760009765625, 53.166160583496094, 56.7845573425293, 60.402957916259766, 64.02135467529297, 67.63975524902344, 71.25814819335938, 74.87654876708984, 78.49494934082031, 82.11334228515625, 85.73174285888672, 89.35013580322266, 92.96853637695312, 96.5869369506836, 100.20533752441406, 103.82373046875, 107.44213104248047, 111.06053161621094]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 3.0, 5.0, 15.0, 16.0, 22.0, 21.0, 32.0, 35.0, 44.0, 42.0, 62.0, 57.0, 87.0, 71.0, 70.0, 68.0, 53.0, 45.0, 47.0, 35.0, 23.0, 21.0, 21.0, 12.0, 17.0, 13.0, 10.0, 9.0, 14.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-105.52364349365234, -101.81562042236328, -98.10760498046875, -94.39958190917969, -90.69155883789062, -86.98353576660156, -83.2755126953125, -79.56749725341797, -75.8594741821289, -72.15145111083984, -68.44343566894531, -64.73541259765625, -61.02738952636719, -57.319366455078125, -53.61134719848633, -49.90332794189453, -46.19530487060547, -42.487281799316406, -38.77926254272461, -35.07124328613281, -31.36322021484375, -27.65519905090332, -23.94717788696289, -20.23915672302246, -16.53113555908203, -12.823114395141602, -9.115093231201172, -5.407072067260742, -1.6990509033203125, 2.008970260620117, 5.716991424560547, 9.425012588500977, 13.133026123046875, 16.841047286987305, 20.549068450927734, 24.257089614868164, 27.965110778808594, 31.673131942749023, 35.38115310668945, 39.08917236328125, 42.79719543457031, 46.505218505859375, 50.21323776245117, 53.92125701904297, 57.62928009033203, 61.337303161621094, 65.04531860351562, 68.75334167480469, 72.46136474609375, 76.16938781738281, 79.87741088867188, 83.5854263305664, 87.29344940185547, 91.00147247314453, 94.70948791503906, 98.41751098632812, 102.12553405761719, 105.83355712890625, 109.54158020019531, 113.24959564208984, 116.9576187133789, 120.66564178466797, 124.3736572265625, 128.08168029785156, 131.78970336914062]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 6.0, 14.0, 11.0, 10.0, 18.0, 15.0, 17.0, 20.0, 17.0, 30.0, 30.0, 26.0, 36.0, 49.0, 57.0, 37.0, 60.0, 64.0, 55.0, 55.0, 46.0, 41.0, 34.0, 22.0, 27.0, 18.0, 22.0, 25.0, 12.0, 16.0, 15.0, 18.0, 6.0, 8.0, 6.0, 9.0, 5.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-116.35806274414062, -112.50479125976562, -108.65151977539062, -104.79824829101562, -100.94497680664062, -97.09170532226562, -93.23843383789062, -89.38516235351562, -85.53189086914062, -81.67861938476562, -77.82534790039062, -73.97207641601562, -70.11880493164062, -66.26553344726562, -62.412261962890625, -58.558990478515625, -54.705718994140625, -50.852447509765625, -46.999176025390625, -43.145904541015625, -39.292633056640625, -35.439361572265625, -31.586090087890625, -27.732818603515625, -23.879547119140625, -20.026275634765625, -16.173004150390625, -12.319732666015625, -8.466461181640625, -4.613189697265625, -0.759918212890625, 3.093353271484375, 6.946624755859375, 10.799896240234375, 14.653167724609375, 18.506439208984375, 22.359710693359375, 26.212982177734375, 30.066253662109375, 33.919525146484375, 37.772796630859375, 41.626068115234375, 45.479339599609375, 49.332611083984375, 53.185882568359375, 57.039154052734375, 60.892425537109375, 64.74569702148438, 68.59896850585938, 72.45223999023438, 76.30551147460938, 80.15878295898438, 84.01205444335938, 87.86532592773438, 91.71859741210938, 95.57186889648438, 99.42514038085938, 103.27841186523438, 107.13168334960938, 110.98495483398438, 114.83822631835938, 118.69149780273438, 122.54476928710938, 126.39804077148438, 130.25131225585938]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 17.0, 13.0, 14.0, 22.0, 32.0, 56.0, 68.0, 114.0, 171.0, 263.0, 439.0, 641.0, 975.0, 1516.0, 2345.0, 4018.0, 6526.0, 10886.0, 19160.0, 36048.0, 72110.0, 153543.0, 352781.0, 956837.0, 1656245.0, 511896.0, 213295.0, 95581.0, 45341.0, 22818.0, 12438.0, 7071.0, 4246.0, 2540.0, 1532.0, 947.0, 613.0, 395.0, 251.0, 168.0, 100.0, 59.0, 50.0, 24.0, 26.0, 16.0, 10.0, 13.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.7900390625, -1.7344207763671875, -1.678802490234375, -1.6231842041015625, -1.56756591796875, -1.5119476318359375, -1.456329345703125, -1.4007110595703125, -1.3450927734375, -1.2894744873046875, -1.233856201171875, -1.1782379150390625, -1.12261962890625, -1.0670013427734375, -1.011383056640625, -0.9557647705078125, -0.900146484375, -0.8445281982421875, -0.788909912109375, -0.7332916259765625, -0.67767333984375, -0.6220550537109375, -0.566436767578125, -0.5108184814453125, -0.4552001953125, -0.3995819091796875, -0.343963623046875, -0.2883453369140625, -0.23272705078125, -0.1771087646484375, -0.121490478515625, -0.0658721923828125, -0.01025390625, 0.0453643798828125, 0.100982666015625, 0.1566009521484375, 0.21221923828125, 0.2678375244140625, 0.323455810546875, 0.3790740966796875, 0.4346923828125, 0.4903106689453125, 0.545928955078125, 0.6015472412109375, 0.65716552734375, 0.7127838134765625, 0.768402099609375, 0.8240203857421875, 0.879638671875, 0.9352569580078125, 0.990875244140625, 1.0464935302734375, 1.10211181640625, 1.1577301025390625, 1.213348388671875, 1.2689666748046875, 1.3245849609375, 1.3802032470703125, 1.435821533203125, 1.4914398193359375, 1.54705810546875, 1.6026763916015625, 1.658294677734375, 1.7139129638671875, 1.76953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 9.0, 9.0, 12.0, 14.0, 20.0, 23.0, 33.0, 26.0, 34.0, 60.0, 63.0, 60.0, 72.0, 64.0, 65.0, 69.0, 65.0, 52.0, 56.0, 37.0, 31.0, 19.0, 22.0, 17.0, 13.0, 7.0, 11.0, 5.0, 3.0, 0.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2176513671875, -0.2097492218017578, -0.20184707641601562, -0.19394493103027344, -0.18604278564453125, -0.17814064025878906, -0.17023849487304688, -0.1623363494873047, -0.1544342041015625, -0.1465320587158203, -0.13862991333007812, -0.13072776794433594, -0.12282562255859375, -0.11492347717285156, -0.10702133178710938, -0.09911918640136719, -0.091217041015625, -0.08331489562988281, -0.07541275024414062, -0.06751060485839844, -0.05960845947265625, -0.05170631408691406, -0.043804168701171875, -0.03590202331542969, -0.0279998779296875, -0.020097732543945312, -0.012195587158203125, -0.0042934417724609375, 0.00360870361328125, 0.011510848999023438, 0.019412994384765625, 0.027315139770507812, 0.03521728515625, 0.04311943054199219, 0.051021575927734375, 0.05892372131347656, 0.06682586669921875, 0.07472801208496094, 0.08263015747070312, 0.09053230285644531, 0.0984344482421875, 0.10633659362792969, 0.11423873901367188, 0.12214088439941406, 0.13004302978515625, 0.13794517517089844, 0.14584732055664062, 0.1537494659423828, 0.161651611328125, 0.1695537567138672, 0.17745590209960938, 0.18535804748535156, 0.19326019287109375, 0.20116233825683594, 0.20906448364257812, 0.2169666290283203, 0.2248687744140625, 0.2327709197998047, 0.24067306518554688, 0.24857521057128906, 0.25647735595703125, 0.26437950134277344, 0.2722816467285156, 0.2801837921142578, 0.2880859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 4.0, 3.0, 5.0, 2.0, 13.0, 11.0, 29.0, 25.0, 52.0, 60.0, 89.0, 155.0, 232.0, 392.0, 817.0, 1687.0, 3636.0, 9406.0, 23959.0, 65053.0, 181185.0, 499311.0, 1379823.0, 1280836.0, 474460.0, 171672.0, 62079.0, 22939.0, 8952.0, 3822.0, 1631.0, 814.0, 409.0, 246.0, 156.0, 102.0, 64.0, 50.0, 39.0, 22.0, 22.0, 12.0, 10.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1826171875, -1.1370849609375, -1.091552734375, -1.0460205078125, -1.00048828125, -0.9549560546875, -0.909423828125, -0.8638916015625, -0.818359375, -0.7728271484375, -0.727294921875, -0.6817626953125, -0.63623046875, -0.5906982421875, -0.545166015625, -0.4996337890625, -0.4541015625, -0.4085693359375, -0.363037109375, -0.3175048828125, -0.27197265625, -0.2264404296875, -0.180908203125, -0.1353759765625, -0.08984375, -0.0443115234375, 0.001220703125, 0.0467529296875, 0.09228515625, 0.1378173828125, 0.183349609375, 0.2288818359375, 0.2744140625, 0.3199462890625, 0.365478515625, 0.4110107421875, 0.45654296875, 0.5020751953125, 0.547607421875, 0.5931396484375, 0.638671875, 0.6842041015625, 0.729736328125, 0.7752685546875, 0.82080078125, 0.8663330078125, 0.911865234375, 0.9573974609375, 1.0029296875, 1.0484619140625, 1.093994140625, 1.1395263671875, 1.18505859375, 1.2305908203125, 1.276123046875, 1.3216552734375, 1.3671875, 1.4127197265625, 1.458251953125, 1.5037841796875, 1.54931640625, 1.5948486328125, 1.640380859375, 1.6859130859375, 1.7314453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 7.0, 14.0, 26.0, 21.0, 27.0, 33.0, 25.0, 47.0, 78.0, 65.0, 89.0, 94.0, 106.0, 132.0, 149.0, 159.0, 214.0, 228.0, 271.0, 354.0, 302.0, 237.0, 190.0, 188.0, 150.0, 146.0, 117.0, 99.0, 87.0, 75.0, 56.0, 57.0, 46.0, 33.0, 26.0, 20.0, 18.0, 19.0, 12.0, 14.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.366943359375, -0.3549842834472656, -0.34302520751953125, -0.3310661315917969, -0.3191070556640625, -0.3071479797363281, -0.29518890380859375, -0.2832298278808594, -0.271270751953125, -0.2593116760253906, -0.24735260009765625, -0.23539352416992188, -0.2234344482421875, -0.21147537231445312, -0.19951629638671875, -0.18755722045898438, -0.17559814453125, -0.16363906860351562, -0.15167999267578125, -0.13972091674804688, -0.1277618408203125, -0.11580276489257812, -0.10384368896484375, -0.09188461303710938, -0.079925537109375, -0.06796646118164062, -0.05600738525390625, -0.044048309326171875, -0.0320892333984375, -0.020130157470703125, -0.00817108154296875, 0.003787994384765625, 0.0157470703125, 0.027706146240234375, 0.03966522216796875, 0.051624298095703125, 0.0635833740234375, 0.07554244995117188, 0.08750152587890625, 0.09946060180664062, 0.111419677734375, 0.12337875366210938, 0.13533782958984375, 0.14729690551757812, 0.1592559814453125, 0.17121505737304688, 0.18317413330078125, 0.19513320922851562, 0.20709228515625, 0.21905136108398438, 0.23101043701171875, 0.24296951293945312, 0.2549285888671875, 0.2668876647949219, 0.27884674072265625, 0.2908058166503906, 0.302764892578125, 0.3147239685058594, 0.32668304443359375, 0.3386421203613281, 0.3506011962890625, 0.3625602722167969, 0.37451934814453125, 0.3864784240722656, 0.3984375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 9.0, 6.0, 6.0, 10.0, 17.0, 28.0, 24.0, 40.0, 28.0, 46.0, 50.0, 72.0, 68.0, 65.0, 83.0, 54.0, 60.0, 61.0, 50.0, 46.0, 29.0, 24.0, 25.0, 13.0, 22.0, 15.0, 17.0, 5.0, 6.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.963578701019287, -3.847102165222168, -3.7306253910064697, -3.6141488552093506, -3.4976720809936523, -3.381195545196533, -3.264719009399414, -3.148242235183716, -3.0317654609680176, -2.9152889251708984, -2.7988121509552, -2.682335615158081, -2.565858840942383, -2.4493823051452637, -2.3329057693481445, -2.2164289951324463, -2.099952459335327, -1.9834758043289185, -1.8669991493225098, -1.7505226135253906, -1.6340458393096924, -1.5175693035125732, -1.4010926485061646, -1.2846159934997559, -1.1681393384933472, -1.0516626834869385, -0.9351860284805298, -0.8187094330787659, -0.7022327780723572, -0.5857561230659485, -0.46927952766418457, -0.3528028726577759, -0.2363262176513672, -0.11984957754611969, -0.0033729374408721924, 0.11310368776321411, 0.2295803427696228, 0.3460569977760315, 0.4625335931777954, 0.5790102481842041, 0.6954869031906128, 0.8119635581970215, 0.9284402132034302, 1.0449168682098389, 1.161393404006958, 1.2778701782226562, 1.3943467140197754, 1.510823369026184, 1.6273000240325928, 1.7437766790390015, 1.8602533340454102, 1.9767298698425293, 2.0932066440582275, 2.2096831798553467, 2.326159954071045, 2.442636489868164, 2.559113025665283, 2.6755895614624023, 2.7920663356781006, 2.9085428714752197, 3.025019645690918, 3.141496181488037, 3.2579727172851562, 3.3744494915008545, 3.4909262657165527]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 10.0, 4.0, 10.0, 8.0, 10.0, 19.0, 19.0, 34.0, 30.0, 26.0, 33.0, 47.0, 54.0, 54.0, 44.0, 66.0, 63.0, 58.0, 57.0, 42.0, 47.0, 37.0, 38.0, 41.0, 25.0, 15.0, 27.0, 16.0, 15.0, 14.0, 5.0, 14.0, 9.0, 3.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4074151515960693, -3.304513931274414, -3.201612710952759, -3.0987112522125244, -2.995810031890869, -2.892908811569214, -2.7900075912475586, -2.687106132507324, -2.584204912185669, -2.4813036918640137, -2.3784024715423584, -2.275501012802124, -2.1725997924804688, -2.0696985721588135, -1.9667973518371582, -1.8638960123062134, -1.760994791984558, -1.6580935716629028, -1.555192232131958, -1.4522910118103027, -1.349389672279358, -1.2464884519577026, -1.1435871124267578, -1.0406858921051025, -0.9377846121788025, -0.8348833322525024, -0.7319820523262024, -0.6290807723999023, -0.5261795520782471, -0.423278272151947, -0.320376992225647, -0.21747571229934692, -0.11457443237304688, -0.011673159897327423, 0.09122811257839203, 0.19412937760353088, 0.29703065752983093, 0.3999319076538086, 0.5028331875801086, 0.6057344675064087, 0.7086357474327087, 0.8115370273590088, 0.9144383072853088, 1.0173395872116089, 1.1202408075332642, 1.223142147064209, 1.3260433673858643, 1.4289445877075195, 1.5318459272384644, 1.6347471475601196, 1.7376484870910645, 1.8405497074127197, 1.9434510469436646, 2.0463523864746094, 2.1492536067962646, 2.25215482711792, 2.355056047439575, 2.4579572677612305, 2.5608584880828857, 2.66375994682312, 2.7666611671447754, 2.8695623874664307, 2.972463607788086, 3.0753650665283203, 3.1782662868499756]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 18.0, 15.0, 33.0, 23.0, 51.0, 56.0, 113.0, 184.0, 306.0, 464.0, 771.0, 1404.0, 2365.0, 4399.0, 8831.0, 18507.0, 42260.0, 99893.0, 226219.0, 315931.0, 183874.0, 78490.0, 33377.0, 15022.0, 7193.0, 3753.0, 2019.0, 1201.0, 679.0, 406.0, 238.0, 157.0, 95.0, 63.0, 39.0, 34.0, 23.0, 8.0, 18.0, 4.0, 5.0, 7.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.869140625, -0.83953857421875, -0.8099365234375, -0.78033447265625, -0.750732421875, -0.72113037109375, -0.6915283203125, -0.66192626953125, -0.63232421875, -0.60272216796875, -0.5731201171875, -0.54351806640625, -0.513916015625, -0.48431396484375, -0.4547119140625, -0.42510986328125, -0.3955078125, -0.36590576171875, -0.3363037109375, -0.30670166015625, -0.277099609375, -0.24749755859375, -0.2178955078125, -0.18829345703125, -0.15869140625, -0.12908935546875, -0.0994873046875, -0.06988525390625, -0.040283203125, -0.01068115234375, 0.0189208984375, 0.04852294921875, 0.078125, 0.10772705078125, 0.1373291015625, 0.16693115234375, 0.196533203125, 0.22613525390625, 0.2557373046875, 0.28533935546875, 0.31494140625, 0.34454345703125, 0.3741455078125, 0.40374755859375, 0.433349609375, 0.46295166015625, 0.4925537109375, 0.52215576171875, 0.5517578125, 0.58135986328125, 0.6109619140625, 0.64056396484375, 0.670166015625, 0.69976806640625, 0.7293701171875, 0.75897216796875, 0.78857421875, 0.81817626953125, 0.8477783203125, 0.87738037109375, 0.906982421875, 0.93658447265625, 0.9661865234375, 0.99578857421875, 1.025390625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 8.0, 2.0, 3.0, 6.0, 13.0, 19.0, 18.0, 19.0, 33.0, 26.0, 29.0, 38.0, 47.0, 72.0, 74.0, 64.0, 76.0, 62.0, 49.0, 64.0, 53.0, 44.0, 44.0, 31.0, 20.0, 26.0, 20.0, 6.0, 10.0, 8.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2249755859375, -0.21645164489746094, -0.20792770385742188, -0.1994037628173828, -0.19087982177734375, -0.1823558807373047, -0.17383193969726562, -0.16530799865722656, -0.1567840576171875, -0.14826011657714844, -0.13973617553710938, -0.1312122344970703, -0.12268829345703125, -0.11416435241699219, -0.10564041137695312, -0.09711647033691406, -0.088592529296875, -0.08006858825683594, -0.07154464721679688, -0.06302070617675781, -0.05449676513671875, -0.04597282409667969, -0.037448883056640625, -0.028924942016601562, -0.0204010009765625, -0.011877059936523438, -0.003353118896484375, 0.0051708221435546875, 0.01369476318359375, 0.022218704223632812, 0.030742645263671875, 0.03926658630371094, 0.04779052734375, 0.05631446838378906, 0.06483840942382812, 0.07336235046386719, 0.08188629150390625, 0.09041023254394531, 0.09893417358398438, 0.10745811462402344, 0.1159820556640625, 0.12450599670410156, 0.13302993774414062, 0.1415538787841797, 0.15007781982421875, 0.1586017608642578, 0.16712570190429688, 0.17564964294433594, 0.184173583984375, 0.19269752502441406, 0.20122146606445312, 0.2097454071044922, 0.21826934814453125, 0.2267932891845703, 0.23531723022460938, 0.24384117126464844, 0.2523651123046875, 0.26088905334472656, 0.2694129943847656, 0.2779369354248047, 0.28646087646484375, 0.2949848175048828, 0.3035087585449219, 0.31203269958496094, 0.320556640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 6.0, 8.0, 7.0, 26.0, 27.0, 36.0, 70.0, 112.0, 221.0, 576.0, 1407.0, 4388.0, 16336.0, 78995.0, 505894.0, 366873.0, 55430.0, 12525.0, 3548.0, 1146.0, 452.0, 203.0, 112.0, 53.0, 37.0, 21.0, 14.0, 10.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6318359375, -1.5733489990234375, -1.514862060546875, -1.4563751220703125, -1.39788818359375, -1.3394012451171875, -1.280914306640625, -1.2224273681640625, -1.1639404296875, -1.1054534912109375, -1.046966552734375, -0.9884796142578125, -0.92999267578125, -0.8715057373046875, -0.813018798828125, -0.7545318603515625, -0.696044921875, -0.6375579833984375, -0.579071044921875, -0.5205841064453125, -0.46209716796875, -0.4036102294921875, -0.345123291015625, -0.2866363525390625, -0.2281494140625, -0.1696624755859375, -0.111175537109375, -0.0526885986328125, 0.00579833984375, 0.0642852783203125, 0.122772216796875, 0.1812591552734375, 0.23974609375, 0.2982330322265625, 0.356719970703125, 0.4152069091796875, 0.47369384765625, 0.5321807861328125, 0.590667724609375, 0.6491546630859375, 0.7076416015625, 0.7661285400390625, 0.824615478515625, 0.8831024169921875, 0.94158935546875, 1.0000762939453125, 1.058563232421875, 1.1170501708984375, 1.175537109375, 1.2340240478515625, 1.292510986328125, 1.3509979248046875, 1.40948486328125, 1.4679718017578125, 1.526458740234375, 1.5849456787109375, 1.6434326171875, 1.7019195556640625, 1.760406494140625, 1.8188934326171875, 1.87738037109375, 1.9358673095703125, 1.994354248046875, 2.0528411865234375, 2.111328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 3.0, 4.0, 8.0, 5.0, 9.0, 13.0, 12.0, 14.0, 19.0, 23.0, 26.0, 29.0, 28.0, 30.0, 35.0, 33.0, 40.0, 34.0, 49.0, 50.0, 53.0, 43.0, 47.0, 43.0, 45.0, 31.0, 31.0, 21.0, 35.0, 31.0, 30.0, 15.0, 17.0, 13.0, 8.0, 10.0, 12.0, 12.0, 5.0, 9.0, 4.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1158905029296875, -1.080413818359375, -1.0449371337890625, -1.00946044921875, -0.9739837646484375, -0.938507080078125, -0.9030303955078125, -0.8675537109375, -0.8320770263671875, -0.796600341796875, -0.7611236572265625, -0.72564697265625, -0.6901702880859375, -0.654693603515625, -0.6192169189453125, -0.583740234375, -0.5482635498046875, -0.512786865234375, -0.4773101806640625, -0.44183349609375, -0.4063568115234375, -0.370880126953125, -0.3354034423828125, -0.2999267578125, -0.2644500732421875, -0.228973388671875, -0.1934967041015625, -0.15802001953125, -0.1225433349609375, -0.087066650390625, -0.0515899658203125, -0.01611328125, 0.0193634033203125, 0.054840087890625, 0.0903167724609375, 0.12579345703125, 0.1612701416015625, 0.196746826171875, 0.2322235107421875, 0.2677001953125, 0.3031768798828125, 0.338653564453125, 0.3741302490234375, 0.40960693359375, 0.4450836181640625, 0.480560302734375, 0.5160369873046875, 0.551513671875, 0.5869903564453125, 0.622467041015625, 0.6579437255859375, 0.69342041015625, 0.7288970947265625, 0.764373779296875, 0.7998504638671875, 0.8353271484375, 0.8708038330078125, 0.906280517578125, 0.9417572021484375, 0.97723388671875, 1.0127105712890625, 1.048187255859375, 1.0836639404296875, 1.119140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 6.0, 9.0, 13.0, 19.0, 31.0, 33.0, 49.0, 93.0, 125.0, 208.0, 347.0, 585.0, 1129.0, 2546.0, 6401.0, 22264.0, 144662.0, 722768.0, 116894.0, 19632.0, 5978.0, 2320.0, 1028.0, 551.0, 339.0, 171.0, 116.0, 66.0, 44.0, 28.0, 32.0, 12.0, 11.0, 5.0, 7.0, 6.0, 3.0, 2.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.478515625, -3.380401611328125, -3.28228759765625, -3.184173583984375, -3.0860595703125, -2.987945556640625, -2.88983154296875, -2.791717529296875, -2.693603515625, -2.595489501953125, -2.49737548828125, -2.399261474609375, -2.3011474609375, -2.203033447265625, -2.10491943359375, -2.006805419921875, -1.90869140625, -1.810577392578125, -1.71246337890625, -1.614349365234375, -1.5162353515625, -1.418121337890625, -1.32000732421875, -1.221893310546875, -1.123779296875, -1.025665283203125, -0.92755126953125, -0.829437255859375, -0.7313232421875, -0.633209228515625, -0.53509521484375, -0.436981201171875, -0.3388671875, -0.240753173828125, -0.14263916015625, -0.044525146484375, 0.0535888671875, 0.151702880859375, 0.24981689453125, 0.347930908203125, 0.446044921875, 0.544158935546875, 0.64227294921875, 0.740386962890625, 0.8385009765625, 0.936614990234375, 1.03472900390625, 1.132843017578125, 1.23095703125, 1.329071044921875, 1.42718505859375, 1.525299072265625, 1.6234130859375, 1.721527099609375, 1.81964111328125, 1.917755126953125, 2.015869140625, 2.113983154296875, 2.21209716796875, 2.310211181640625, 2.4083251953125, 2.506439208984375, 2.60455322265625, 2.702667236328125, 2.80078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 11.0, 12.0, 14.0, 15.0, 19.0, 36.0, 46.0, 70.0, 65.0, 92.0, 101.0, 98.0, 70.0, 75.0, 58.0, 45.0, 39.0, 25.0, 27.0, 14.0, 11.0, 7.0, 8.0, 12.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00016880035400390625, -0.00016447808593511581, -0.00016015581786632538, -0.00015583354979753494, -0.0001515112817287445, -0.00014718901365995407, -0.00014286674559116364, -0.0001385444775223732, -0.00013422220945358276, -0.00012989994138479233, -0.0001255776733160019, -0.00012125540524721146, -0.00011693313717842102, -0.00011261086910963058, -0.00010828860104084015, -0.00010396633297204971, -9.964406490325928e-05, -9.532179683446884e-05, -9.09995287656784e-05, -8.667726069688797e-05, -8.235499262809753e-05, -7.80327245593071e-05, -7.371045649051666e-05, -6.938818842172623e-05, -6.506592035293579e-05, -6.0743652284145355e-05, -5.642138421535492e-05, -5.2099116146564484e-05, -4.777684807777405e-05, -4.345458000898361e-05, -3.9132311940193176e-05, -3.481004387140274e-05, -3.0487775802612305e-05, -2.616550773382187e-05, -2.1843239665031433e-05, -1.7520971596240997e-05, -1.3198703527450562e-05, -8.876435458660126e-06, -4.55416738986969e-06, -2.3189932107925415e-07, 4.090368747711182e-06, 8.412636816501617e-06, 1.2734904885292053e-05, 1.705717295408249e-05, 2.1379441022872925e-05, 2.570170909166336e-05, 3.0023977160453796e-05, 3.434624522924423e-05, 3.866851329803467e-05, 4.2990781366825104e-05, 4.731304943561554e-05, 5.1635317504405975e-05, 5.595758557319641e-05, 6.027985364198685e-05, 6.460212171077728e-05, 6.892438977956772e-05, 7.324665784835815e-05, 7.756892591714859e-05, 8.189119398593903e-05, 8.621346205472946e-05, 9.05357301235199e-05, 9.485799819231033e-05, 9.918026626110077e-05, 0.0001035025343298912, 0.00010782480239868164]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 13.0, 13.0, 16.0, 39.0, 71.0, 90.0, 161.0, 247.0, 487.0, 1132.0, 2436.0, 6449.0, 21918.0, 122534.0, 681416.0, 170683.0, 27805.0, 7825.0, 2765.0, 1157.0, 577.0, 272.0, 167.0, 107.0, 72.0, 30.0, 30.0, 18.0, 8.0, 5.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8359375, -2.74005126953125, -2.6441650390625, -2.54827880859375, -2.452392578125, -2.35650634765625, -2.2606201171875, -2.16473388671875, -2.06884765625, -1.97296142578125, -1.8770751953125, -1.78118896484375, -1.685302734375, -1.58941650390625, -1.4935302734375, -1.39764404296875, -1.3017578125, -1.20587158203125, -1.1099853515625, -1.01409912109375, -0.918212890625, -0.82232666015625, -0.7264404296875, -0.63055419921875, -0.53466796875, -0.43878173828125, -0.3428955078125, -0.24700927734375, -0.151123046875, -0.05523681640625, 0.0406494140625, 0.13653564453125, 0.232421875, 0.32830810546875, 0.4241943359375, 0.52008056640625, 0.615966796875, 0.71185302734375, 0.8077392578125, 0.90362548828125, 0.99951171875, 1.09539794921875, 1.1912841796875, 1.28717041015625, 1.383056640625, 1.47894287109375, 1.5748291015625, 1.67071533203125, 1.7666015625, 1.86248779296875, 1.9583740234375, 2.05426025390625, 2.150146484375, 2.24603271484375, 2.3419189453125, 2.43780517578125, 2.53369140625, 2.62957763671875, 2.7254638671875, 2.82135009765625, 2.917236328125, 3.01312255859375, 3.1090087890625, 3.20489501953125, 3.30078125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 8.0, 7.0, 2.0, 3.0, 9.0, 19.0, 10.0, 17.0, 20.0, 25.0, 30.0, 43.0, 34.0, 40.0, 56.0, 58.0, 65.0, 63.0, 67.0, 69.0, 64.0, 45.0, 44.0, 44.0, 30.0, 27.0, 17.0, 25.0, 11.0, 8.0, 11.0, 9.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.98681640625, -0.9547958374023438, -0.9227752685546875, -0.8907546997070312, -0.858734130859375, -0.8267135620117188, -0.7946929931640625, -0.7626724243164062, -0.73065185546875, -0.6986312866210938, -0.6666107177734375, -0.6345901489257812, -0.602569580078125, -0.5705490112304688, -0.5385284423828125, -0.5065078735351562, -0.4744873046875, -0.44246673583984375, -0.4104461669921875, -0.37842559814453125, -0.346405029296875, -0.31438446044921875, -0.2823638916015625, -0.25034332275390625, -0.21832275390625, -0.18630218505859375, -0.1542816162109375, -0.12226104736328125, -0.090240478515625, -0.05821990966796875, -0.0261993408203125, 0.00582122802734375, 0.037841796875, 0.06986236572265625, 0.1018829345703125, 0.13390350341796875, 0.165924072265625, 0.19794464111328125, 0.2299652099609375, 0.26198577880859375, 0.29400634765625, 0.32602691650390625, 0.3580474853515625, 0.39006805419921875, 0.422088623046875, 0.45410919189453125, 0.4861297607421875, 0.5181503295898438, 0.5501708984375, 0.5821914672851562, 0.6142120361328125, 0.6462326049804688, 0.678253173828125, 0.7102737426757812, 0.7422943115234375, 0.7743148803710938, 0.80633544921875, 0.8383560180664062, 0.8703765869140625, 0.9023971557617188, 0.934417724609375, 0.9664382934570312, 0.9984588623046875, 1.0304794311523438, 1.0625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 17.0, 22.0, 66.0, 169.0, 310.0, 224.0, 111.0, 27.0, 28.0, 11.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.776371002197266, -9.921586990356445, -9.066802024841309, -8.212018013000488, -7.35723352432251, -6.502449035644531, -5.647665023803711, -4.792880535125732, -3.938096046447754, -3.0833115577697754, -2.228527307510376, -1.3737430572509766, -0.518958568572998, 0.33582592010498047, 1.1906099319458008, 2.0453944206237793, 2.900178909301758, 3.7549633979797363, 4.609747886657715, 5.464531898498535, 6.319316387176514, 7.174100875854492, 8.028884887695312, 8.883668899536133, 9.73845386505127, 10.59323787689209, 11.448022842407227, 12.302806854248047, 13.157590866088867, 14.012375831604004, 14.867159843444824, 15.721944808959961, 16.57672882080078, 17.4315128326416, 18.286296844482422, 19.141082763671875, 19.995866775512695, 20.850650787353516, 21.705434799194336, 22.560218811035156, 23.41500473022461, 24.26978874206543, 25.12457275390625, 25.979358673095703, 26.834142684936523, 27.688926696777344, 28.543710708618164, 29.398494720458984, 30.253278732299805, 31.108062744140625, 31.962846755981445, 32.817630767822266, 33.67241668701172, 34.527198791503906, 35.38198471069336, 36.23677062988281, 37.091552734375, 37.94633865356445, 38.80112075805664, 39.655906677246094, 40.51068878173828, 41.365474700927734, 42.22026062011719, 43.075042724609375, 43.92982864379883]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 6.0, 2.0, 2.0, 10.0, 8.0, 13.0, 19.0, 23.0, 40.0, 65.0, 84.0, 131.0, 108.0, 128.0, 93.0, 63.0, 46.0, 35.0, 29.0, 17.0, 9.0, 10.0, 3.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-18.889347076416016, -18.295181274414062, -17.70101547241211, -17.106849670410156, -16.512683868408203, -15.91851806640625, -15.324352264404297, -14.730186462402344, -14.13602066040039, -13.541854858398438, -12.947689056396484, -12.353523254394531, -11.759357452392578, -11.165191650390625, -10.571025848388672, -9.976860046386719, -9.382694244384766, -8.788528442382812, -8.19436264038086, -7.600196838378906, -7.006031036376953, -6.411865234375, -5.817699432373047, -5.223533630371094, -4.629367828369141, -4.0352020263671875, -3.4410362243652344, -2.8468704223632812, -2.252704620361328, -1.658538818359375, -1.0643730163574219, -0.47020721435546875, 0.12395858764648438, 0.7181243896484375, 1.3122901916503906, 1.9064559936523438, 2.500621795654297, 3.09478759765625, 3.688953399658203, 4.283119201660156, 4.877285003662109, 5.4714508056640625, 6.065616607666016, 6.659782409667969, 7.253948211669922, 7.848114013671875, 8.442279815673828, 9.036445617675781, 9.630611419677734, 10.224777221679688, 10.81894302368164, 11.413108825683594, 12.007274627685547, 12.6014404296875, 13.195606231689453, 13.789772033691406, 14.38393783569336, 14.978103637695312, 15.572269439697266, 16.16643524169922, 16.760601043701172, 17.354766845703125, 17.948932647705078, 18.54309844970703, 19.137264251708984]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 6.0, 5.0, 6.0, 7.0, 21.0, 20.0, 44.0, 49.0, 88.0, 154.0, 372.0, 753.0, 1866.0, 4792.0, 14424.0, 50742.0, 249837.0, 3376035.0, 399769.0, 67618.0, 17842.0, 5894.0, 2084.0, 938.0, 426.0, 200.0, 101.0, 63.0, 33.0, 25.0, 18.0, 14.0, 10.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3984375, -4.2391357421875, -4.079833984375, -3.9205322265625, -3.76123046875, -3.6019287109375, -3.442626953125, -3.2833251953125, -3.1240234375, -2.9647216796875, -2.805419921875, -2.6461181640625, -2.48681640625, -2.3275146484375, -2.168212890625, -2.0089111328125, -1.849609375, -1.6903076171875, -1.531005859375, -1.3717041015625, -1.21240234375, -1.0531005859375, -0.893798828125, -0.7344970703125, -0.5751953125, -0.4158935546875, -0.256591796875, -0.0972900390625, 0.06201171875, 0.2213134765625, 0.380615234375, 0.5399169921875, 0.69921875, 0.8585205078125, 1.017822265625, 1.1771240234375, 1.33642578125, 1.4957275390625, 1.655029296875, 1.8143310546875, 1.9736328125, 2.1329345703125, 2.292236328125, 2.4515380859375, 2.61083984375, 2.7701416015625, 2.929443359375, 3.0887451171875, 3.248046875, 3.4073486328125, 3.566650390625, 3.7259521484375, 3.88525390625, 4.0445556640625, 4.203857421875, 4.3631591796875, 4.5224609375, 4.6817626953125, 4.841064453125, 5.0003662109375, 5.15966796875, 5.3189697265625, 5.478271484375, 5.6375732421875, 5.796875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 2.0, 2.0, 6.0, 8.0, 1.0, 5.0, 6.0, 6.0, 18.0, 19.0, 16.0, 21.0, 26.0, 25.0, 30.0, 32.0, 35.0, 37.0, 51.0, 55.0, 55.0, 52.0, 57.0, 58.0, 58.0, 41.0, 40.0, 43.0, 41.0, 30.0, 24.0, 17.0, 18.0, 13.0, 15.0, 7.0, 6.0, 5.0, 8.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.182373046875, -0.17502212524414062, -0.16767120361328125, -0.16032028198242188, -0.1529693603515625, -0.14561843872070312, -0.13826751708984375, -0.13091659545898438, -0.123565673828125, -0.11621475219726562, -0.10886383056640625, -0.10151290893554688, -0.0941619873046875, -0.08681106567382812, -0.07946014404296875, -0.07210922241210938, -0.06475830078125, -0.057407379150390625, -0.05005645751953125, -0.042705535888671875, -0.0353546142578125, -0.028003692626953125, -0.02065277099609375, -0.013301849365234375, -0.005950927734375, 0.001399993896484375, 0.00875091552734375, 0.016101837158203125, 0.0234527587890625, 0.030803680419921875, 0.03815460205078125, 0.045505523681640625, 0.0528564453125, 0.060207366943359375, 0.06755828857421875, 0.07490921020507812, 0.0822601318359375, 0.08961105346679688, 0.09696197509765625, 0.10431289672851562, 0.111663818359375, 0.11901473999023438, 0.12636566162109375, 0.13371658325195312, 0.1410675048828125, 0.14841842651367188, 0.15576934814453125, 0.16312026977539062, 0.17047119140625, 0.17782211303710938, 0.18517303466796875, 0.19252395629882812, 0.1998748779296875, 0.20722579956054688, 0.21457672119140625, 0.22192764282226562, 0.229278564453125, 0.23662948608398438, 0.24398040771484375, 0.2513313293457031, 0.2586822509765625, 0.2660331726074219, 0.27338409423828125, 0.2807350158691406, 0.2880859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 10.0, 13.0, 18.0, 28.0, 51.0, 52.0, 112.0, 173.0, 292.0, 564.0, 1043.0, 2126.0, 4727.0, 11596.0, 31341.0, 97791.0, 383259.0, 2836117.0, 614268.0, 140897.0, 43032.0, 15225.0, 6107.0, 2578.0, 1345.0, 642.0, 363.0, 203.0, 130.0, 58.0, 55.0, 9.0, 12.0, 9.0, 11.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.126922607421875, -3.02142333984375, -2.915924072265625, -2.8104248046875, -2.704925537109375, -2.59942626953125, -2.493927001953125, -2.388427734375, -2.282928466796875, -2.17742919921875, -2.071929931640625, -1.9664306640625, -1.860931396484375, -1.75543212890625, -1.649932861328125, -1.54443359375, -1.438934326171875, -1.33343505859375, -1.227935791015625, -1.1224365234375, -1.016937255859375, -0.91143798828125, -0.805938720703125, -0.700439453125, -0.594940185546875, -0.48944091796875, -0.383941650390625, -0.2784423828125, -0.172943115234375, -0.06744384765625, 0.038055419921875, 0.1435546875, 0.249053955078125, 0.35455322265625, 0.460052490234375, 0.5655517578125, 0.671051025390625, 0.77655029296875, 0.882049560546875, 0.987548828125, 1.093048095703125, 1.19854736328125, 1.304046630859375, 1.4095458984375, 1.515045166015625, 1.62054443359375, 1.726043701171875, 1.83154296875, 1.937042236328125, 2.04254150390625, 2.148040771484375, 2.2535400390625, 2.359039306640625, 2.46453857421875, 2.570037841796875, 2.675537109375, 2.781036376953125, 2.88653564453125, 2.992034912109375, 3.0975341796875, 3.203033447265625, 3.30853271484375, 3.414031982421875, 3.51953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 5.0, 10.0, 8.0, 13.0, 19.0, 33.0, 55.0, 75.0, 146.0, 173.0, 304.0, 557.0, 1428.0, 484.0, 261.0, 167.0, 116.0, 64.0, 55.0, 26.0, 26.0, 16.0, 6.0, 11.0, 10.0, 7.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5676040649414062, -0.5468292236328125, -0.5260543823242188, -0.505279541015625, -0.48450469970703125, -0.4637298583984375, -0.44295501708984375, -0.42218017578125, -0.40140533447265625, -0.3806304931640625, -0.35985565185546875, -0.339080810546875, -0.31830596923828125, -0.2975311279296875, -0.27675628662109375, -0.2559814453125, -0.23520660400390625, -0.2144317626953125, -0.19365692138671875, -0.172882080078125, -0.15210723876953125, -0.1313323974609375, -0.11055755615234375, -0.08978271484375, -0.06900787353515625, -0.0482330322265625, -0.02745819091796875, -0.006683349609375, 0.01409149169921875, 0.0348663330078125, 0.05564117431640625, 0.076416015625, 0.09719085693359375, 0.1179656982421875, 0.13874053955078125, 0.159515380859375, 0.18029022216796875, 0.2010650634765625, 0.22183990478515625, 0.24261474609375, 0.26338958740234375, 0.2841644287109375, 0.30493927001953125, 0.325714111328125, 0.34648895263671875, 0.3672637939453125, 0.38803863525390625, 0.4088134765625, 0.42958831787109375, 0.4503631591796875, 0.47113800048828125, 0.491912841796875, 0.5126876831054688, 0.5334625244140625, 0.5542373657226562, 0.57501220703125, 0.5957870483398438, 0.6165618896484375, 0.6373367309570312, 0.658111572265625, 0.6788864135742188, 0.6996612548828125, 0.7204360961914062, 0.7412109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 23.0, 109.0, 269.0, 331.0, 184.0, 63.0, 15.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.490816116333008, -14.120329856872559, -13.749844551086426, -13.379358291625977, -13.008872032165527, -12.638385772705078, -12.267900466918945, -11.897414207458496, -11.526927947998047, -11.156441688537598, -10.785956382751465, -10.415470123291016, -10.044983863830566, -9.674497604370117, -9.304012298583984, -8.933526039123535, -8.563040733337402, -8.192554473876953, -7.822068691253662, -7.451582908630371, -7.081096649169922, -6.710610866546631, -6.34012508392334, -5.969638824462891, -5.5991530418396, -5.228667259216309, -4.858180999755859, -4.487695217132568, -4.117209434509277, -3.746723175048828, -3.376237392425537, -3.005751371383667, -2.6352643966674805, -2.2647783756256104, -1.8942924737930298, -1.5238065719604492, -1.153320550918579, -0.782834529876709, -0.41234874725341797, -0.04186272621154785, 0.32862329483032227, 0.6991092562675476, 1.069595217704773, 1.4400811195373535, 1.8105671405792236, 2.1810531616210938, 2.5515389442443848, 2.922024965286255, 3.292510986328125, 3.662997007369995, 4.033483028411865, 4.403968811035156, 4.7744550704956055, 5.1449408531188965, 5.5154266357421875, 5.885912895202637, 6.256398677825928, 6.626884460449219, 6.997370719909668, 7.367856502532959, 7.73834228515625, 8.1088285446167, 8.479314804077148, 8.849800109863281, 9.22028636932373]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 1.0, 5.0, 2.0, 4.0, 4.0, 4.0, 2.0, 10.0, 11.0, 14.0, 19.0, 15.0, 26.0, 24.0, 32.0, 38.0, 33.0, 48.0, 47.0, 38.0, 46.0, 49.0, 45.0, 60.0, 52.0, 44.0, 34.0, 34.0, 40.0, 34.0, 29.0, 33.0, 25.0, 10.0, 17.0, 17.0, 15.0, 12.0, 8.0, 1.0, 3.0, 5.0, 1.0, 6.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2363553047180176, -2.1701035499572754, -2.103851795196533, -2.037600040435791, -1.9713481664657593, -1.905096411705017, -1.8388445377349854, -1.7725927829742432, -1.706341028213501, -1.6400892734527588, -1.5738375186920166, -1.5075856447219849, -1.4413338899612427, -1.3750821352005005, -1.3088302612304688, -1.2425785064697266, -1.1763267517089844, -1.1100749969482422, -1.0438232421875, -0.9775713682174683, -0.9113196134567261, -0.8450678586959839, -0.7788160443305969, -0.71256422996521, -0.6463124752044678, -0.5800607204437256, -0.5138089060783386, -0.44755712151527405, -0.3813053369522095, -0.3150535523891449, -0.24880176782608032, -0.18254998326301575, -0.11629843711853027, -0.0500466525554657, 0.016205132007598877, 0.08245691657066345, 0.14870870113372803, 0.2149604856967926, 0.2812122702598572, 0.34746405482292175, 0.41371583938598633, 0.4799676239490509, 0.5462194085121155, 0.6124712228775024, 0.6787229776382446, 0.7449747323989868, 0.8112265467643738, 0.8774783611297607, 0.9437301158905029, 1.0099818706512451, 1.0762336254119873, 1.142485499382019, 1.2087372541427612, 1.2749890089035034, 1.3412408828735352, 1.4074926376342773, 1.4737443923950195, 1.5399961471557617, 1.606247901916504, 1.6724997758865356, 1.7387515306472778, 1.80500328540802, 1.8712551593780518, 1.937506914138794, 2.003758668899536]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 8.0, 6.0, 11.0, 18.0, 24.0, 41.0, 68.0, 79.0, 108.0, 160.0, 231.0, 354.0, 544.0, 880.0, 1429.0, 2282.0, 3675.0, 6119.0, 10131.0, 17785.0, 31649.0, 54791.0, 94288.0, 150588.0, 198024.0, 180258.0, 122046.0, 72959.0, 41734.0, 23996.0, 13442.0, 8035.0, 4785.0, 2993.0, 1752.0, 1155.0, 736.0, 458.0, 318.0, 173.0, 131.0, 99.0, 58.0, 38.0, 28.0, 14.0, 11.0, 9.0, 10.0, 11.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-1.4326171875, -1.388885498046875, -1.34515380859375, -1.301422119140625, -1.2576904296875, -1.213958740234375, -1.17022705078125, -1.126495361328125, -1.082763671875, -1.039031982421875, -0.99530029296875, -0.951568603515625, -0.9078369140625, -0.864105224609375, -0.82037353515625, -0.776641845703125, -0.73291015625, -0.689178466796875, -0.64544677734375, -0.601715087890625, -0.5579833984375, -0.514251708984375, -0.47052001953125, -0.426788330078125, -0.383056640625, -0.339324951171875, -0.29559326171875, -0.251861572265625, -0.2081298828125, -0.164398193359375, -0.12066650390625, -0.076934814453125, -0.033203125, 0.010528564453125, 0.05426025390625, 0.097991943359375, 0.1417236328125, 0.185455322265625, 0.22918701171875, 0.272918701171875, 0.316650390625, 0.360382080078125, 0.40411376953125, 0.447845458984375, 0.4915771484375, 0.535308837890625, 0.57904052734375, 0.622772216796875, 0.66650390625, 0.710235595703125, 0.75396728515625, 0.797698974609375, 0.8414306640625, 0.885162353515625, 0.92889404296875, 0.972625732421875, 1.016357421875, 1.060089111328125, 1.10382080078125, 1.147552490234375, 1.1912841796875, 1.235015869140625, 1.27874755859375, 1.322479248046875, 1.3662109375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 9.0, 5.0, 7.0, 9.0, 17.0, 15.0, 31.0, 11.0, 27.0, 31.0, 30.0, 49.0, 51.0, 57.0, 42.0, 54.0, 64.0, 52.0, 66.0, 60.0, 42.0, 43.0, 46.0, 27.0, 35.0, 21.0, 20.0, 18.0, 15.0, 9.0, 10.0, 10.0, 5.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2369384765625, -0.22899436950683594, -0.22105026245117188, -0.2131061553955078, -0.20516204833984375, -0.1972179412841797, -0.18927383422851562, -0.18132972717285156, -0.1733856201171875, -0.16544151306152344, -0.15749740600585938, -0.1495532989501953, -0.14160919189453125, -0.1336650848388672, -0.12572097778320312, -0.11777687072753906, -0.109832763671875, -0.10188865661621094, -0.09394454956054688, -0.08600044250488281, -0.07805633544921875, -0.07011222839355469, -0.062168121337890625, -0.05422401428222656, -0.0462799072265625, -0.03833580017089844, -0.030391693115234375, -0.022447586059570312, -0.01450347900390625, -0.0065593719482421875, 0.001384735107421875, 0.009328842163085938, 0.01727294921875, 0.025217056274414062, 0.033161163330078125, 0.04110527038574219, 0.04904937744140625, 0.05699348449707031, 0.06493759155273438, 0.07288169860839844, 0.0808258056640625, 0.08876991271972656, 0.09671401977539062, 0.10465812683105469, 0.11260223388671875, 0.12054634094238281, 0.12849044799804688, 0.13643455505371094, 0.144378662109375, 0.15232276916503906, 0.16026687622070312, 0.1682109832763672, 0.17615509033203125, 0.1840991973876953, 0.19204330444335938, 0.19998741149902344, 0.2079315185546875, 0.21587562561035156, 0.22381973266601562, 0.2317638397216797, 0.23970794677734375, 0.2476520538330078, 0.2555961608886719, 0.26354026794433594, 0.271484375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 10.0, 27.0, 30.0, 73.0, 130.0, 280.0, 624.0, 1478.0, 4636.0, 17044.0, 81048.0, 451525.0, 400415.0, 69281.0, 15056.0, 4356.0, 1424.0, 574.0, 229.0, 117.0, 69.0, 47.0, 24.0, 10.0, 14.0, 9.0, 6.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.685546875, -3.5858154296875, -3.486083984375, -3.3863525390625, -3.28662109375, -3.1868896484375, -3.087158203125, -2.9874267578125, -2.8876953125, -2.7879638671875, -2.688232421875, -2.5885009765625, -2.48876953125, -2.3890380859375, -2.289306640625, -2.1895751953125, -2.08984375, -1.9901123046875, -1.890380859375, -1.7906494140625, -1.69091796875, -1.5911865234375, -1.491455078125, -1.3917236328125, -1.2919921875, -1.1922607421875, -1.092529296875, -0.9927978515625, -0.89306640625, -0.7933349609375, -0.693603515625, -0.5938720703125, -0.494140625, -0.3944091796875, -0.294677734375, -0.1949462890625, -0.09521484375, 0.0045166015625, 0.104248046875, 0.2039794921875, 0.3037109375, 0.4034423828125, 0.503173828125, 0.6029052734375, 0.70263671875, 0.8023681640625, 0.902099609375, 1.0018310546875, 1.1015625, 1.2012939453125, 1.301025390625, 1.4007568359375, 1.50048828125, 1.6002197265625, 1.699951171875, 1.7996826171875, 1.8994140625, 1.9991455078125, 2.098876953125, 2.1986083984375, 2.29833984375, 2.3980712890625, 2.497802734375, 2.5975341796875, 2.697265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 12.0, 23.0, 24.0, 27.0, 32.0, 26.0, 43.0, 57.0, 74.0, 62.0, 64.0, 61.0, 55.0, 51.0, 55.0, 60.0, 53.0, 44.0, 28.0, 23.0, 24.0, 20.0, 17.0, 6.0, 11.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7099609375, -1.663330078125, -1.61669921875, -1.570068359375, -1.5234375, -1.476806640625, -1.43017578125, -1.383544921875, -1.3369140625, -1.290283203125, -1.24365234375, -1.197021484375, -1.150390625, -1.103759765625, -1.05712890625, -1.010498046875, -0.9638671875, -0.917236328125, -0.87060546875, -0.823974609375, -0.77734375, -0.730712890625, -0.68408203125, -0.637451171875, -0.5908203125, -0.544189453125, -0.49755859375, -0.450927734375, -0.404296875, -0.357666015625, -0.31103515625, -0.264404296875, -0.2177734375, -0.171142578125, -0.12451171875, -0.077880859375, -0.03125, 0.015380859375, 0.06201171875, 0.108642578125, 0.1552734375, 0.201904296875, 0.24853515625, 0.295166015625, 0.341796875, 0.388427734375, 0.43505859375, 0.481689453125, 0.5283203125, 0.574951171875, 0.62158203125, 0.668212890625, 0.71484375, 0.761474609375, 0.80810546875, 0.854736328125, 0.9013671875, 0.947998046875, 0.99462890625, 1.041259765625, 1.087890625, 1.134521484375, 1.18115234375, 1.227783203125, 1.2744140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 9.0, 28.0, 52.0, 187.0, 714.0, 3397.0, 28608.0, 618529.0, 375569.0, 18307.0, 2421.0, 500.0, 147.0, 41.0, 19.0, 9.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.140625, -9.904296875, -9.66796875, -9.431640625, -9.1953125, -8.958984375, -8.72265625, -8.486328125, -8.25, -8.013671875, -7.77734375, -7.541015625, -7.3046875, -7.068359375, -6.83203125, -6.595703125, -6.359375, -6.123046875, -5.88671875, -5.650390625, -5.4140625, -5.177734375, -4.94140625, -4.705078125, -4.46875, -4.232421875, -3.99609375, -3.759765625, -3.5234375, -3.287109375, -3.05078125, -2.814453125, -2.578125, -2.341796875, -2.10546875, -1.869140625, -1.6328125, -1.396484375, -1.16015625, -0.923828125, -0.6875, -0.451171875, -0.21484375, 0.021484375, 0.2578125, 0.494140625, 0.73046875, 0.966796875, 1.203125, 1.439453125, 1.67578125, 1.912109375, 2.1484375, 2.384765625, 2.62109375, 2.857421875, 3.09375, 3.330078125, 3.56640625, 3.802734375, 4.0390625, 4.275390625, 4.51171875, 4.748046875, 4.984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 1.0, 1.0, 10.0, 7.0, 9.0, 15.0, 20.0, 29.0, 64.0, 94.0, 128.0, 165.0, 166.0, 105.0, 71.0, 37.0, 21.0, 17.0, 8.0, 7.0, 6.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043201446533203125, -0.0004163682460784912, -0.00040072202682495117, -0.00038507580757141113, -0.0003694295883178711, -0.00035378336906433105, -0.000338137149810791, -0.000322490930557251, -0.00030684471130371094, -0.0002911984920501709, -0.00027555227279663086, -0.0002599060535430908, -0.0002442598342895508, -0.00022861361503601074, -0.0002129673957824707, -0.00019732117652893066, -0.00018167495727539062, -0.00016602873802185059, -0.00015038251876831055, -0.0001347362995147705, -0.00011909008026123047, -0.00010344386100769043, -8.779764175415039e-05, -7.215142250061035e-05, -5.650520324707031e-05, -4.0858983993530273e-05, -2.5212764739990234e-05, -9.566545486450195e-06, 6.079673767089844e-06, 2.1725893020629883e-05, 3.737211227416992e-05, 5.301833152770996e-05, 6.866455078125e-05, 8.431077003479004e-05, 9.995698928833008e-05, 0.00011560320854187012, 0.00013124942779541016, 0.0001468956470489502, 0.00016254186630249023, 0.00017818808555603027, 0.0001938343048095703, 0.00020948052406311035, 0.0002251267433166504, 0.00024077296257019043, 0.00025641918182373047, 0.0002720654010772705, 0.00028771162033081055, 0.0003033578395843506, 0.0003190040588378906, 0.00033465027809143066, 0.0003502964973449707, 0.00036594271659851074, 0.0003815889358520508, 0.0003972351551055908, 0.00041288137435913086, 0.0004285275936126709, 0.00044417381286621094, 0.000459820032119751, 0.000475466251373291, 0.0004911124706268311, 0.0005067586898803711, 0.0005224049091339111, 0.0005380511283874512, 0.0005536973476409912, 0.0005693435668945312]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 11.0, 16.0, 14.0, 22.0, 35.0, 50.0, 84.0, 134.0, 202.0, 361.0, 595.0, 1024.0, 1919.0, 3727.0, 7759.0, 17619.0, 42995.0, 114657.0, 285690.0, 330609.0, 146449.0, 54153.0, 21309.0, 9444.0, 4556.0, 2266.0, 1169.0, 688.0, 371.0, 224.0, 140.0, 75.0, 50.0, 41.0, 25.0, 20.0, 7.0, 12.0, 6.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8037109375, -1.7417755126953125, -1.679840087890625, -1.6179046630859375, -1.55596923828125, -1.4940338134765625, -1.432098388671875, -1.3701629638671875, -1.3082275390625, -1.2462921142578125, -1.184356689453125, -1.1224212646484375, -1.06048583984375, -0.9985504150390625, -0.936614990234375, -0.8746795654296875, -0.812744140625, -0.7508087158203125, -0.688873291015625, -0.6269378662109375, -0.56500244140625, -0.5030670166015625, -0.441131591796875, -0.3791961669921875, -0.3172607421875, -0.2553253173828125, -0.193389892578125, -0.1314544677734375, -0.06951904296875, -0.0075836181640625, 0.054351806640625, 0.1162872314453125, 0.17822265625, 0.2401580810546875, 0.302093505859375, 0.3640289306640625, 0.42596435546875, 0.4878997802734375, 0.549835205078125, 0.6117706298828125, 0.6737060546875, 0.7356414794921875, 0.797576904296875, 0.8595123291015625, 0.92144775390625, 0.9833831787109375, 1.045318603515625, 1.1072540283203125, 1.169189453125, 1.2311248779296875, 1.293060302734375, 1.3549957275390625, 1.41693115234375, 1.4788665771484375, 1.540802001953125, 1.6027374267578125, 1.6646728515625, 1.7266082763671875, 1.788543701171875, 1.8504791259765625, 1.91241455078125, 1.9743499755859375, 2.036285400390625, 2.0982208251953125, 2.16015625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 3.0, 8.0, 6.0, 10.0, 15.0, 6.0, 17.0, 15.0, 25.0, 42.0, 29.0, 35.0, 45.0, 57.0, 65.0, 73.0, 81.0, 62.0, 57.0, 57.0, 54.0, 47.0, 32.0, 29.0, 31.0, 29.0, 14.0, 14.0, 10.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.0406341552734375, -1.004119873046875, -0.9676055908203125, -0.93109130859375, -0.8945770263671875, -0.858062744140625, -0.8215484619140625, -0.7850341796875, -0.7485198974609375, -0.712005615234375, -0.6754913330078125, -0.63897705078125, -0.6024627685546875, -0.565948486328125, -0.5294342041015625, -0.492919921875, -0.4564056396484375, -0.419891357421875, -0.3833770751953125, -0.34686279296875, -0.3103485107421875, -0.273834228515625, -0.2373199462890625, -0.2008056640625, -0.1642913818359375, -0.127777099609375, -0.0912628173828125, -0.05474853515625, -0.0182342529296875, 0.018280029296875, 0.0547943115234375, 0.09130859375, 0.1278228759765625, 0.164337158203125, 0.2008514404296875, 0.23736572265625, 0.2738800048828125, 0.310394287109375, 0.3469085693359375, 0.3834228515625, 0.4199371337890625, 0.456451416015625, 0.4929656982421875, 0.52947998046875, 0.5659942626953125, 0.602508544921875, 0.6390228271484375, 0.675537109375, 0.7120513916015625, 0.748565673828125, 0.7850799560546875, 0.82159423828125, 0.8581085205078125, 0.894622802734375, 0.9311370849609375, 0.9676513671875, 1.0041656494140625, 1.040679931640625, 1.0771942138671875, 1.11370849609375, 1.1502227783203125, 1.186737060546875, 1.2232513427734375, 1.259765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 9.0, 14.0, 31.0, 45.0, 55.0, 87.0, 109.0, 148.0, 142.0, 114.0, 67.0, 75.0, 39.0, 13.0, 15.0, 9.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.57839584350586, -20.119382858276367, -19.660367965698242, -19.20135498046875, -18.742341995239258, -18.283329010009766, -17.82431411743164, -17.36530113220215, -16.906288146972656, -16.447275161743164, -15.988261222839355, -15.529247283935547, -15.070234298706055, -14.611220359802246, -14.152206420898438, -13.693193435668945, -13.23417854309082, -12.775164604187012, -12.31615161895752, -11.857137680053711, -11.398124694824219, -10.93911075592041, -10.480096817016602, -10.02108383178711, -9.5620698928833, -9.103055953979492, -8.64404296875, -8.185029029846191, -7.726015567779541, -7.267002105712891, -6.807988166809082, -6.348974704742432, -5.889962196350098, -5.430948734283447, -4.971935272216797, -4.512921333312988, -4.053907871246338, -3.5948944091796875, -3.135880708694458, -2.6768670082092285, -2.217853546142578, -1.7588399648666382, -1.2998263835906982, -0.8408128023147583, -0.38179922103881836, 0.07721424102783203, 0.5362279415130615, 0.995241641998291, 1.4542551040649414, 1.9132686853408813, 2.3722822666168213, 2.831295967102051, 3.290309429168701, 3.7493228912353516, 4.20833683013916, 4.6673502922058105, 5.126363754272461, 5.585377216339111, 6.044390678405762, 6.50340461730957, 6.962418079376221, 7.421431541442871, 7.88044548034668, 8.339458465576172, 8.79847240447998]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 11.0, 6.0, 10.0, 7.0, 13.0, 30.0, 39.0, 44.0, 63.0, 59.0, 77.0, 81.0, 80.0, 77.0, 80.0, 61.0, 67.0, 49.0, 28.0, 33.0, 16.0, 18.0, 10.0, 8.0, 5.0, 9.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.598836898803711, -15.177528381347656, -14.756218910217285, -14.334909439086914, -13.91360092163086, -13.492292404174805, -13.070982933044434, -12.649673461914062, -12.228364944458008, -11.807056427001953, -11.385746955871582, -10.964437484741211, -10.543128967285156, -10.121820449829102, -9.70051097869873, -9.27920150756836, -8.857892990112305, -8.43658447265625, -8.015275001525879, -7.593966007232666, -7.172657012939453, -6.75134801864624, -6.330039024353027, -5.9087300300598145, -5.487421035766602, -5.066112041473389, -4.644803047180176, -4.223494052886963, -3.80218505859375, -3.380876064300537, -2.959567070007324, -2.5382580757141113, -2.116948127746582, -1.6956391334533691, -1.2743301391601562, -0.8530211448669434, -0.43171215057373047, -0.010403156280517578, 0.4109058380126953, 0.8322148323059082, 1.253523826599121, 1.674832820892334, 2.096141815185547, 2.5174508094787598, 2.9387598037719727, 3.3600687980651855, 3.7813777923583984, 4.202686786651611, 4.623995780944824, 5.045304775238037, 5.46661376953125, 5.887922763824463, 6.309231758117676, 6.730540752410889, 7.151849746704102, 7.5731587409973145, 7.994467735290527, 8.415777206420898, 8.837085723876953, 9.258394241333008, 9.679703712463379, 10.10101318359375, 10.522321701049805, 10.94363021850586, 11.36493968963623]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 4.0, 13.0, 12.0, 28.0, 47.0, 72.0, 104.0, 202.0, 362.0, 617.0, 1286.0, 2594.0, 5371.0, 11623.0, 28220.0, 75468.0, 263871.0, 2769205.0, 795685.0, 153830.0, 49826.0, 19480.0, 8463.0, 3838.0, 1966.0, 924.0, 506.0, 273.0, 158.0, 91.0, 50.0, 39.0, 12.0, 16.0, 11.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.04296875, -4.902099609375, -4.76123046875, -4.620361328125, -4.4794921875, -4.338623046875, -4.19775390625, -4.056884765625, -3.916015625, -3.775146484375, -3.63427734375, -3.493408203125, -3.3525390625, -3.211669921875, -3.07080078125, -2.929931640625, -2.7890625, -2.648193359375, -2.50732421875, -2.366455078125, -2.2255859375, -2.084716796875, -1.94384765625, -1.802978515625, -1.662109375, -1.521240234375, -1.38037109375, -1.239501953125, -1.0986328125, -0.957763671875, -0.81689453125, -0.676025390625, -0.53515625, -0.394287109375, -0.25341796875, -0.112548828125, 0.0283203125, 0.169189453125, 0.31005859375, 0.450927734375, 0.591796875, 0.732666015625, 0.87353515625, 1.014404296875, 1.1552734375, 1.296142578125, 1.43701171875, 1.577880859375, 1.71875, 1.859619140625, 2.00048828125, 2.141357421875, 2.2822265625, 2.423095703125, 2.56396484375, 2.704833984375, 2.845703125, 2.986572265625, 3.12744140625, 3.268310546875, 3.4091796875, 3.550048828125, 3.69091796875, 3.831787109375, 3.97265625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 6.0, 12.0, 24.0, 29.0, 25.0, 31.0, 39.0, 34.0, 57.0, 55.0, 63.0, 71.0, 68.0, 70.0, 51.0, 55.0, 51.0, 54.0, 41.0, 30.0, 32.0, 23.0, 18.0, 13.0, 8.0, 7.0, 9.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3173828125, -0.3076286315917969, -0.29787445068359375, -0.2881202697753906, -0.2783660888671875, -0.2686119079589844, -0.25885772705078125, -0.24910354614257812, -0.239349365234375, -0.22959518432617188, -0.21984100341796875, -0.21008682250976562, -0.2003326416015625, -0.19057846069335938, -0.18082427978515625, -0.17107009887695312, -0.16131591796875, -0.15156173706054688, -0.14180755615234375, -0.13205337524414062, -0.1222991943359375, -0.11254501342773438, -0.10279083251953125, -0.09303665161132812, -0.083282470703125, -0.07352828979492188, -0.06377410888671875, -0.054019927978515625, -0.0442657470703125, -0.034511566162109375, -0.02475738525390625, -0.015003204345703125, -0.0052490234375, 0.004505157470703125, 0.01425933837890625, 0.024013519287109375, 0.0337677001953125, 0.043521881103515625, 0.05327606201171875, 0.06303024291992188, 0.072784423828125, 0.08253860473632812, 0.09229278564453125, 0.10204696655273438, 0.1118011474609375, 0.12155532836914062, 0.13130950927734375, 0.14106369018554688, 0.15081787109375, 0.16057205200195312, 0.17032623291015625, 0.18008041381835938, 0.1898345947265625, 0.19958877563476562, 0.20934295654296875, 0.21909713745117188, 0.228851318359375, 0.23860549926757812, 0.24835968017578125, 0.2581138610839844, 0.2678680419921875, 0.2776222229003906, 0.28737640380859375, 0.2971305847167969, 0.306884765625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 13.0, 4.0, 15.0, 22.0, 32.0, 63.0, 124.0, 289.0, 767.0, 3707.0, 35722.0, 1332028.0, 2766964.0, 48579.0, 4514.0, 863.0, 294.0, 135.0, 61.0, 37.0, 18.0, 9.0, 5.0, 5.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1484375, -8.7515869140625, -8.354736328125, -7.9578857421875, -7.56103515625, -7.1641845703125, -6.767333984375, -6.3704833984375, -5.9736328125, -5.5767822265625, -5.179931640625, -4.7830810546875, -4.38623046875, -3.9893798828125, -3.592529296875, -3.1956787109375, -2.798828125, -2.4019775390625, -2.005126953125, -1.6082763671875, -1.21142578125, -0.8145751953125, -0.417724609375, -0.0208740234375, 0.3759765625, 0.7728271484375, 1.169677734375, 1.5665283203125, 1.96337890625, 2.3602294921875, 2.757080078125, 3.1539306640625, 3.55078125, 3.9476318359375, 4.344482421875, 4.7413330078125, 5.13818359375, 5.5350341796875, 5.931884765625, 6.3287353515625, 6.7255859375, 7.1224365234375, 7.519287109375, 7.9161376953125, 8.31298828125, 8.7098388671875, 9.106689453125, 9.5035400390625, 9.900390625, 10.2972412109375, 10.694091796875, 11.0909423828125, 11.48779296875, 11.8846435546875, 12.281494140625, 12.6783447265625, 13.0751953125, 13.4720458984375, 13.868896484375, 14.2657470703125, 14.66259765625, 15.0594482421875, 15.456298828125, 15.8531494140625, 16.25]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 11.0, 10.0, 15.0, 29.0, 32.0, 43.0, 90.0, 128.0, 207.0, 296.0, 530.0, 1273.0, 571.0, 301.0, 175.0, 89.0, 81.0, 60.0, 42.0, 19.0, 23.0, 16.0, 12.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1767578125, -1.145416259765625, -1.11407470703125, -1.082733154296875, -1.0513916015625, -1.020050048828125, -0.98870849609375, -0.957366943359375, -0.926025390625, -0.894683837890625, -0.86334228515625, -0.832000732421875, -0.8006591796875, -0.769317626953125, -0.73797607421875, -0.706634521484375, -0.67529296875, -0.643951416015625, -0.61260986328125, -0.581268310546875, -0.5499267578125, -0.518585205078125, -0.48724365234375, -0.455902099609375, -0.424560546875, -0.393218994140625, -0.36187744140625, -0.330535888671875, -0.2991943359375, -0.267852783203125, -0.23651123046875, -0.205169677734375, -0.173828125, -0.142486572265625, -0.11114501953125, -0.079803466796875, -0.0484619140625, -0.017120361328125, 0.01422119140625, 0.045562744140625, 0.076904296875, 0.108245849609375, 0.13958740234375, 0.170928955078125, 0.2022705078125, 0.233612060546875, 0.26495361328125, 0.296295166015625, 0.32763671875, 0.358978271484375, 0.39031982421875, 0.421661376953125, 0.4530029296875, 0.484344482421875, 0.51568603515625, 0.547027587890625, 0.578369140625, 0.609710693359375, 0.64105224609375, 0.672393798828125, 0.7037353515625, 0.735076904296875, 0.76641845703125, 0.797760009765625, 0.8291015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 32.0, 66.0, 99.0, 188.0, 222.0, 200.0, 106.0, 50.0, 25.0, 10.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.2059326171875, -16.82863426208496, -16.451337814331055, -16.074039459228516, -15.696741104125977, -15.319443702697754, -14.942146301269531, -14.564847946166992, -14.18755054473877, -13.810253143310547, -13.432954788208008, -13.055657386779785, -12.678359985351562, -12.301061630249023, -11.9237642288208, -11.546466827392578, -11.169168472290039, -10.791871070861816, -10.414572715759277, -10.037275314331055, -9.659976959228516, -9.282679557800293, -8.90538215637207, -8.528083801269531, -8.150786399841309, -7.773488521575928, -7.396190643310547, -7.018893241882324, -6.641595363616943, -6.2642974853515625, -5.88700008392334, -5.509702205657959, -5.132403373718262, -4.755105495452881, -4.3778076171875, -4.000510215759277, -3.6232123374938965, -3.2459144592285156, -2.868616819381714, -2.491319179534912, -2.1140213012695312, -1.73672354221344, -1.3594257831573486, -0.9821280241012573, -0.604830265045166, -0.2275325059890747, 0.1497652530670166, 0.5270628929138184, 0.9043607711791992, 1.2816585302352905, 1.6589562892913818, 2.0362539291381836, 2.4135518074035645, 2.7908496856689453, 3.168147325515747, 3.545444965362549, 3.9227428436279297, 4.3000407218933105, 4.677338600158691, 5.054636001586914, 5.431933879852295, 5.809231758117676, 6.186529159545898, 6.563827037811279, 6.94112491607666]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 12.0, 10.0, 15.0, 22.0, 26.0, 28.0, 38.0, 42.0, 61.0, 44.0, 69.0, 76.0, 77.0, 71.0, 73.0, 71.0, 45.0, 54.0, 48.0, 31.0, 30.0, 24.0, 11.0, 11.0, 7.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0382323265075684, -2.8730597496032715, -2.7078871726989746, -2.5427145957946777, -2.3775417804718018, -2.212369203567505, -2.047196626663208, -1.8820239305496216, -1.7168513536453247, -1.5516787767410278, -1.3865060806274414, -1.2213335037231445, -1.0561609268188477, -0.8909882307052612, -0.7258156538009644, -0.5606429576873779, -0.39547038078308105, -0.2302977591753006, -0.06512513756752014, 0.10004746913909912, 0.26522010564804077, 0.4303927421569824, 0.5955653190612793, 0.7607380151748657, 0.9259105920791626, 1.0910831689834595, 1.256255865097046, 1.4214284420013428, 1.5866010189056396, 1.751773715019226, 1.916946291923523, 2.0821189880371094, 2.2472915649414062, 2.412464141845703, 2.57763671875, 2.742809295654297, 2.907982110977173, 3.0731546878814697, 3.2383272647857666, 3.4035000801086426, 3.5686726570129395, 3.7338452339172363, 3.899017810821533, 4.06419038772583, 4.229362964630127, 4.394536018371582, 4.559708595275879, 4.724881172180176, 4.890053749084473, 5.0552263259887695, 5.220398902893066, 5.385571479797363, 5.55074405670166, 5.715916633605957, 5.881089210510254, 6.046262264251709, 6.211434364318848, 6.3766069412231445, 6.541779518127441, 6.706952095031738, 6.872124671936035, 7.037297248840332, 7.202469825744629, 7.367642879486084, 7.532815456390381]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 4.0, 8.0, 9.0, 11.0, 12.0, 17.0, 15.0, 26.0, 26.0, 50.0, 51.0, 36.0, 58.0, 132.0, 3690.0, 309185.0, 723974.0, 10636.0, 284.0, 64.0, 55.0, 31.0, 36.0, 26.0, 26.0, 23.0, 14.0, 11.0, 7.0, 5.0, 6.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.5, -17.9879150390625, -17.475830078125, -16.9637451171875, -16.45166015625, -15.9395751953125, -15.427490234375, -14.9154052734375, -14.4033203125, -13.8912353515625, -13.379150390625, -12.8670654296875, -12.35498046875, -11.8428955078125, -11.330810546875, -10.8187255859375, -10.306640625, -9.7945556640625, -9.282470703125, -8.7703857421875, -8.25830078125, -7.7462158203125, -7.234130859375, -6.7220458984375, -6.2099609375, -5.6978759765625, -5.185791015625, -4.6737060546875, -4.16162109375, -3.6495361328125, -3.137451171875, -2.6253662109375, -2.11328125, -1.6011962890625, -1.089111328125, -0.5770263671875, -0.06494140625, 0.4471435546875, 0.959228515625, 1.4713134765625, 1.9833984375, 2.4954833984375, 3.007568359375, 3.5196533203125, 4.03173828125, 4.5438232421875, 5.055908203125, 5.5679931640625, 6.080078125, 6.5921630859375, 7.104248046875, 7.6163330078125, 8.12841796875, 8.6405029296875, 9.152587890625, 9.6646728515625, 10.1767578125, 10.6888427734375, 11.200927734375, 11.7130126953125, 12.22509765625, 12.7371826171875, 13.249267578125, 13.7613525390625, 14.2734375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 5.0, 10.0, 17.0, 40.0, 73.0, 120.0, 141.0, 166.0, 163.0, 128.0, 78.0, 48.0, 17.0, 11.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.248779296875, -0.22005081176757812, -0.19132232666015625, -0.16259384155273438, -0.1338653564453125, -0.10513687133789062, -0.07640838623046875, -0.047679901123046875, -0.018951416015625, 0.009777069091796875, 0.03850555419921875, 0.06723403930664062, 0.0959625244140625, 0.12469100952148438, 0.15341949462890625, 0.18214797973632812, 0.21087646484375, 0.23960494995117188, 0.26833343505859375, 0.2970619201660156, 0.3257904052734375, 0.3545188903808594, 0.38324737548828125, 0.4119758605957031, 0.440704345703125, 0.4694328308105469, 0.49816131591796875, 0.5268898010253906, 0.5556182861328125, 0.5843467712402344, 0.6130752563476562, 0.6418037414550781, 0.6705322265625, 0.6992607116699219, 0.7279891967773438, 0.7567176818847656, 0.7854461669921875, 0.8141746520996094, 0.8429031372070312, 0.8716316223144531, 0.900360107421875, 0.9290885925292969, 0.9578170776367188, 0.9865455627441406, 1.0152740478515625, 1.0440025329589844, 1.0727310180664062, 1.1014595031738281, 1.13018798828125, 1.1589164733886719, 1.1876449584960938, 1.2163734436035156, 1.2451019287109375, 1.2738304138183594, 1.3025588989257812, 1.3312873840332031, 1.360015869140625, 1.3887443542480469, 1.4174728393554688, 1.4462013244628906, 1.4749298095703125, 1.5036582946777344, 1.5323867797851562, 1.5611152648925781, 1.58984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 11.0, 14.0, 21.0, 12.0, 21.0, 28.0, 37.0, 55.0, 93.0, 109.0, 172.0, 279.0, 599.0, 1051.0, 2478.0, 5770.0, 15759.0, 49484.0, 174671.0, 428708.0, 258578.0, 73576.0, 22780.0, 7928.0, 3157.0, 1398.0, 712.0, 382.0, 197.0, 137.0, 81.0, 61.0, 44.0, 43.0, 31.0, 12.0, 11.0, 9.0, 10.0, 6.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.966796875, -3.828399658203125, -3.69000244140625, -3.551605224609375, -3.4132080078125, -3.274810791015625, -3.13641357421875, -2.998016357421875, -2.859619140625, -2.721221923828125, -2.58282470703125, -2.444427490234375, -2.3060302734375, -2.167633056640625, -2.02923583984375, -1.890838623046875, -1.75244140625, -1.614044189453125, -1.47564697265625, -1.337249755859375, -1.1988525390625, -1.060455322265625, -0.92205810546875, -0.783660888671875, -0.645263671875, -0.506866455078125, -0.36846923828125, -0.230072021484375, -0.0916748046875, 0.046722412109375, 0.18511962890625, 0.323516845703125, 0.4619140625, 0.600311279296875, 0.73870849609375, 0.877105712890625, 1.0155029296875, 1.153900146484375, 1.29229736328125, 1.430694580078125, 1.569091796875, 1.707489013671875, 1.84588623046875, 1.984283447265625, 2.1226806640625, 2.261077880859375, 2.39947509765625, 2.537872314453125, 2.67626953125, 2.814666748046875, 2.95306396484375, 3.091461181640625, 3.2298583984375, 3.368255615234375, 3.50665283203125, 3.645050048828125, 3.783447265625, 3.921844482421875, 4.06024169921875, 4.198638916015625, 4.3370361328125, 4.475433349609375, 4.61383056640625, 4.752227783203125, 4.890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 2.0, 6.0, 6.0, 3.0, 8.0, 11.0, 9.0, 18.0, 18.0, 11.0, 31.0, 18.0, 40.0, 38.0, 46.0, 53.0, 64.0, 49.0, 58.0, 60.0, 44.0, 45.0, 43.0, 49.0, 42.0, 38.0, 35.0, 33.0, 20.0, 26.0, 15.0, 12.0, 10.0, 10.0, 5.0, 7.0, 5.0, 6.0, 0.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.896484375, -1.8271484375, -1.7578125, -1.6884765625, -1.619140625, -1.5498046875, -1.48046875, -1.4111328125, -1.341796875, -1.2724609375, -1.203125, -1.1337890625, -1.064453125, -0.9951171875, -0.92578125, -0.8564453125, -0.787109375, -0.7177734375, -0.6484375, -0.5791015625, -0.509765625, -0.4404296875, -0.37109375, -0.3017578125, -0.232421875, -0.1630859375, -0.09375, -0.0244140625, 0.044921875, 0.1142578125, 0.18359375, 0.2529296875, 0.322265625, 0.3916015625, 0.4609375, 0.5302734375, 0.599609375, 0.6689453125, 0.73828125, 0.8076171875, 0.876953125, 0.9462890625, 1.015625, 1.0849609375, 1.154296875, 1.2236328125, 1.29296875, 1.3623046875, 1.431640625, 1.5009765625, 1.5703125, 1.6396484375, 1.708984375, 1.7783203125, 1.84765625, 1.9169921875, 1.986328125, 2.0556640625, 2.125, 2.1943359375, 2.263671875, 2.3330078125, 2.40234375, 2.4716796875, 2.541015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 9.0, 11.0, 17.0, 9.0, 32.0, 50.0, 47.0, 84.0, 145.0, 189.0, 366.0, 546.0, 1085.0, 2070.0, 4672.0, 14607.0, 97193.0, 769835.0, 130183.0, 17056.0, 5218.0, 2264.0, 1146.0, 656.0, 417.0, 234.0, 147.0, 96.0, 62.0, 31.0, 25.0, 17.0, 10.0, 4.0, 9.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.3515625, -10.075927734375, -9.80029296875, -9.524658203125, -9.2490234375, -8.973388671875, -8.69775390625, -8.422119140625, -8.146484375, -7.870849609375, -7.59521484375, -7.319580078125, -7.0439453125, -6.768310546875, -6.49267578125, -6.217041015625, -5.94140625, -5.665771484375, -5.39013671875, -5.114501953125, -4.8388671875, -4.563232421875, -4.28759765625, -4.011962890625, -3.736328125, -3.460693359375, -3.18505859375, -2.909423828125, -2.6337890625, -2.358154296875, -2.08251953125, -1.806884765625, -1.53125, -1.255615234375, -0.97998046875, -0.704345703125, -0.4287109375, -0.153076171875, 0.12255859375, 0.398193359375, 0.673828125, 0.949462890625, 1.22509765625, 1.500732421875, 1.7763671875, 2.052001953125, 2.32763671875, 2.603271484375, 2.87890625, 3.154541015625, 3.43017578125, 3.705810546875, 3.9814453125, 4.257080078125, 4.53271484375, 4.808349609375, 5.083984375, 5.359619140625, 5.63525390625, 5.910888671875, 6.1865234375, 6.462158203125, 6.73779296875, 7.013427734375, 7.2890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 12.0, 6.0, 16.0, 26.0, 46.0, 82.0, 121.0, 238.0, 176.0, 110.0, 59.0, 33.0, 28.0, 10.0, 12.0, 4.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009822845458984375, -0.0009470432996749878, -0.0009118020534515381, -0.0008765608072280884, -0.0008413195610046387, -0.000806078314781189, -0.0007708370685577393, -0.0007355958223342896, -0.0007003545761108398, -0.0006651133298873901, -0.0006298720836639404, -0.0005946308374404907, -0.000559389591217041, -0.0005241483449935913, -0.0004889070987701416, -0.0004536658525466919, -0.0004184246063232422, -0.0003831833600997925, -0.0003479421138763428, -0.00031270086765289307, -0.00027745962142944336, -0.00024221837520599365, -0.00020697712898254395, -0.00017173588275909424, -0.00013649463653564453, -0.00010125339031219482, -6.601214408874512e-05, -3.077089786529541e-05, 4.470348358154297e-06, 3.9711594581604004e-05, 7.495284080505371e-05, 0.00011019408702850342, 0.00014543533325195312, 0.00018067657947540283, 0.00021591782569885254, 0.00025115907192230225, 0.00028640031814575195, 0.00032164156436920166, 0.00035688281059265137, 0.0003921240568161011, 0.0004273653030395508, 0.0004626065492630005, 0.0004978477954864502, 0.0005330890417098999, 0.0005683302879333496, 0.0006035715341567993, 0.000638812780380249, 0.0006740540266036987, 0.0007092952728271484, 0.0007445365190505981, 0.0007797777652740479, 0.0008150190114974976, 0.0008502602577209473, 0.000885501503944397, 0.0009207427501678467, 0.0009559839963912964, 0.000991225242614746, 0.0010264664888381958, 0.0010617077350616455, 0.0010969489812850952, 0.001132190227508545, 0.0011674314737319946, 0.0012026727199554443, 0.001237913966178894, 0.0012731552124023438]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 9.0, 9.0, 6.0, 11.0, 11.0, 24.0, 45.0, 62.0, 93.0, 159.0, 333.0, 627.0, 1401.0, 3217.0, 8796.0, 39622.0, 632819.0, 323651.0, 25842.0, 6779.0, 2584.0, 1178.0, 565.0, 286.0, 170.0, 78.0, 63.0, 28.0, 25.0, 20.0, 10.0, 6.0, 6.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7109375, -9.3626708984375, -9.014404296875, -8.6661376953125, -8.31787109375, -7.9696044921875, -7.621337890625, -7.2730712890625, -6.9248046875, -6.5765380859375, -6.228271484375, -5.8800048828125, -5.53173828125, -5.1834716796875, -4.835205078125, -4.4869384765625, -4.138671875, -3.7904052734375, -3.442138671875, -3.0938720703125, -2.74560546875, -2.3973388671875, -2.049072265625, -1.7008056640625, -1.3525390625, -1.0042724609375, -0.656005859375, -0.3077392578125, 0.04052734375, 0.3887939453125, 0.737060546875, 1.0853271484375, 1.43359375, 1.7818603515625, 2.130126953125, 2.4783935546875, 2.82666015625, 3.1749267578125, 3.523193359375, 3.8714599609375, 4.2197265625, 4.5679931640625, 4.916259765625, 5.2645263671875, 5.61279296875, 5.9610595703125, 6.309326171875, 6.6575927734375, 7.005859375, 7.3541259765625, 7.702392578125, 8.0506591796875, 8.39892578125, 8.7471923828125, 9.095458984375, 9.4437255859375, 9.7919921875, 10.1402587890625, 10.488525390625, 10.8367919921875, 11.18505859375, 11.5333251953125, 11.881591796875, 12.2298583984375, 12.578125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 1.0, 6.0, 11.0, 8.0, 20.0, 21.0, 26.0, 44.0, 74.0, 129.0, 184.0, 167.0, 104.0, 61.0, 37.0, 26.0, 20.0, 11.0, 13.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.724609375, -3.599945068359375, -3.47528076171875, -3.350616455078125, -3.2259521484375, -3.101287841796875, -2.97662353515625, -2.851959228515625, -2.727294921875, -2.602630615234375, -2.47796630859375, -2.353302001953125, -2.2286376953125, -2.103973388671875, -1.97930908203125, -1.854644775390625, -1.72998046875, -1.605316162109375, -1.48065185546875, -1.355987548828125, -1.2313232421875, -1.106658935546875, -0.98199462890625, -0.857330322265625, -0.732666015625, -0.608001708984375, -0.48333740234375, -0.358673095703125, -0.2340087890625, -0.109344482421875, 0.01531982421875, 0.139984130859375, 0.2646484375, 0.389312744140625, 0.51397705078125, 0.638641357421875, 0.7633056640625, 0.887969970703125, 1.01263427734375, 1.137298583984375, 1.261962890625, 1.386627197265625, 1.51129150390625, 1.635955810546875, 1.7606201171875, 1.885284423828125, 2.00994873046875, 2.134613037109375, 2.25927734375, 2.383941650390625, 2.50860595703125, 2.633270263671875, 2.7579345703125, 2.882598876953125, 3.00726318359375, 3.131927490234375, 3.256591796875, 3.381256103515625, 3.50592041015625, 3.630584716796875, 3.7552490234375, 3.879913330078125, 4.00457763671875, 4.129241943359375, 4.25390625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 5.0, 8.0, 13.0, 14.0, 41.0, 54.0, 81.0, 128.0, 179.0, 156.0, 131.0, 80.0, 35.0, 22.0, 19.0, 7.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.483680725097656, -36.4127197265625, -35.341758728027344, -34.27079772949219, -33.19983673095703, -32.128875732421875, -31.05791473388672, -29.986953735351562, -28.915992736816406, -27.84503173828125, -26.774070739746094, -25.703109741210938, -24.63214874267578, -23.561187744140625, -22.49022674560547, -21.419265747070312, -20.348304748535156, -19.27734375, -18.206382751464844, -17.135421752929688, -16.06446075439453, -14.993499755859375, -13.922538757324219, -12.851577758789062, -11.780616760253906, -10.70965576171875, -9.638694763183594, -8.567733764648438, -7.496772766113281, -6.425811767578125, -5.354850769042969, -4.2838897705078125, -3.2129249572753906, -2.1419639587402344, -1.0710029602050781, -4.1961669921875e-05, 1.0709190368652344, 2.1418800354003906, 3.212841033935547, 4.283802032470703, 5.354763031005859, 6.425724029541016, 7.496685028076172, 8.567646026611328, 9.638607025146484, 10.70956802368164, 11.780529022216797, 12.851490020751953, 13.92245101928711, 14.993412017822266, 16.064373016357422, 17.135334014892578, 18.206295013427734, 19.27725601196289, 20.348217010498047, 21.419178009033203, 22.49013900756836, 23.561100006103516, 24.632061004638672, 25.703022003173828, 26.773983001708984, 27.84494400024414, 28.915904998779297, 29.986865997314453, 31.05782699584961]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 8.0, 5.0, 5.0, 5.0, 11.0, 12.0, 23.0, 12.0, 23.0, 30.0, 23.0, 28.0, 23.0, 35.0, 30.0, 28.0, 39.0, 58.0, 35.0, 37.0, 43.0, 31.0, 40.0, 36.0, 31.0, 45.0, 35.0, 27.0, 25.0, 30.0, 24.0, 27.0, 24.0, 17.0, 12.0, 13.0, 17.0, 12.0, 8.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-13.533905029296875, -13.115424156188965, -12.696943283081055, -12.278462409973145, -11.859981536865234, -11.441499710083008, -11.023018836975098, -10.604537963867188, -10.186057090759277, -9.767576217651367, -9.349095344543457, -8.930614471435547, -8.51213264465332, -8.093652725219727, -7.6751708984375, -7.25669002532959, -6.83820915222168, -6.4197282791137695, -6.001247406005859, -5.582766056060791, -5.164285182952881, -4.745804309844971, -4.327322959899902, -3.908842086791992, -3.490361213684082, -3.071880340576172, -2.6533992290496826, -2.2349181175231934, -1.8164372444152832, -1.397956371307373, -0.9794752597808838, -0.5609941482543945, -0.14251232147216797, 0.27596867084503174, 0.6944496631622314, 1.1129306554794312, 1.5314116477966309, 1.949892520904541, 2.3683736324310303, 2.7868547439575195, 3.2053356170654297, 3.62381649017334, 4.04229736328125, 4.460778713226318, 4.8792595863342285, 5.297740459442139, 5.716221809387207, 6.134702682495117, 6.553183555603027, 6.9716644287109375, 7.390145301818848, 7.808626651763916, 8.227108001708984, 8.645587921142578, 9.064069747924805, 9.482550621032715, 9.901031494140625, 10.319512367248535, 10.737993240356445, 11.156474113464355, 11.574954986572266, 11.993436813354492, 12.411917686462402, 12.830398559570312, 13.248879432678223]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 7.0, 36.0, 134.0, 833.0, 8909.0, 260724.0, 3877135.0, 42581.0, 2875.0, 460.0, 137.0, 79.0, 45.0, 49.0, 49.0, 37.0, 32.0, 29.0, 21.0, 23.0, 11.0, 20.0, 13.0, 7.0, 11.0, 9.0, 7.0, 3.0, 7.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.34033203125, -3.7431640625, -3.14599609375, -2.548828125, -1.95166015625, -1.3544921875, -0.75732421875, -0.16015625, 0.43701171875, 1.0341796875, 1.63134765625, 2.228515625, 2.82568359375, 3.4228515625, 4.02001953125, 4.6171875, 5.21435546875, 5.8115234375, 6.40869140625, 7.005859375, 7.60302734375, 8.2001953125, 8.79736328125, 9.39453125, 9.99169921875, 10.5888671875, 11.18603515625, 11.783203125, 12.38037109375, 12.9775390625, 13.57470703125, 14.171875, 14.76904296875, 15.3662109375, 15.96337890625, 16.560546875, 17.15771484375, 17.7548828125, 18.35205078125, 18.94921875, 19.54638671875, 20.1435546875, 20.74072265625, 21.337890625, 21.93505859375, 22.5322265625, 23.12939453125, 23.7265625, 24.32373046875, 24.9208984375, 25.51806640625, 26.115234375, 26.71240234375, 27.3095703125, 27.90673828125, 28.50390625, 29.10107421875, 29.6982421875, 30.29541015625, 30.892578125, 31.48974609375, 32.0869140625, 32.68408203125, 33.28125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 9.0, 15.0, 18.0, 45.0, 80.0, 112.0, 146.0, 146.0, 140.0, 113.0, 85.0, 52.0, 28.0, 16.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.436767578125, -0.4023704528808594, -0.36797332763671875, -0.3335762023925781, -0.2991790771484375, -0.2647819519042969, -0.23038482666015625, -0.19598770141601562, -0.161590576171875, -0.12719345092773438, -0.09279632568359375, -0.058399200439453125, -0.0240020751953125, 0.010395050048828125, 0.04479217529296875, 0.07918930053710938, 0.11358642578125, 0.14798355102539062, 0.18238067626953125, 0.21677780151367188, 0.2511749267578125, 0.2855720520019531, 0.31996917724609375, 0.3543663024902344, 0.388763427734375, 0.4231605529785156, 0.45755767822265625, 0.4919548034667969, 0.5263519287109375, 0.5607490539550781, 0.5951461791992188, 0.6295433044433594, 0.6639404296875, 0.6983375549316406, 0.7327346801757812, 0.7671318054199219, 0.8015289306640625, 0.8359260559082031, 0.8703231811523438, 0.9047203063964844, 0.939117431640625, 0.9735145568847656, 1.0079116821289062, 1.0423088073730469, 1.0767059326171875, 1.1111030578613281, 1.1455001831054688, 1.1798973083496094, 1.21429443359375, 1.2486915588378906, 1.2830886840820312, 1.3174858093261719, 1.3518829345703125, 1.3862800598144531, 1.4206771850585938, 1.4550743103027344, 1.489471435546875, 1.5238685607910156, 1.5582656860351562, 1.5926628112792969, 1.6270599365234375, 1.6614570617675781, 1.6958541870117188, 1.7302513122558594, 1.7646484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 15.0, 13.0, 12.0, 21.0, 25.0, 37.0, 60.0, 88.0, 272.0, 2964.0, 4058383.0, 131007.0, 904.0, 155.0, 78.0, 56.0, 45.0, 39.0, 37.0, 22.0, 17.0, 16.0, 7.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.46875, -47.80908203125, -46.1494140625, -44.48974609375, -42.830078125, -41.17041015625, -39.5107421875, -37.85107421875, -36.19140625, -34.53173828125, -32.8720703125, -31.21240234375, -29.552734375, -27.89306640625, -26.2333984375, -24.57373046875, -22.9140625, -21.25439453125, -19.5947265625, -17.93505859375, -16.275390625, -14.61572265625, -12.9560546875, -11.29638671875, -9.63671875, -7.97705078125, -6.3173828125, -4.65771484375, -2.998046875, -1.33837890625, 0.3212890625, 1.98095703125, 3.640625, 5.30029296875, 6.9599609375, 8.61962890625, 10.279296875, 11.93896484375, 13.5986328125, 15.25830078125, 16.91796875, 18.57763671875, 20.2373046875, 21.89697265625, 23.556640625, 25.21630859375, 26.8759765625, 28.53564453125, 30.1953125, 31.85498046875, 33.5146484375, 35.17431640625, 36.833984375, 38.49365234375, 40.1533203125, 41.81298828125, 43.47265625, 45.13232421875, 46.7919921875, 48.45166015625, 50.111328125, 51.77099609375, 53.4306640625, 55.09033203125, 56.75]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 16.0, 48.0, 154.0, 874.0, 2568.0, 297.0, 88.0, 17.0, 13.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.587249755859375, -2.39129638671875, -2.195343017578125, -1.9993896484375, -1.803436279296875, -1.60748291015625, -1.411529541015625, -1.215576171875, -1.019622802734375, -0.82366943359375, -0.627716064453125, -0.4317626953125, -0.235809326171875, -0.03985595703125, 0.156097412109375, 0.35205078125, 0.548004150390625, 0.74395751953125, 0.939910888671875, 1.1358642578125, 1.331817626953125, 1.52777099609375, 1.723724365234375, 1.919677734375, 2.115631103515625, 2.31158447265625, 2.507537841796875, 2.7034912109375, 2.899444580078125, 3.09539794921875, 3.291351318359375, 3.4873046875, 3.683258056640625, 3.87921142578125, 4.075164794921875, 4.2711181640625, 4.467071533203125, 4.66302490234375, 4.858978271484375, 5.054931640625, 5.250885009765625, 5.44683837890625, 5.642791748046875, 5.8387451171875, 6.034698486328125, 6.23065185546875, 6.426605224609375, 6.62255859375, 6.818511962890625, 7.01446533203125, 7.210418701171875, 7.4063720703125, 7.602325439453125, 7.79827880859375, 7.994232177734375, 8.190185546875, 8.386138916015625, 8.58209228515625, 8.778045654296875, 8.9739990234375, 9.169952392578125, 9.36590576171875, 9.561859130859375, 9.7578125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 15.0, 102.0, 623.0, 234.0, 25.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.08065032958984, -74.47716522216797, -71.87367248535156, -69.27018737792969, -66.66670227050781, -64.06321716308594, -61.45972442626953, -58.856239318847656, -56.252750396728516, -53.649261474609375, -51.0457763671875, -48.44228744506836, -45.83879852294922, -43.235313415527344, -40.6318244934082, -38.02833557128906, -35.42485046386719, -32.82136154174805, -30.217876434326172, -27.61438751220703, -25.010900497436523, -22.407413482666016, -19.803924560546875, -17.200437545776367, -14.59695053100586, -11.993463516235352, -9.389975547790527, -6.786488056182861, -4.183000564575195, -1.5795135498046875, 1.0239744186401367, 3.627462387084961, 6.23095703125, 8.834444046020508, 11.437932014465332, 14.041419982910156, 16.644906997680664, 19.248394012451172, 21.851882934570312, 24.45536994934082, 27.058856964111328, 29.662343978881836, 32.265830993652344, 34.869319915771484, 37.472808837890625, 40.0762939453125, 42.67978286743164, 45.28327178955078, 47.886756896972656, 50.4902458190918, 53.09373092651367, 55.69721984863281, 58.30070495605469, 60.90419387817383, 63.50768280029297, 66.11116790771484, 68.71466064453125, 71.31814575195312, 73.92163848876953, 76.5251235961914, 79.12860870361328, 81.73210144042969, 84.33558654785156, 86.93907165527344, 89.54255676269531]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 6.0, 19.0, 20.0, 32.0, 52.0, 63.0, 103.0, 84.0, 103.0, 109.0, 103.0, 89.0, 76.0, 44.0, 31.0, 22.0, 18.0, 13.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.500822067260742, -21.888446807861328, -21.276071548461914, -20.6636962890625, -20.051321029663086, -19.438945770263672, -18.826570510864258, -18.214195251464844, -17.60181999206543, -16.989444732666016, -16.3770694732666, -15.764694213867188, -15.152318954467773, -14.53994369506836, -13.927568435668945, -13.315193176269531, -12.702817916870117, -12.090442657470703, -11.478067398071289, -10.865692138671875, -10.253316879272461, -9.640941619873047, -9.028566360473633, -8.416191101074219, -7.803815841674805, -7.191440582275391, -6.579065322875977, -5.9666900634765625, -5.354314804077148, -4.741939544677734, -4.12956428527832, -3.5171890258789062, -2.904813766479492, -2.292438507080078, -1.680063247680664, -1.06768798828125, -0.45531272888183594, 0.15706253051757812, 0.7694377899169922, 1.3818130493164062, 1.9941883087158203, 2.6065635681152344, 3.2189388275146484, 3.8313140869140625, 4.443689346313477, 5.056064605712891, 5.668439865112305, 6.280815124511719, 6.893190383911133, 7.505565643310547, 8.117940902709961, 8.730316162109375, 9.342691421508789, 9.955066680908203, 10.567441940307617, 11.179817199707031, 11.792192459106445, 12.40456771850586, 13.016942977905273, 13.629318237304688, 14.241693496704102, 14.854068756103516, 15.46644401550293, 16.078819274902344, 16.691194534301758]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 11.0, 7.0, 17.0, 18.0, 22.0, 27.0, 54.0, 59.0, 86.0, 162.0, 250.0, 531.0, 1760.0, 8008.0, 69319.0, 573428.0, 353459.0, 34284.0, 4854.0, 1131.0, 413.0, 219.0, 115.0, 82.0, 55.0, 29.0, 30.0, 28.0, 12.0, 14.0, 6.0, 9.0, 11.0, 6.0, 5.0, 5.0, 1.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8984375, -8.5670166015625, -8.235595703125, -7.9041748046875, -7.57275390625, -7.2413330078125, -6.909912109375, -6.5784912109375, -6.2470703125, -5.9156494140625, -5.584228515625, -5.2528076171875, -4.92138671875, -4.5899658203125, -4.258544921875, -3.9271240234375, -3.595703125, -3.2642822265625, -2.932861328125, -2.6014404296875, -2.27001953125, -1.9385986328125, -1.607177734375, -1.2757568359375, -0.9443359375, -0.6129150390625, -0.281494140625, 0.0499267578125, 0.38134765625, 0.7127685546875, 1.044189453125, 1.3756103515625, 1.70703125, 2.0384521484375, 2.369873046875, 2.7012939453125, 3.03271484375, 3.3641357421875, 3.695556640625, 4.0269775390625, 4.3583984375, 4.6898193359375, 5.021240234375, 5.3526611328125, 5.68408203125, 6.0155029296875, 6.346923828125, 6.6783447265625, 7.009765625, 7.3411865234375, 7.672607421875, 8.0040283203125, 8.33544921875, 8.6668701171875, 8.998291015625, 9.3297119140625, 9.6611328125, 9.9925537109375, 10.323974609375, 10.6553955078125, 10.98681640625, 11.3182373046875, 11.649658203125, 11.9810791015625, 12.3125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 12.0, 19.0, 38.0, 54.0, 79.0, 97.0, 123.0, 122.0, 116.0, 109.0, 73.0, 49.0, 37.0, 23.0, 24.0, 8.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59814453125, -0.5600662231445312, -0.5219879150390625, -0.48390960693359375, -0.445831298828125, -0.40775299072265625, -0.3696746826171875, -0.33159637451171875, -0.29351806640625, -0.25543975830078125, -0.2173614501953125, -0.17928314208984375, -0.141204833984375, -0.10312652587890625, -0.0650482177734375, -0.02696990966796875, 0.0111083984375, 0.04918670654296875, 0.0872650146484375, 0.12534332275390625, 0.163421630859375, 0.20149993896484375, 0.2395782470703125, 0.27765655517578125, 0.31573486328125, 0.35381317138671875, 0.3918914794921875, 0.42996978759765625, 0.468048095703125, 0.5061264038085938, 0.5442047119140625, 0.5822830200195312, 0.620361328125, 0.6584396362304688, 0.6965179443359375, 0.7345962524414062, 0.772674560546875, 0.8107528686523438, 0.8488311767578125, 0.8869094848632812, 0.92498779296875, 0.9630661010742188, 1.0011444091796875, 1.0392227172851562, 1.077301025390625, 1.1153793334960938, 1.1534576416015625, 1.1915359497070312, 1.2296142578125, 1.2676925659179688, 1.3057708740234375, 1.3438491821289062, 1.381927490234375, 1.4200057983398438, 1.4580841064453125, 1.4961624145507812, 1.53424072265625, 1.5723190307617188, 1.6103973388671875, 1.6484756469726562, 1.686553955078125, 1.7246322631835938, 1.7627105712890625, 1.8007888793945312, 1.8388671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 8.0, 9.0, 17.0, 24.0, 22.0, 33.0, 51.0, 63.0, 80.0, 118.0, 167.0, 270.0, 505.0, 1024.0, 2382.0, 5772.0, 16259.0, 49680.0, 166004.0, 429198.0, 259006.0, 78434.0, 24509.0, 8517.0, 3264.0, 1387.0, 665.0, 376.0, 208.0, 145.0, 93.0, 72.0, 53.0, 42.0, 26.0, 18.0, 12.0, 13.0, 6.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.578125, -5.402099609375, -5.22607421875, -5.050048828125, -4.8740234375, -4.697998046875, -4.52197265625, -4.345947265625, -4.169921875, -3.993896484375, -3.81787109375, -3.641845703125, -3.4658203125, -3.289794921875, -3.11376953125, -2.937744140625, -2.76171875, -2.585693359375, -2.40966796875, -2.233642578125, -2.0576171875, -1.881591796875, -1.70556640625, -1.529541015625, -1.353515625, -1.177490234375, -1.00146484375, -0.825439453125, -0.6494140625, -0.473388671875, -0.29736328125, -0.121337890625, 0.0546875, 0.230712890625, 0.40673828125, 0.582763671875, 0.7587890625, 0.934814453125, 1.11083984375, 1.286865234375, 1.462890625, 1.638916015625, 1.81494140625, 1.990966796875, 2.1669921875, 2.343017578125, 2.51904296875, 2.695068359375, 2.87109375, 3.047119140625, 3.22314453125, 3.399169921875, 3.5751953125, 3.751220703125, 3.92724609375, 4.103271484375, 4.279296875, 4.455322265625, 4.63134765625, 4.807373046875, 4.9833984375, 5.159423828125, 5.33544921875, 5.511474609375, 5.6875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 9.0, 8.0, 10.0, 17.0, 11.0, 13.0, 17.0, 19.0, 18.0, 28.0, 34.0, 27.0, 51.0, 52.0, 34.0, 47.0, 45.0, 48.0, 46.0, 53.0, 43.0, 48.0, 39.0, 38.0, 27.0, 30.0, 21.0, 33.0, 24.0, 16.0, 16.0, 15.0, 12.0, 11.0, 6.0, 10.0, 8.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.1666259765625, -3.067626953125, -2.9686279296875, -2.86962890625, -2.7706298828125, -2.671630859375, -2.5726318359375, -2.4736328125, -2.3746337890625, -2.275634765625, -2.1766357421875, -2.07763671875, -1.9786376953125, -1.879638671875, -1.7806396484375, -1.681640625, -1.5826416015625, -1.483642578125, -1.3846435546875, -1.28564453125, -1.1866455078125, -1.087646484375, -0.9886474609375, -0.8896484375, -0.7906494140625, -0.691650390625, -0.5926513671875, -0.49365234375, -0.3946533203125, -0.295654296875, -0.1966552734375, -0.09765625, 0.0013427734375, 0.100341796875, 0.1993408203125, 0.29833984375, 0.3973388671875, 0.496337890625, 0.5953369140625, 0.6943359375, 0.7933349609375, 0.892333984375, 0.9913330078125, 1.09033203125, 1.1893310546875, 1.288330078125, 1.3873291015625, 1.486328125, 1.5853271484375, 1.684326171875, 1.7833251953125, 1.88232421875, 1.9813232421875, 2.080322265625, 2.1793212890625, 2.2783203125, 2.3773193359375, 2.476318359375, 2.5753173828125, 2.67431640625, 2.7733154296875, 2.872314453125, 2.9713134765625, 3.0703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 8.0, 5.0, 20.0, 25.0, 37.0, 58.0, 66.0, 129.0, 223.0, 374.0, 669.0, 1219.0, 2290.0, 4722.0, 10453.0, 24135.0, 62237.0, 168629.0, 351644.0, 257486.0, 98500.0, 36822.0, 15267.0, 6619.0, 3086.0, 1673.0, 912.0, 516.0, 278.0, 158.0, 98.0, 64.0, 41.0, 21.0, 33.0, 7.0, 10.0, 9.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.435546875, -2.36334228515625, -2.2911376953125, -2.21893310546875, -2.146728515625, -2.07452392578125, -2.0023193359375, -1.93011474609375, -1.85791015625, -1.78570556640625, -1.7135009765625, -1.64129638671875, -1.569091796875, -1.49688720703125, -1.4246826171875, -1.35247802734375, -1.2802734375, -1.20806884765625, -1.1358642578125, -1.06365966796875, -0.991455078125, -0.91925048828125, -0.8470458984375, -0.77484130859375, -0.70263671875, -0.63043212890625, -0.5582275390625, -0.48602294921875, -0.413818359375, -0.34161376953125, -0.2694091796875, -0.19720458984375, -0.125, -0.05279541015625, 0.0194091796875, 0.09161376953125, 0.163818359375, 0.23602294921875, 0.3082275390625, 0.38043212890625, 0.45263671875, 0.52484130859375, 0.5970458984375, 0.66925048828125, 0.741455078125, 0.81365966796875, 0.8858642578125, 0.95806884765625, 1.0302734375, 1.10247802734375, 1.1746826171875, 1.24688720703125, 1.319091796875, 1.39129638671875, 1.4635009765625, 1.53570556640625, 1.60791015625, 1.68011474609375, 1.7523193359375, 1.82452392578125, 1.896728515625, 1.96893310546875, 2.0411376953125, 2.11334228515625, 2.185546875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 9.0, 14.0, 16.0, 20.0, 46.0, 62.0, 64.0, 83.0, 94.0, 127.0, 116.0, 87.0, 73.0, 44.0, 33.0, 21.0, 26.0, 17.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005240440368652344, -0.0005035996437072754, -0.0004831552505493164, -0.0004627108573913574, -0.00044226646423339844, -0.00042182207107543945, -0.00040137767791748047, -0.0003809332847595215, -0.0003604888916015625, -0.0003400444984436035, -0.00031960010528564453, -0.00029915571212768555, -0.00027871131896972656, -0.0002582669258117676, -0.0002378225326538086, -0.0002173781394958496, -0.00019693374633789062, -0.00017648935317993164, -0.00015604496002197266, -0.00013560056686401367, -0.00011515617370605469, -9.47117805480957e-05, -7.426738739013672e-05, -5.3822994232177734e-05, -3.337860107421875e-05, -1.2934207916259766e-05, 7.510185241699219e-06, 2.7954578399658203e-05, 4.839897155761719e-05, 6.884336471557617e-05, 8.928775787353516e-05, 0.00010973215103149414, 0.00013017654418945312, 0.0001506209373474121, 0.0001710653305053711, 0.00019150972366333008, 0.00021195411682128906, 0.00023239850997924805, 0.00025284290313720703, 0.000273287296295166, 0.000293731689453125, 0.000314176082611084, 0.00033462047576904297, 0.00035506486892700195, 0.00037550926208496094, 0.0003959536552429199, 0.0004163980484008789, 0.0004368424415588379, 0.0004572868347167969, 0.00047773122787475586, 0.0004981756210327148, 0.0005186200141906738, 0.0005390644073486328, 0.0005595088005065918, 0.0005799531936645508, 0.0006003975868225098, 0.0006208419799804688, 0.0006412863731384277, 0.0006617307662963867, 0.0006821751594543457, 0.0007026195526123047, 0.0007230639457702637, 0.0007435083389282227, 0.0007639527320861816, 0.0007843971252441406]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 5.0, 7.0, 8.0, 6.0, 19.0, 31.0, 36.0, 63.0, 76.0, 136.0, 264.0, 495.0, 997.0, 2353.0, 6111.0, 20075.0, 76291.0, 365985.0, 444826.0, 94400.0, 23930.0, 7269.0, 2749.0, 1151.0, 552.0, 288.0, 175.0, 84.0, 56.0, 40.0, 28.0, 18.0, 8.0, 9.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-5.16796875, -5.028564453125, -4.88916015625, -4.749755859375, -4.6103515625, -4.470947265625, -4.33154296875, -4.192138671875, -4.052734375, -3.913330078125, -3.77392578125, -3.634521484375, -3.4951171875, -3.355712890625, -3.21630859375, -3.076904296875, -2.9375, -2.798095703125, -2.65869140625, -2.519287109375, -2.3798828125, -2.240478515625, -2.10107421875, -1.961669921875, -1.822265625, -1.682861328125, -1.54345703125, -1.404052734375, -1.2646484375, -1.125244140625, -0.98583984375, -0.846435546875, -0.70703125, -0.567626953125, -0.42822265625, -0.288818359375, -0.1494140625, -0.010009765625, 0.12939453125, 0.268798828125, 0.408203125, 0.547607421875, 0.68701171875, 0.826416015625, 0.9658203125, 1.105224609375, 1.24462890625, 1.384033203125, 1.5234375, 1.662841796875, 1.80224609375, 1.941650390625, 2.0810546875, 2.220458984375, 2.35986328125, 2.499267578125, 2.638671875, 2.778076171875, 2.91748046875, 3.056884765625, 3.1962890625, 3.335693359375, 3.47509765625, 3.614501953125, 3.75390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 1.0, 4.0, 8.0, 5.0, 9.0, 8.0, 9.0, 18.0, 17.0, 19.0, 27.0, 29.0, 30.0, 41.0, 52.0, 61.0, 76.0, 85.0, 79.0, 66.0, 53.0, 54.0, 52.0, 30.0, 33.0, 25.0, 13.0, 14.0, 22.0, 14.0, 8.0, 5.0, 6.0, 3.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.51953125, -1.4652557373046875, -1.410980224609375, -1.3567047119140625, -1.30242919921875, -1.2481536865234375, -1.193878173828125, -1.1396026611328125, -1.0853271484375, -1.0310516357421875, -0.976776123046875, -0.9225006103515625, -0.86822509765625, -0.8139495849609375, -0.759674072265625, -0.7053985595703125, -0.651123046875, -0.5968475341796875, -0.542572021484375, -0.4882965087890625, -0.43402099609375, -0.3797454833984375, -0.325469970703125, -0.2711944580078125, -0.2169189453125, -0.1626434326171875, -0.108367919921875, -0.0540924072265625, 0.00018310546875, 0.0544586181640625, 0.108734130859375, 0.1630096435546875, 0.21728515625, 0.2715606689453125, 0.325836181640625, 0.3801116943359375, 0.43438720703125, 0.4886627197265625, 0.542938232421875, 0.5972137451171875, 0.6514892578125, 0.7057647705078125, 0.760040283203125, 0.8143157958984375, 0.86859130859375, 0.9228668212890625, 0.977142333984375, 1.0314178466796875, 1.085693359375, 1.1399688720703125, 1.194244384765625, 1.2485198974609375, 1.30279541015625, 1.3570709228515625, 1.411346435546875, 1.4656219482421875, 1.5198974609375, 1.5741729736328125, 1.628448486328125, 1.6827239990234375, 1.73699951171875, 1.7912750244140625, 1.845550537109375, 1.8998260498046875, 1.9541015625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 10.0, 24.0, 58.0, 156.0, 302.0, 298.0, 110.0, 34.0, 15.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.838422775268555, -29.164569854736328, -26.490718841552734, -23.816865921020508, -21.14301300048828, -18.469161987304688, -15.795309066772461, -13.121458053588867, -10.44760513305664, -7.7737531661987305, -5.099900722503662, -2.4260482788085938, 0.2478036880493164, 2.9216556549072266, 5.595508575439453, 8.269359588623047, 10.943212509155273, 13.617064476013184, 16.290916442871094, 18.96476936340332, 21.638622283935547, 24.31247329711914, 26.986326217651367, 29.66017723083496, 32.33403015136719, 35.00788116455078, 37.68173599243164, 40.355587005615234, 43.02943801879883, 45.70329284667969, 48.37714385986328, 51.050994873046875, 53.72484588623047, 56.39869689941406, 59.07255172729492, 61.746402740478516, 64.42025756835938, 67.09410858154297, 69.76795959472656, 72.44181060791016, 75.11566162109375, 77.78951263427734, 80.46336364746094, 83.13722229003906, 85.81107330322266, 88.48492431640625, 91.15877532958984, 93.83262634277344, 96.50648498535156, 99.18033599853516, 101.85418701171875, 104.52804565429688, 107.20189666748047, 109.87574768066406, 112.54959869384766, 115.22344970703125, 117.89730072021484, 120.57115173339844, 123.24500274658203, 125.91885375976562, 128.59271240234375, 131.2665557861328, 133.94041442871094, 136.6142578125, 139.28811645507812]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 5.0, 7.0, 11.0, 18.0, 6.0, 17.0, 19.0, 19.0, 20.0, 30.0, 30.0, 36.0, 39.0, 42.0, 47.0, 34.0, 51.0, 47.0, 43.0, 41.0, 48.0, 42.0, 43.0, 38.0, 36.0, 32.0, 32.0, 23.0, 24.0, 14.0, 15.0, 17.0, 13.0, 15.0, 10.0, 9.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-22.802379608154297, -22.137596130371094, -21.47281265258789, -20.808029174804688, -20.143247604370117, -19.478464126586914, -18.81368064880371, -18.148897171020508, -17.484113693237305, -16.8193302154541, -16.1545467376709, -15.489764213562012, -14.824980735778809, -14.160198211669922, -13.495414733886719, -12.830631256103516, -12.165848731994629, -11.501065254211426, -10.836282730102539, -10.171499252319336, -9.506715774536133, -8.84193229675293, -8.177149772644043, -7.51236629486084, -6.847583293914795, -6.18280029296875, -5.518016815185547, -4.853233814239502, -4.188450813293457, -3.523667335510254, -2.858884334564209, -2.194100856781006, -1.529317855834961, -0.8645346760749817, -0.19975149631500244, 0.46503162384033203, 1.129814863204956, 1.79459810256958, 2.459381103515625, 3.124164581298828, 3.788947582244873, 4.453730583190918, 5.118514060974121, 5.783297061920166, 6.448080062866211, 7.112863540649414, 7.777646541595459, 8.44243049621582, 9.107213020324707, 9.77199649810791, 10.436779022216797, 11.1015625, 11.766345977783203, 12.431129455566406, 13.095911979675293, 13.760695457458496, 14.425477981567383, 15.090261459350586, 15.755043983459473, 16.41982650756836, 17.084609985351562, 17.749393463134766, 18.41417694091797, 19.078960418701172, 19.743743896484375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 7.0, 12.0, 15.0, 17.0, 23.0, 31.0, 28.0, 45.0, 70.0, 120.0, 195.0, 313.0, 499.0, 799.0, 1528.0, 3150.0, 6562.0, 15161.0, 39028.0, 133671.0, 3274587.0, 581669.0, 85875.0, 28026.0, 11608.0, 5281.0, 2641.0, 1305.0, 774.0, 432.0, 252.0, 184.0, 118.0, 68.0, 63.0, 45.0, 18.0, 25.0, 11.0, 9.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.875, -4.70599365234375, -4.5369873046875, -4.36798095703125, -4.198974609375, -4.02996826171875, -3.8609619140625, -3.69195556640625, -3.52294921875, -3.35394287109375, -3.1849365234375, -3.01593017578125, -2.846923828125, -2.67791748046875, -2.5089111328125, -2.33990478515625, -2.1708984375, -2.00189208984375, -1.8328857421875, -1.66387939453125, -1.494873046875, -1.32586669921875, -1.1568603515625, -0.98785400390625, -0.81884765625, -0.64984130859375, -0.4808349609375, -0.31182861328125, -0.142822265625, 0.02618408203125, 0.1951904296875, 0.36419677734375, 0.533203125, 0.70220947265625, 0.8712158203125, 1.04022216796875, 1.209228515625, 1.37823486328125, 1.5472412109375, 1.71624755859375, 1.88525390625, 2.05426025390625, 2.2232666015625, 2.39227294921875, 2.561279296875, 2.73028564453125, 2.8992919921875, 3.06829833984375, 3.2373046875, 3.40631103515625, 3.5753173828125, 3.74432373046875, 3.913330078125, 4.08233642578125, 4.2513427734375, 4.42034912109375, 4.58935546875, 4.75836181640625, 4.9273681640625, 5.09637451171875, 5.265380859375, 5.43438720703125, 5.6033935546875, 5.77239990234375, 5.94140625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 8.0, 11.0, 8.0, 11.0, 5.0, 15.0, 18.0, 28.0, 29.0, 29.0, 39.0, 34.0, 43.0, 39.0, 50.0, 49.0, 42.0, 48.0, 51.0, 46.0, 53.0, 32.0, 41.0, 37.0, 35.0, 29.0, 23.0, 24.0, 22.0, 15.0, 14.0, 13.0, 15.0, 6.0, 9.0, 6.0, 1.0, 7.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6171875, -0.5994644165039062, -0.5817413330078125, -0.5640182495117188, -0.546295166015625, -0.5285720825195312, -0.5108489990234375, -0.49312591552734375, -0.47540283203125, -0.45767974853515625, -0.4399566650390625, -0.42223358154296875, -0.404510498046875, -0.38678741455078125, -0.3690643310546875, -0.35134124755859375, -0.3336181640625, -0.31589508056640625, -0.2981719970703125, -0.28044891357421875, -0.262725830078125, -0.24500274658203125, -0.2272796630859375, -0.20955657958984375, -0.19183349609375, -0.17411041259765625, -0.1563873291015625, -0.13866424560546875, -0.120941162109375, -0.10321807861328125, -0.0854949951171875, -0.06777191162109375, -0.050048828125, -0.03232574462890625, -0.0146026611328125, 0.00312042236328125, 0.020843505859375, 0.03856658935546875, 0.0562896728515625, 0.07401275634765625, 0.09173583984375, 0.10945892333984375, 0.1271820068359375, 0.14490509033203125, 0.162628173828125, 0.18035125732421875, 0.1980743408203125, 0.21579742431640625, 0.2335205078125, 0.25124359130859375, 0.2689666748046875, 0.28668975830078125, 0.304412841796875, 0.32213592529296875, 0.3398590087890625, 0.35758209228515625, 0.37530517578125, 0.39302825927734375, 0.4107513427734375, 0.42847442626953125, 0.446197509765625, 0.46392059326171875, 0.4816436767578125, 0.49936676025390625, 0.51708984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 8.0, 10.0, 18.0, 30.0, 59.0, 105.0, 227.0, 468.0, 1180.0, 3161.0, 9430.0, 37541.0, 265670.0, 3644113.0, 191518.0, 29280.0, 7317.0, 2431.0, 840.0, 403.0, 188.0, 105.0, 55.0, 48.0, 25.0, 12.0, 7.0, 4.0, 8.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.515625, -8.226318359375, -7.93701171875, -7.647705078125, -7.3583984375, -7.069091796875, -6.77978515625, -6.490478515625, -6.201171875, -5.911865234375, -5.62255859375, -5.333251953125, -5.0439453125, -4.754638671875, -4.46533203125, -4.176025390625, -3.88671875, -3.597412109375, -3.30810546875, -3.018798828125, -2.7294921875, -2.440185546875, -2.15087890625, -1.861572265625, -1.572265625, -1.282958984375, -0.99365234375, -0.704345703125, -0.4150390625, -0.125732421875, 0.16357421875, 0.452880859375, 0.7421875, 1.031494140625, 1.32080078125, 1.610107421875, 1.8994140625, 2.188720703125, 2.47802734375, 2.767333984375, 3.056640625, 3.345947265625, 3.63525390625, 3.924560546875, 4.2138671875, 4.503173828125, 4.79248046875, 5.081787109375, 5.37109375, 5.660400390625, 5.94970703125, 6.239013671875, 6.5283203125, 6.817626953125, 7.10693359375, 7.396240234375, 7.685546875, 7.974853515625, 8.26416015625, 8.553466796875, 8.8427734375, 9.132080078125, 9.42138671875, 9.710693359375, 10.0]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 13.0, 14.0, 8.0, 12.0, 17.0, 24.0, 24.0, 39.0, 53.0, 67.0, 93.0, 158.0, 261.0, 987.0, 1424.0, 328.0, 157.0, 107.0, 73.0, 45.0, 38.0, 31.0, 18.0, 22.0, 6.0, 8.0, 6.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.32421875, -1.2786407470703125, -1.233062744140625, -1.1874847412109375, -1.14190673828125, -1.0963287353515625, -1.050750732421875, -1.0051727294921875, -0.9595947265625, -0.9140167236328125, -0.868438720703125, -0.8228607177734375, -0.77728271484375, -0.7317047119140625, -0.686126708984375, -0.6405487060546875, -0.594970703125, -0.5493927001953125, -0.503814697265625, -0.4582366943359375, -0.41265869140625, -0.3670806884765625, -0.321502685546875, -0.2759246826171875, -0.2303466796875, -0.1847686767578125, -0.139190673828125, -0.0936126708984375, -0.04803466796875, -0.0024566650390625, 0.043121337890625, 0.0886993408203125, 0.13427734375, 0.1798553466796875, 0.225433349609375, 0.2710113525390625, 0.31658935546875, 0.3621673583984375, 0.407745361328125, 0.4533233642578125, 0.4989013671875, 0.5444793701171875, 0.590057373046875, 0.6356353759765625, 0.68121337890625, 0.7267913818359375, 0.772369384765625, 0.8179473876953125, 0.863525390625, 0.9091033935546875, 0.954681396484375, 1.0002593994140625, 1.04583740234375, 1.0914154052734375, 1.136993408203125, 1.1825714111328125, 1.2281494140625, 1.2737274169921875, 1.319305419921875, 1.3648834228515625, 1.41046142578125, 1.4560394287109375, 1.501617431640625, 1.5471954345703125, 1.5927734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 11.0, 31.0, 68.0, 153.0, 281.0, 260.0, 114.0, 46.0, 14.0, 8.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-41.503623962402344, -40.703800201416016, -39.90398025512695, -39.104156494140625, -38.3043327331543, -37.504512786865234, -36.704689025878906, -35.90486526489258, -35.105045318603516, -34.30522155761719, -33.505401611328125, -32.7055778503418, -31.9057559967041, -31.105934143066406, -30.306110382080078, -29.506288528442383, -28.706464767456055, -27.90664291381836, -27.10681915283203, -26.306997299194336, -25.50717544555664, -24.707351684570312, -23.907529830932617, -23.107707977294922, -22.307884216308594, -21.5080623626709, -20.70823860168457, -19.908416748046875, -19.10859489440918, -18.308773040771484, -17.508949279785156, -16.70912742614746, -15.90930461883545, -15.109481811523438, -14.309659957885742, -13.50983715057373, -12.710014343261719, -11.910192489624023, -11.110369682312012, -10.310546875, -9.510725021362305, -8.710902214050293, -7.911080360412598, -7.111257553100586, -6.311435222625732, -5.511612892150879, -4.711790084838867, -3.9119677543640137, -3.11214542388916, -2.3123230934143066, -1.512500524520874, -0.7126779556274414, 0.08714437484741211, 0.8869667053222656, 1.6867895126342773, 2.486611843109131, 3.2864341735839844, 4.086256504058838, 4.886078834533691, 5.685901641845703, 6.485723972320557, 7.28554630279541, 8.085369110107422, 8.885190963745117, 9.685013771057129]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 5.0, 6.0, 10.0, 12.0, 15.0, 14.0, 26.0, 31.0, 25.0, 45.0, 51.0, 41.0, 50.0, 68.0, 52.0, 59.0, 57.0, 50.0, 49.0, 49.0, 50.0, 44.0, 32.0, 39.0, 30.0, 25.0, 17.0, 14.0, 12.0, 5.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.099781036376953, -6.849028587341309, -6.598276138305664, -6.347524166107178, -6.096771717071533, -5.846019268035889, -5.595267295837402, -5.344514846801758, -5.093762397766113, -4.843009948730469, -4.592257499694824, -4.341505527496338, -4.090753078460693, -3.840000629425049, -3.5892484188079834, -3.338496208190918, -3.0877437591552734, -2.836991310119629, -2.5862390995025635, -2.335486888885498, -2.0847344398498535, -1.8339821100234985, -1.5832297801971436, -1.3324774503707886, -1.0817251205444336, -0.8309727907180786, -0.5802204608917236, -0.32946813106536865, -0.07871580123901367, 0.1720365285873413, 0.4227888584136963, 0.6735411882400513, 0.9242935180664062, 1.1750458478927612, 1.4257981777191162, 1.6765505075454712, 1.9273028373718262, 2.1780552864074707, 2.428807497024536, 2.6795597076416016, 2.930312156677246, 3.1810646057128906, 3.431816816329956, 3.6825690269470215, 3.933321475982666, 4.1840739250183105, 4.434825897216797, 4.685578346252441, 4.936330795288086, 5.1870832443237305, 5.437835693359375, 5.688587665557861, 5.939340114593506, 6.19009256362915, 6.440844535827637, 6.691596984863281, 6.942349433898926, 7.19310188293457, 7.443854331970215, 7.694606304168701, 7.945358753204346, 8.196110725402832, 8.446863174438477, 8.697615623474121, 8.948368072509766]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 6.0, 7.0, 11.0, 11.0, 12.0, 11.0, 17.0, 25.0, 38.0, 34.0, 46.0, 73.0, 168.0, 607.0, 2536.0, 17741.0, 148310.0, 650290.0, 200216.0, 23797.0, 3390.0, 696.0, 216.0, 86.0, 37.0, 29.0, 23.0, 24.0, 15.0, 16.0, 14.0, 9.0, 15.0, 6.0, 4.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.82421875, -7.55963134765625, -7.2950439453125, -7.03045654296875, -6.765869140625, -6.50128173828125, -6.2366943359375, -5.97210693359375, -5.70751953125, -5.44293212890625, -5.1783447265625, -4.91375732421875, -4.649169921875, -4.38458251953125, -4.1199951171875, -3.85540771484375, -3.5908203125, -3.32623291015625, -3.0616455078125, -2.79705810546875, -2.532470703125, -2.26788330078125, -2.0032958984375, -1.73870849609375, -1.47412109375, -1.20953369140625, -0.9449462890625, -0.68035888671875, -0.415771484375, -0.15118408203125, 0.1134033203125, 0.37799072265625, 0.642578125, 0.90716552734375, 1.1717529296875, 1.43634033203125, 1.700927734375, 1.96551513671875, 2.2301025390625, 2.49468994140625, 2.75927734375, 3.02386474609375, 3.2884521484375, 3.55303955078125, 3.817626953125, 4.08221435546875, 4.3468017578125, 4.61138916015625, 4.8759765625, 5.14056396484375, 5.4051513671875, 5.66973876953125, 5.934326171875, 6.19891357421875, 6.4635009765625, 6.72808837890625, 6.99267578125, 7.25726318359375, 7.5218505859375, 7.78643798828125, 8.051025390625, 8.31561279296875, 8.5802001953125, 8.84478759765625, 9.109375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 0.0, 9.0, 18.0, 24.0, 37.0, 71.0, 46.0, 89.0, 104.0, 109.0, 106.0, 99.0, 81.0, 75.0, 41.0, 47.0, 23.0, 16.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54248046875, -0.5009231567382812, -0.4593658447265625, -0.41780853271484375, -0.376251220703125, -0.33469390869140625, -0.2931365966796875, -0.25157928466796875, -0.21002197265625, -0.16846466064453125, -0.1269073486328125, -0.08535003662109375, -0.043792724609375, -0.00223541259765625, 0.0393218994140625, 0.08087921142578125, 0.1224365234375, 0.16399383544921875, 0.2055511474609375, 0.24710845947265625, 0.288665771484375, 0.33022308349609375, 0.3717803955078125, 0.41333770751953125, 0.45489501953125, 0.49645233154296875, 0.5380096435546875, 0.5795669555664062, 0.621124267578125, 0.6626815795898438, 0.7042388916015625, 0.7457962036132812, 0.787353515625, 0.8289108276367188, 0.8704681396484375, 0.9120254516601562, 0.953582763671875, 0.9951400756835938, 1.0366973876953125, 1.0782546997070312, 1.11981201171875, 1.1613693237304688, 1.2029266357421875, 1.2444839477539062, 1.286041259765625, 1.3275985717773438, 1.3691558837890625, 1.4107131958007812, 1.4522705078125, 1.4938278198242188, 1.5353851318359375, 1.5769424438476562, 1.618499755859375, 1.6600570678710938, 1.7016143798828125, 1.7431716918945312, 1.78472900390625, 1.8262863159179688, 1.8678436279296875, 1.9094009399414062, 1.950958251953125, 1.9925155639648438, 2.0340728759765625, 2.0756301879882812, 2.1171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 10.0, 11.0, 12.0, 14.0, 27.0, 33.0, 42.0, 72.0, 99.0, 138.0, 237.0, 335.0, 666.0, 1220.0, 2461.0, 5331.0, 12585.0, 32724.0, 93082.0, 257024.0, 373016.0, 171110.0, 59684.0, 22011.0, 8732.0, 3721.0, 1772.0, 881.0, 532.0, 317.0, 217.0, 135.0, 89.0, 59.0, 56.0, 22.0, 11.0, 13.0, 17.0, 8.0, 12.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.841796875, -3.719024658203125, -3.59625244140625, -3.473480224609375, -3.3507080078125, -3.227935791015625, -3.10516357421875, -2.982391357421875, -2.859619140625, -2.736846923828125, -2.61407470703125, -2.491302490234375, -2.3685302734375, -2.245758056640625, -2.12298583984375, -2.000213623046875, -1.87744140625, -1.754669189453125, -1.63189697265625, -1.509124755859375, -1.3863525390625, -1.263580322265625, -1.14080810546875, -1.018035888671875, -0.895263671875, -0.772491455078125, -0.64971923828125, -0.526947021484375, -0.4041748046875, -0.281402587890625, -0.15863037109375, -0.035858154296875, 0.0869140625, 0.209686279296875, 0.33245849609375, 0.455230712890625, 0.5780029296875, 0.700775146484375, 0.82354736328125, 0.946319580078125, 1.069091796875, 1.191864013671875, 1.31463623046875, 1.437408447265625, 1.5601806640625, 1.682952880859375, 1.80572509765625, 1.928497314453125, 2.05126953125, 2.174041748046875, 2.29681396484375, 2.419586181640625, 2.5423583984375, 2.665130615234375, 2.78790283203125, 2.910675048828125, 3.033447265625, 3.156219482421875, 3.27899169921875, 3.401763916015625, 3.5245361328125, 3.647308349609375, 3.77008056640625, 3.892852783203125, 4.015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 13.0, 14.0, 16.0, 10.0, 20.0, 28.0, 23.0, 25.0, 43.0, 40.0, 42.0, 44.0, 58.0, 76.0, 51.0, 58.0, 50.0, 53.0, 40.0, 55.0, 44.0, 29.0, 35.0, 19.0, 24.0, 15.0, 20.0, 10.0, 7.0, 8.0, 9.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.939117431640625, -3.81964111328125, -3.700164794921875, -3.5806884765625, -3.461212158203125, -3.34173583984375, -3.222259521484375, -3.102783203125, -2.983306884765625, -2.86383056640625, -2.744354248046875, -2.6248779296875, -2.505401611328125, -2.38592529296875, -2.266448974609375, -2.14697265625, -2.027496337890625, -1.90802001953125, -1.788543701171875, -1.6690673828125, -1.549591064453125, -1.43011474609375, -1.310638427734375, -1.191162109375, -1.071685791015625, -0.95220947265625, -0.832733154296875, -0.7132568359375, -0.593780517578125, -0.47430419921875, -0.354827880859375, -0.2353515625, -0.115875244140625, 0.00360107421875, 0.123077392578125, 0.2425537109375, 0.362030029296875, 0.48150634765625, 0.600982666015625, 0.720458984375, 0.839935302734375, 0.95941162109375, 1.078887939453125, 1.1983642578125, 1.317840576171875, 1.43731689453125, 1.556793212890625, 1.67626953125, 1.795745849609375, 1.91522216796875, 2.034698486328125, 2.1541748046875, 2.273651123046875, 2.39312744140625, 2.512603759765625, 2.632080078125, 2.751556396484375, 2.87103271484375, 2.990509033203125, 3.1099853515625, 3.229461669921875, 3.34893798828125, 3.468414306640625, 3.587890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 8.0, 8.0, 14.0, 21.0, 20.0, 39.0, 58.0, 84.0, 110.0, 251.0, 441.0, 840.0, 1671.0, 3500.0, 8132.0, 20802.0, 59980.0, 191938.0, 417424.0, 229208.0, 72469.0, 24346.0, 9268.0, 3914.0, 1895.0, 899.0, 454.0, 283.0, 156.0, 91.0, 64.0, 42.0, 31.0, 20.0, 15.0, 17.0, 10.0, 2.0, 3.0, 7.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.8229522705078125, -1.766998291015625, -1.7110443115234375, -1.65509033203125, -1.5991363525390625, -1.543182373046875, -1.4872283935546875, -1.4312744140625, -1.3753204345703125, -1.319366455078125, -1.2634124755859375, -1.20745849609375, -1.1515045166015625, -1.095550537109375, -1.0395965576171875, -0.983642578125, -0.9276885986328125, -0.871734619140625, -0.8157806396484375, -0.75982666015625, -0.7038726806640625, -0.647918701171875, -0.5919647216796875, -0.5360107421875, -0.4800567626953125, -0.424102783203125, -0.3681488037109375, -0.31219482421875, -0.2562408447265625, -0.200286865234375, -0.1443328857421875, -0.08837890625, -0.0324249267578125, 0.023529052734375, 0.0794830322265625, 0.13543701171875, 0.1913909912109375, 0.247344970703125, 0.3032989501953125, 0.3592529296875, 0.4152069091796875, 0.471160888671875, 0.5271148681640625, 0.58306884765625, 0.6390228271484375, 0.694976806640625, 0.7509307861328125, 0.806884765625, 0.8628387451171875, 0.918792724609375, 0.9747467041015625, 1.03070068359375, 1.0866546630859375, 1.142608642578125, 1.1985626220703125, 1.2545166015625, 1.3104705810546875, 1.366424560546875, 1.4223785400390625, 1.47833251953125, 1.5342864990234375, 1.590240478515625, 1.6461944580078125, 1.7021484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 4.0, 7.0, 9.0, 9.0, 5.0, 10.0, 15.0, 24.0, 26.0, 37.0, 42.0, 63.0, 96.0, 106.0, 127.0, 102.0, 80.0, 78.0, 40.0, 25.0, 19.0, 18.0, 18.0, 9.0, 3.0, 8.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004763603210449219, -0.00046058744192123413, -0.0004448145627975464, -0.00042904168367385864, -0.0004132688045501709, -0.00039749592542648315, -0.0003817230463027954, -0.00036595016717910767, -0.0003501772880554199, -0.0003344044089317322, -0.00031863152980804443, -0.0003028586506843567, -0.00028708577156066895, -0.0002713128924369812, -0.00025554001331329346, -0.0002397671341896057, -0.00022399425506591797, -0.00020822137594223022, -0.00019244849681854248, -0.00017667561769485474, -0.000160902738571167, -0.00014512985944747925, -0.0001293569803237915, -0.00011358410120010376, -9.781122207641602e-05, -8.203834295272827e-05, -6.626546382904053e-05, -5.049258470535278e-05, -3.471970558166504e-05, -1.8946826457977295e-05, -3.1739473342895508e-06, 1.2598931789398193e-05, 2.8371810913085938e-05, 4.414469003677368e-05, 5.9917569160461426e-05, 7.569044828414917e-05, 9.146332740783691e-05, 0.00010723620653152466, 0.0001230090856552124, 0.00013878196477890015, 0.0001545548439025879, 0.00017032772302627563, 0.00018610060214996338, 0.00020187348127365112, 0.00021764636039733887, 0.0002334192395210266, 0.00024919211864471436, 0.0002649649977684021, 0.00028073787689208984, 0.0002965107560157776, 0.00031228363513946533, 0.0003280565142631531, 0.0003438293933868408, 0.00035960227251052856, 0.0003753751516342163, 0.00039114803075790405, 0.0004069209098815918, 0.00042269378900527954, 0.0004384666681289673, 0.00045423954725265503, 0.0004700124263763428, 0.0004857853055000305, 0.0005015581846237183, 0.000517331063747406, 0.0005331039428710938]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 6.0, 12.0, 12.0, 15.0, 36.0, 56.0, 82.0, 172.0, 331.0, 676.0, 1817.0, 6025.0, 26149.0, 184652.0, 678401.0, 122877.0, 19687.0, 4703.0, 1574.0, 616.0, 294.0, 156.0, 84.0, 34.0, 23.0, 18.0, 15.0, 6.0, 9.0, 4.0, 3.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.65625, -3.5360107421875, -3.415771484375, -3.2955322265625, -3.17529296875, -3.0550537109375, -2.934814453125, -2.8145751953125, -2.6943359375, -2.5740966796875, -2.453857421875, -2.3336181640625, -2.21337890625, -2.0931396484375, -1.972900390625, -1.8526611328125, -1.732421875, -1.6121826171875, -1.491943359375, -1.3717041015625, -1.25146484375, -1.1312255859375, -1.010986328125, -0.8907470703125, -0.7705078125, -0.6502685546875, -0.530029296875, -0.4097900390625, -0.28955078125, -0.1693115234375, -0.049072265625, 0.0711669921875, 0.19140625, 0.3116455078125, 0.431884765625, 0.5521240234375, 0.67236328125, 0.7926025390625, 0.912841796875, 1.0330810546875, 1.1533203125, 1.2735595703125, 1.393798828125, 1.5140380859375, 1.63427734375, 1.7545166015625, 1.874755859375, 1.9949951171875, 2.115234375, 2.2354736328125, 2.355712890625, 2.4759521484375, 2.59619140625, 2.7164306640625, 2.836669921875, 2.9569091796875, 3.0771484375, 3.1973876953125, 3.317626953125, 3.4378662109375, 3.55810546875, 3.6783447265625, 3.798583984375, 3.9188232421875, 4.0390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 11.0, 11.0, 10.0, 13.0, 12.0, 11.0, 24.0, 29.0, 36.0, 36.0, 55.0, 66.0, 72.0, 106.0, 82.0, 75.0, 70.0, 57.0, 53.0, 40.0, 24.0, 20.0, 14.0, 15.0, 9.0, 7.0, 5.0, 9.0, 4.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.474609375, -1.4242095947265625, -1.373809814453125, -1.3234100341796875, -1.27301025390625, -1.2226104736328125, -1.172210693359375, -1.1218109130859375, -1.0714111328125, -1.0210113525390625, -0.970611572265625, -0.9202117919921875, -0.86981201171875, -0.8194122314453125, -0.769012451171875, -0.7186126708984375, -0.668212890625, -0.6178131103515625, -0.567413330078125, -0.5170135498046875, -0.46661376953125, -0.4162139892578125, -0.365814208984375, -0.3154144287109375, -0.2650146484375, -0.2146148681640625, -0.164215087890625, -0.1138153076171875, -0.06341552734375, -0.0130157470703125, 0.037384033203125, 0.0877838134765625, 0.13818359375, 0.1885833740234375, 0.238983154296875, 0.2893829345703125, 0.33978271484375, 0.3901824951171875, 0.440582275390625, 0.4909820556640625, 0.5413818359375, 0.5917816162109375, 0.642181396484375, 0.6925811767578125, 0.74298095703125, 0.7933807373046875, 0.843780517578125, 0.8941802978515625, 0.944580078125, 0.9949798583984375, 1.045379638671875, 1.0957794189453125, 1.14617919921875, 1.1965789794921875, 1.246978759765625, 1.2973785400390625, 1.3477783203125, 1.3981781005859375, 1.448577880859375, 1.4989776611328125, 1.54937744140625, 1.5997772216796875, 1.650177001953125, 1.7005767822265625, 1.7509765625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 18.0, 45.0, 65.0, 153.0, 217.0, 225.0, 133.0, 66.0, 39.0, 18.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.15479278564453, -50.661155700683594, -49.167518615722656, -47.67388153076172, -46.18024826049805, -44.68661117553711, -43.19297409057617, -41.699337005615234, -40.20570373535156, -38.712066650390625, -37.21842956542969, -35.72479248046875, -34.23115921020508, -32.73752212524414, -31.243885040283203, -29.750247955322266, -28.256610870361328, -26.76297378540039, -25.269338607788086, -23.77570152282715, -22.282066345214844, -20.788429260253906, -19.29479217529297, -17.80115509033203, -16.307519912719727, -14.813883781433105, -13.320247650146484, -11.826610565185547, -10.332974433898926, -8.839338302612305, -7.345701217651367, -5.852065086364746, -4.358428955078125, -2.864792585372925, -1.3711562156677246, 0.12248039245605469, 1.6161165237426758, 3.109752655029297, 4.603389739990234, 6.0970258712768555, 7.590662002563477, 9.084298133850098, 10.577934265136719, 12.071571350097656, 13.565207481384277, 15.058843612670898, 16.552480697631836, 18.04611587524414, 19.539752960205078, 21.033390045166016, 22.52702522277832, 24.020662307739258, 25.514297485351562, 27.0079345703125, 28.501571655273438, 29.995208740234375, 31.48884391784668, 32.982479095458984, 34.47611618041992, 35.96975326538086, 37.4633903503418, 38.95702362060547, 40.450660705566406, 41.944297790527344, 43.43793487548828]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 7.0, 7.0, 7.0, 13.0, 13.0, 20.0, 20.0, 31.0, 35.0, 22.0, 33.0, 38.0, 45.0, 39.0, 38.0, 48.0, 42.0, 48.0, 48.0, 59.0, 38.0, 50.0, 40.0, 36.0, 38.0, 28.0, 21.0, 31.0, 27.0, 15.0, 11.0, 10.0, 10.0, 6.0, 3.0, 5.0, 5.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.474233627319336, -21.867734909057617, -21.2612361907959, -20.65473747253418, -20.04823875427246, -19.441740036010742, -18.835241317749023, -18.228740692138672, -17.622241973876953, -17.015743255615234, -16.409244537353516, -15.802745819091797, -15.196247100830078, -14.58974838256836, -13.983248710632324, -13.376749992370605, -12.770252227783203, -12.163753509521484, -11.557254791259766, -10.950756072998047, -10.344257354736328, -9.73775863647461, -9.131258964538574, -8.524760246276855, -7.918261528015137, -7.311762809753418, -6.705264091491699, -6.098764896392822, -5.4922661781311035, -4.885767459869385, -4.279268264770508, -3.672769546508789, -3.066272735595703, -2.4597740173339844, -1.8532750606536865, -1.2467762231826782, -0.6402773857116699, -0.03377866744995117, 0.5727202892303467, 1.1792192459106445, 1.7857179641723633, 2.392216682434082, 2.99871563911438, 3.6052145957946777, 4.2117133140563965, 4.818212032318115, 5.424711227416992, 6.031209945678711, 6.63770866394043, 7.244207382202148, 7.850706100463867, 8.457204818725586, 9.063703536987305, 9.670202255249023, 10.276701927185059, 10.883200645446777, 11.489699363708496, 12.096198081970215, 12.702696800231934, 13.309195518493652, 13.915695190429688, 14.522193908691406, 15.128692626953125, 15.735191345214844, 16.341690063476562]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 14.0, 23.0, 36.0, 79.0, 234.0, 600.0, 2318.0, 11712.0, 131533.0, 3983200.0, 55158.0, 6946.0, 1553.0, 437.0, 173.0, 68.0, 47.0, 28.0, 19.0, 14.0, 12.0, 14.0, 7.0, 4.0, 4.0, 6.0, 4.0, 9.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.734375, -5.361083984375, -4.98779296875, -4.614501953125, -4.2412109375, -3.867919921875, -3.49462890625, -3.121337890625, -2.748046875, -2.374755859375, -2.00146484375, -1.628173828125, -1.2548828125, -0.881591796875, -0.50830078125, -0.135009765625, 0.23828125, 0.611572265625, 0.98486328125, 1.358154296875, 1.7314453125, 2.104736328125, 2.47802734375, 2.851318359375, 3.224609375, 3.597900390625, 3.97119140625, 4.344482421875, 4.7177734375, 5.091064453125, 5.46435546875, 5.837646484375, 6.2109375, 6.584228515625, 6.95751953125, 7.330810546875, 7.7041015625, 8.077392578125, 8.45068359375, 8.823974609375, 9.197265625, 9.570556640625, 9.94384765625, 10.317138671875, 10.6904296875, 11.063720703125, 11.43701171875, 11.810302734375, 12.18359375, 12.556884765625, 12.93017578125, 13.303466796875, 13.6767578125, 14.050048828125, 14.42333984375, 14.796630859375, 15.169921875, 15.543212890625, 15.91650390625, 16.289794921875, 16.6630859375, 17.036376953125, 17.40966796875, 17.782958984375, 18.15625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 8.0, 3.0, 16.0, 19.0, 40.0, 69.0, 98.0, 115.0, 134.0, 136.0, 125.0, 95.0, 71.0, 35.0, 28.0, 11.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.720703125, -0.669403076171875, -0.61810302734375, -0.566802978515625, -0.5155029296875, -0.464202880859375, -0.41290283203125, -0.361602783203125, -0.310302734375, -0.259002685546875, -0.20770263671875, -0.156402587890625, -0.1051025390625, -0.053802490234375, -0.00250244140625, 0.048797607421875, 0.10009765625, 0.151397705078125, 0.20269775390625, 0.253997802734375, 0.3052978515625, 0.356597900390625, 0.40789794921875, 0.459197998046875, 0.510498046875, 0.561798095703125, 0.61309814453125, 0.664398193359375, 0.7156982421875, 0.766998291015625, 0.81829833984375, 0.869598388671875, 0.9208984375, 0.972198486328125, 1.02349853515625, 1.074798583984375, 1.1260986328125, 1.177398681640625, 1.22869873046875, 1.279998779296875, 1.331298828125, 1.382598876953125, 1.43389892578125, 1.485198974609375, 1.5364990234375, 1.587799072265625, 1.63909912109375, 1.690399169921875, 1.74169921875, 1.792999267578125, 1.84429931640625, 1.895599365234375, 1.9468994140625, 1.998199462890625, 2.04949951171875, 2.100799560546875, 2.152099609375, 2.203399658203125, 2.25469970703125, 2.305999755859375, 2.3572998046875, 2.408599853515625, 2.45989990234375, 2.511199951171875, 2.5625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 3.0, 15.0, 9.0, 15.0, 16.0, 27.0, 37.0, 44.0, 49.0, 92.0, 114.0, 180.0, 347.0, 813.0, 2573.0, 11149.0, 71507.0, 3603132.0, 458440.0, 35207.0, 6947.0, 2055.0, 719.0, 301.0, 152.0, 117.0, 64.0, 47.0, 30.0, 15.0, 17.0, 12.0, 12.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.1328125, -8.83642578125, -8.5400390625, -8.24365234375, -7.947265625, -7.65087890625, -7.3544921875, -7.05810546875, -6.76171875, -6.46533203125, -6.1689453125, -5.87255859375, -5.576171875, -5.27978515625, -4.9833984375, -4.68701171875, -4.390625, -4.09423828125, -3.7978515625, -3.50146484375, -3.205078125, -2.90869140625, -2.6123046875, -2.31591796875, -2.01953125, -1.72314453125, -1.4267578125, -1.13037109375, -0.833984375, -0.53759765625, -0.2412109375, 0.05517578125, 0.3515625, 0.64794921875, 0.9443359375, 1.24072265625, 1.537109375, 1.83349609375, 2.1298828125, 2.42626953125, 2.72265625, 3.01904296875, 3.3154296875, 3.61181640625, 3.908203125, 4.20458984375, 4.5009765625, 4.79736328125, 5.09375, 5.39013671875, 5.6865234375, 5.98291015625, 6.279296875, 6.57568359375, 6.8720703125, 7.16845703125, 7.46484375, 7.76123046875, 8.0576171875, 8.35400390625, 8.650390625, 8.94677734375, 9.2431640625, 9.53955078125, 9.8359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 8.0, 15.0, 24.0, 32.0, 67.0, 153.0, 483.0, 2550.0, 404.0, 143.0, 73.0, 36.0, 35.0, 14.0, 11.0, 16.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.611328125, -3.52825927734375, -3.4451904296875, -3.36212158203125, -3.279052734375, -3.19598388671875, -3.1129150390625, -3.02984619140625, -2.94677734375, -2.86370849609375, -2.7806396484375, -2.69757080078125, -2.614501953125, -2.53143310546875, -2.4483642578125, -2.36529541015625, -2.2822265625, -2.19915771484375, -2.1160888671875, -2.03302001953125, -1.949951171875, -1.86688232421875, -1.7838134765625, -1.70074462890625, -1.61767578125, -1.53460693359375, -1.4515380859375, -1.36846923828125, -1.285400390625, -1.20233154296875, -1.1192626953125, -1.03619384765625, -0.953125, -0.87005615234375, -0.7869873046875, -0.70391845703125, -0.620849609375, -0.53778076171875, -0.4547119140625, -0.37164306640625, -0.28857421875, -0.20550537109375, -0.1224365234375, -0.03936767578125, 0.043701171875, 0.12677001953125, 0.2098388671875, 0.29290771484375, 0.3759765625, 0.45904541015625, 0.5421142578125, 0.62518310546875, 0.708251953125, 0.79132080078125, 0.8743896484375, 0.95745849609375, 1.04052734375, 1.12359619140625, 1.2066650390625, 1.28973388671875, 1.372802734375, 1.45587158203125, 1.5389404296875, 1.62200927734375, 1.705078125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 11.0, 26.0, 50.0, 114.0, 185.0, 218.0, 184.0, 105.0, 46.0, 27.0, 17.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.650727272033691, -7.11739444732666, -6.584061622619629, -6.0507283210754395, -5.517395496368408, -4.984062671661377, -4.4507293701171875, -3.9173965454101562, -3.384063720703125, -2.8507308959960938, -2.3173978328704834, -1.7840648889541626, -1.2507319450378418, -0.7173991203308105, -0.1840660572052002, 0.34926700592041016, 0.8825998306274414, 1.4159327745437622, 1.949265718460083, 2.4825987815856934, 3.0159316062927246, 3.549264430999756, 4.082597732543945, 4.615930557250977, 5.149263381958008, 5.682596206665039, 6.21592903137207, 6.74926233291626, 7.282595157623291, 7.815927982330322, 8.349261283874512, 8.882594108581543, 9.41592788696289, 9.949260711669922, 10.482593536376953, 11.015926361083984, 11.549259185791016, 12.082592010498047, 12.615925788879395, 13.149258613586426, 13.682591438293457, 14.215924263000488, 14.74925708770752, 15.28258991241455, 15.815923690795898, 16.34925651550293, 16.88258934020996, 17.415922164916992, 17.949254989624023, 18.482587814331055, 19.015920639038086, 19.549253463745117, 20.08258628845215, 20.61591911315918, 21.14925193786621, 21.682586669921875, 22.215919494628906, 22.749252319335938, 23.28258514404297, 23.81591796875, 24.34925079345703, 24.882583618164062, 25.415916442871094, 25.949249267578125, 26.482582092285156]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 0.0, 4.0, 3.0, 5.0, 6.0, 15.0, 10.0, 15.0, 26.0, 19.0, 20.0, 32.0, 41.0, 35.0, 29.0, 51.0, 46.0, 52.0, 35.0, 55.0, 38.0, 51.0, 48.0, 41.0, 45.0, 39.0, 45.0, 28.0, 33.0, 29.0, 18.0, 13.0, 17.0, 19.0, 10.0, 8.0, 3.0, 6.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.219491004943848, -5.038363456726074, -4.857235431671143, -4.676107883453369, -4.4949798583984375, -4.313852310180664, -4.132724761962891, -3.951596975326538, -3.7704691886901855, -3.589341402053833, -3.4082136154174805, -3.227086067199707, -3.0459582805633545, -2.864830493927002, -2.6837029457092285, -2.502575159072876, -2.3214473724365234, -2.140319585800171, -1.959191918373108, -1.778064250946045, -1.5969364643096924, -1.4158086776733398, -1.2346810102462769, -1.0535533428192139, -0.8724255561828613, -0.6912978291511536, -0.5101701021194458, -0.32904237508773804, -0.14791464805603027, 0.03321307897567749, 0.21434080600738525, 0.39546847343444824, 0.5765962600708008, 0.7577239871025085, 0.9388517141342163, 1.1199793815612793, 1.3011071681976318, 1.4822349548339844, 1.6633626222610474, 1.8444902896881104, 2.025618076324463, 2.2067458629608154, 2.387873649597168, 2.5690011978149414, 2.750128984451294, 2.9312567710876465, 3.11238431930542, 3.2935121059417725, 3.474639892578125, 3.6557676792144775, 3.83689546585083, 4.0180230140686035, 4.199151039123535, 4.380278587341309, 4.561406135559082, 4.7425336837768555, 4.923661708831787, 5.1047892570495605, 5.285917282104492, 5.467044830322266, 5.648172378540039, 5.829300403594971, 6.010427951812744, 6.191555976867676, 6.372683525085449]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 6.0, 4.0, 8.0, 9.0, 15.0, 15.0, 23.0, 23.0, 46.0, 56.0, 99.0, 220.0, 598.0, 2453.0, 12563.0, 78340.0, 476348.0, 402481.0, 62028.0, 10232.0, 1937.0, 531.0, 203.0, 84.0, 59.0, 43.0, 35.0, 17.0, 10.0, 17.0, 7.0, 10.0, 10.0, 3.0, 4.0, 4.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.91015625, -7.6900634765625, -7.469970703125, -7.2498779296875, -7.02978515625, -6.8096923828125, -6.589599609375, -6.3695068359375, -6.1494140625, -5.9293212890625, -5.709228515625, -5.4891357421875, -5.26904296875, -5.0489501953125, -4.828857421875, -4.6087646484375, -4.388671875, -4.1685791015625, -3.948486328125, -3.7283935546875, -3.50830078125, -3.2882080078125, -3.068115234375, -2.8480224609375, -2.6279296875, -2.4078369140625, -2.187744140625, -1.9676513671875, -1.74755859375, -1.5274658203125, -1.307373046875, -1.0872802734375, -0.8671875, -0.6470947265625, -0.427001953125, -0.2069091796875, 0.01318359375, 0.2332763671875, 0.453369140625, 0.6734619140625, 0.8935546875, 1.1136474609375, 1.333740234375, 1.5538330078125, 1.77392578125, 1.9940185546875, 2.214111328125, 2.4342041015625, 2.654296875, 2.8743896484375, 3.094482421875, 3.3145751953125, 3.53466796875, 3.7547607421875, 3.974853515625, 4.1949462890625, 4.4150390625, 4.6351318359375, 4.855224609375, 5.0753173828125, 5.29541015625, 5.5155029296875, 5.735595703125, 5.9556884765625, 6.17578125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 6.0, 1.0, 18.0, 18.0, 32.0, 50.0, 52.0, 90.0, 92.0, 109.0, 118.0, 107.0, 94.0, 71.0, 52.0, 41.0, 27.0, 13.0, 12.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59716796875, -0.5522842407226562, -0.5074005126953125, -0.46251678466796875, -0.417633056640625, -0.37274932861328125, -0.3278656005859375, -0.28298187255859375, -0.23809814453125, -0.19321441650390625, -0.1483306884765625, -0.10344696044921875, -0.058563232421875, -0.01367950439453125, 0.0312042236328125, 0.07608795166015625, 0.1209716796875, 0.16585540771484375, 0.2107391357421875, 0.25562286376953125, 0.300506591796875, 0.34539031982421875, 0.3902740478515625, 0.43515777587890625, 0.48004150390625, 0.5249252319335938, 0.5698089599609375, 0.6146926879882812, 0.659576416015625, 0.7044601440429688, 0.7493438720703125, 0.7942276000976562, 0.839111328125, 0.8839950561523438, 0.9288787841796875, 0.9737625122070312, 1.018646240234375, 1.0635299682617188, 1.1084136962890625, 1.1532974243164062, 1.19818115234375, 1.2430648803710938, 1.2879486083984375, 1.3328323364257812, 1.377716064453125, 1.4225997924804688, 1.4674835205078125, 1.5123672485351562, 1.5572509765625, 1.6021347045898438, 1.6470184326171875, 1.6919021606445312, 1.736785888671875, 1.7816696166992188, 1.8265533447265625, 1.8714370727539062, 1.91632080078125, 1.9612045288085938, 2.0060882568359375, 2.0509719848632812, 2.095855712890625, 2.1407394409179688, 2.1856231689453125, 2.2305068969726562, 2.275390625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 8.0, 3.0, 14.0, 6.0, 16.0, 18.0, 34.0, 43.0, 64.0, 65.0, 104.0, 169.0, 283.0, 458.0, 856.0, 1734.0, 3947.0, 10669.0, 32153.0, 109168.0, 356281.0, 366409.0, 113422.0, 33659.0, 10833.0, 4144.0, 1792.0, 888.0, 458.0, 293.0, 177.0, 116.0, 95.0, 65.0, 32.0, 22.0, 16.0, 10.0, 7.0, 10.0, 6.0, 3.0, 2.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.41015625, -4.284210205078125, -4.15826416015625, -4.032318115234375, -3.9063720703125, -3.780426025390625, -3.65447998046875, -3.528533935546875, -3.402587890625, -3.276641845703125, -3.15069580078125, -3.024749755859375, -2.8988037109375, -2.772857666015625, -2.64691162109375, -2.520965576171875, -2.39501953125, -2.269073486328125, -2.14312744140625, -2.017181396484375, -1.8912353515625, -1.765289306640625, -1.63934326171875, -1.513397216796875, -1.387451171875, -1.261505126953125, -1.13555908203125, -1.009613037109375, -0.8836669921875, -0.757720947265625, -0.63177490234375, -0.505828857421875, -0.3798828125, -0.253936767578125, -0.12799072265625, -0.002044677734375, 0.1239013671875, 0.249847412109375, 0.37579345703125, 0.501739501953125, 0.627685546875, 0.753631591796875, 0.87957763671875, 1.005523681640625, 1.1314697265625, 1.257415771484375, 1.38336181640625, 1.509307861328125, 1.63525390625, 1.761199951171875, 1.88714599609375, 2.013092041015625, 2.1390380859375, 2.264984130859375, 2.39093017578125, 2.516876220703125, 2.642822265625, 2.768768310546875, 2.89471435546875, 3.020660400390625, 3.1466064453125, 3.272552490234375, 3.39849853515625, 3.524444580078125, 3.650390625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 5.0, 9.0, 8.0, 21.0, 20.0, 22.0, 27.0, 18.0, 32.0, 45.0, 49.0, 46.0, 41.0, 54.0, 55.0, 53.0, 43.0, 55.0, 44.0, 45.0, 54.0, 45.0, 34.0, 32.0, 27.0, 22.0, 14.0, 21.0, 17.0, 6.0, 6.0, 8.0, 4.0, 5.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7890625, -2.6807861328125, -2.572509765625, -2.4642333984375, -2.35595703125, -2.2476806640625, -2.139404296875, -2.0311279296875, -1.9228515625, -1.8145751953125, -1.706298828125, -1.5980224609375, -1.48974609375, -1.3814697265625, -1.273193359375, -1.1649169921875, -1.056640625, -0.9483642578125, -0.840087890625, -0.7318115234375, -0.62353515625, -0.5152587890625, -0.406982421875, -0.2987060546875, -0.1904296875, -0.0821533203125, 0.026123046875, 0.1343994140625, 0.24267578125, 0.3509521484375, 0.459228515625, 0.5675048828125, 0.67578125, 0.7840576171875, 0.892333984375, 1.0006103515625, 1.10888671875, 1.2171630859375, 1.325439453125, 1.4337158203125, 1.5419921875, 1.6502685546875, 1.758544921875, 1.8668212890625, 1.97509765625, 2.0833740234375, 2.191650390625, 2.2999267578125, 2.408203125, 2.5164794921875, 2.624755859375, 2.7330322265625, 2.84130859375, 2.9495849609375, 3.057861328125, 3.1661376953125, 3.2744140625, 3.3826904296875, 3.490966796875, 3.5992431640625, 3.70751953125, 3.8157958984375, 3.924072265625, 4.0323486328125, 4.140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 6.0, 9.0, 19.0, 20.0, 40.0, 63.0, 128.0, 211.0, 430.0, 802.0, 1742.0, 4062.0, 11260.0, 37077.0, 160964.0, 506651.0, 246106.0, 54086.0, 15286.0, 5377.0, 2144.0, 970.0, 448.0, 245.0, 164.0, 80.0, 58.0, 36.0, 14.0, 18.0, 10.0, 10.0, 7.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.48828125, -2.425506591796875, -2.36273193359375, -2.299957275390625, -2.2371826171875, -2.174407958984375, -2.11163330078125, -2.048858642578125, -1.986083984375, -1.923309326171875, -1.86053466796875, -1.797760009765625, -1.7349853515625, -1.672210693359375, -1.60943603515625, -1.546661376953125, -1.48388671875, -1.421112060546875, -1.35833740234375, -1.295562744140625, -1.2327880859375, -1.170013427734375, -1.10723876953125, -1.044464111328125, -0.981689453125, -0.918914794921875, -0.85614013671875, -0.793365478515625, -0.7305908203125, -0.667816162109375, -0.60504150390625, -0.542266845703125, -0.4794921875, -0.416717529296875, -0.35394287109375, -0.291168212890625, -0.2283935546875, -0.165618896484375, -0.10284423828125, -0.040069580078125, 0.022705078125, 0.085479736328125, 0.14825439453125, 0.211029052734375, 0.2738037109375, 0.336578369140625, 0.39935302734375, 0.462127685546875, 0.52490234375, 0.587677001953125, 0.65045166015625, 0.713226318359375, 0.7760009765625, 0.838775634765625, 0.90155029296875, 0.964324951171875, 1.027099609375, 1.089874267578125, 1.15264892578125, 1.215423583984375, 1.2781982421875, 1.340972900390625, 1.40374755859375, 1.466522216796875, 1.529296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 10.0, 10.0, 11.0, 21.0, 25.0, 40.0, 45.0, 63.0, 75.0, 145.0, 149.0, 133.0, 82.0, 41.0, 38.0, 30.0, 25.0, 13.0, 13.0, 8.0, 7.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005025863647460938, -0.00048595666885375977, -0.0004693269729614258, -0.0004526972770690918, -0.0004360675811767578, -0.00041943788528442383, -0.00040280818939208984, -0.00038617849349975586, -0.0003695487976074219, -0.0003529191017150879, -0.0003362894058227539, -0.0003196597099304199, -0.00030303001403808594, -0.00028640031814575195, -0.00026977062225341797, -0.000253140926361084, -0.00023651123046875, -0.00021988153457641602, -0.00020325183868408203, -0.00018662214279174805, -0.00016999244689941406, -0.00015336275100708008, -0.0001367330551147461, -0.00012010335922241211, -0.00010347366333007812, -8.684396743774414e-05, -7.021427154541016e-05, -5.358457565307617e-05, -3.695487976074219e-05, -2.0325183868408203e-05, -3.6954879760742188e-06, 1.2934207916259766e-05, 2.956390380859375e-05, 4.6193599700927734e-05, 6.282329559326172e-05, 7.94529914855957e-05, 9.608268737792969e-05, 0.00011271238327026367, 0.00012934207916259766, 0.00014597177505493164, 0.00016260147094726562, 0.0001792311668395996, 0.0001958608627319336, 0.00021249055862426758, 0.00022912025451660156, 0.00024574995040893555, 0.00026237964630126953, 0.0002790093421936035, 0.0002956390380859375, 0.0003122687339782715, 0.00032889842987060547, 0.00034552812576293945, 0.00036215782165527344, 0.0003787875175476074, 0.0003954172134399414, 0.0004120469093322754, 0.0004286766052246094, 0.00044530630111694336, 0.00046193599700927734, 0.00047856569290161133, 0.0004951953887939453, 0.0005118250846862793, 0.0005284547805786133, 0.0005450844764709473, 0.0005617141723632812]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 12.0, 16.0, 19.0, 35.0, 69.0, 139.0, 257.0, 504.0, 1193.0, 3105.0, 10571.0, 49424.0, 378455.0, 514744.0, 69578.0, 13864.0, 3987.0, 1422.0, 559.0, 252.0, 156.0, 74.0, 40.0, 22.0, 12.0, 4.0, 11.0, 3.0, 5.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9453125, -2.847442626953125, -2.74957275390625, -2.651702880859375, -2.5538330078125, -2.455963134765625, -2.35809326171875, -2.260223388671875, -2.162353515625, -2.064483642578125, -1.96661376953125, -1.868743896484375, -1.7708740234375, -1.673004150390625, -1.57513427734375, -1.477264404296875, -1.37939453125, -1.281524658203125, -1.18365478515625, -1.085784912109375, -0.9879150390625, -0.890045166015625, -0.79217529296875, -0.694305419921875, -0.596435546875, -0.498565673828125, -0.40069580078125, -0.302825927734375, -0.2049560546875, -0.107086181640625, -0.00921630859375, 0.088653564453125, 0.1865234375, 0.284393310546875, 0.38226318359375, 0.480133056640625, 0.5780029296875, 0.675872802734375, 0.77374267578125, 0.871612548828125, 0.969482421875, 1.067352294921875, 1.16522216796875, 1.263092041015625, 1.3609619140625, 1.458831787109375, 1.55670166015625, 1.654571533203125, 1.75244140625, 1.850311279296875, 1.94818115234375, 2.046051025390625, 2.1439208984375, 2.241790771484375, 2.33966064453125, 2.437530517578125, 2.535400390625, 2.633270263671875, 2.73114013671875, 2.829010009765625, 2.9268798828125, 3.024749755859375, 3.12261962890625, 3.220489501953125, 3.318359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 5.0, 6.0, 5.0, 13.0, 18.0, 14.0, 31.0, 35.0, 46.0, 64.0, 65.0, 74.0, 102.0, 89.0, 98.0, 70.0, 65.0, 52.0, 32.0, 20.0, 24.0, 17.0, 11.0, 5.0, 4.0, 9.0, 8.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7265625, -1.67120361328125, -1.6158447265625, -1.56048583984375, -1.505126953125, -1.44976806640625, -1.3944091796875, -1.33905029296875, -1.28369140625, -1.22833251953125, -1.1729736328125, -1.11761474609375, -1.062255859375, -1.00689697265625, -0.9515380859375, -0.89617919921875, -0.8408203125, -0.78546142578125, -0.7301025390625, -0.67474365234375, -0.619384765625, -0.56402587890625, -0.5086669921875, -0.45330810546875, -0.39794921875, -0.34259033203125, -0.2872314453125, -0.23187255859375, -0.176513671875, -0.12115478515625, -0.0657958984375, -0.01043701171875, 0.044921875, 0.10028076171875, 0.1556396484375, 0.21099853515625, 0.266357421875, 0.32171630859375, 0.3770751953125, 0.43243408203125, 0.48779296875, 0.54315185546875, 0.5985107421875, 0.65386962890625, 0.709228515625, 0.76458740234375, 0.8199462890625, 0.87530517578125, 0.9306640625, 0.98602294921875, 1.0413818359375, 1.09674072265625, 1.152099609375, 1.20745849609375, 1.2628173828125, 1.31817626953125, 1.37353515625, 1.42889404296875, 1.4842529296875, 1.53961181640625, 1.594970703125, 1.65032958984375, 1.7056884765625, 1.76104736328125, 1.81640625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 29.0, 33.0, 58.0, 80.0, 109.0, 155.0, 144.0, 133.0, 93.0, 68.0, 37.0, 22.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.28330421447754, -24.386962890625, -23.490623474121094, -22.594282150268555, -21.697940826416016, -20.80160140991211, -19.90526008605957, -19.00891876220703, -18.112579345703125, -17.216238021850586, -16.31989860534668, -15.42355728149414, -14.527216911315918, -13.630876541137695, -12.734535217285156, -11.838194847106934, -10.941854476928711, -10.045514106750488, -9.149173736572266, -8.252832412719727, -7.356492042541504, -6.460151672363281, -5.5638108253479, -4.6674699783325195, -3.771129608154297, -2.874788999557495, -1.9784483909606934, -1.0821077823638916, -0.18576717376708984, 0.7105731964111328, 1.6069140434265137, 2.5032548904418945, 3.39959716796875, 4.295937538146973, 5.1922783851623535, 6.088619232177734, 6.984959602355957, 7.88129997253418, 8.777641296386719, 9.673981666564941, 10.570322036743164, 11.466662406921387, 12.36300277709961, 13.259344100952148, 14.155684471130371, 15.052024841308594, 15.948366165161133, 16.844707489013672, 17.741046905517578, 18.637388229370117, 19.533727645874023, 20.430068969726562, 21.32640838623047, 22.222749710083008, 23.119091033935547, 24.015430450439453, 24.911771774291992, 25.80811309814453, 26.704452514648438, 27.600793838500977, 28.497135162353516, 29.393474578857422, 30.28981590270996, 31.1861572265625, 32.082496643066406]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 7.0, 6.0, 18.0, 15.0, 17.0, 25.0, 39.0, 28.0, 33.0, 49.0, 50.0, 42.0, 56.0, 51.0, 52.0, 50.0, 48.0, 57.0, 47.0, 45.0, 51.0, 45.0, 29.0, 26.0, 17.0, 17.0, 16.0, 11.0, 13.0, 6.0, 7.0, 6.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.823549270629883, -19.22077178955078, -18.617992401123047, -18.015214920043945, -17.412437438964844, -16.809659957885742, -16.20688247680664, -15.604103088378906, -15.001325607299805, -14.398548126220703, -13.795769691467285, -13.192991256713867, -12.590213775634766, -11.987436294555664, -11.384657859802246, -10.781879425048828, -10.179101943969727, -9.576324462890625, -8.973546028137207, -8.370767593383789, -7.7679901123046875, -7.165212154388428, -6.562434196472168, -5.959656238555908, -5.356878280639648, -4.754100322723389, -4.151322364807129, -3.548544406890869, -2.9457664489746094, -2.3429884910583496, -1.7402105331420898, -1.13743257522583, -0.5346565246582031, 0.06812143325805664, 0.6708993911743164, 1.2736773490905762, 1.876455307006836, 2.4792332649230957, 3.0820112228393555, 3.6847891807556152, 4.287567138671875, 4.890345096588135, 5.4931230545043945, 6.095901012420654, 6.698678970336914, 7.301456928253174, 7.904234886169434, 8.507013320922852, 9.109790802001953, 9.712568283081055, 10.315346717834473, 10.91812515258789, 11.520902633666992, 12.123680114746094, 12.726458549499512, 13.32923698425293, 13.932014465332031, 14.534791946411133, 15.13757038116455, 15.740348815917969, 16.34312629699707, 16.945903778076172, 17.548683166503906, 18.151460647583008, 18.75423812866211]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 11.0, 21.0, 39.0, 103.0, 281.0, 916.0, 3609.0, 22305.0, 327906.0, 3765581.0, 63081.0, 7747.0, 1718.0, 500.0, 202.0, 73.0, 43.0, 28.0, 20.0, 15.0, 17.0, 14.0, 14.0, 7.0, 6.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -3.893310546875, -3.59912109375, -3.304931640625, -3.0107421875, -2.716552734375, -2.42236328125, -2.128173828125, -1.833984375, -1.539794921875, -1.24560546875, -0.951416015625, -0.6572265625, -0.363037109375, -0.06884765625, 0.225341796875, 0.51953125, 0.813720703125, 1.10791015625, 1.402099609375, 1.6962890625, 1.990478515625, 2.28466796875, 2.578857421875, 2.873046875, 3.167236328125, 3.46142578125, 3.755615234375, 4.0498046875, 4.343994140625, 4.63818359375, 4.932373046875, 5.2265625, 5.520751953125, 5.81494140625, 6.109130859375, 6.4033203125, 6.697509765625, 6.99169921875, 7.285888671875, 7.580078125, 7.874267578125, 8.16845703125, 8.462646484375, 8.7568359375, 9.051025390625, 9.34521484375, 9.639404296875, 9.93359375, 10.227783203125, 10.52197265625, 10.816162109375, 11.1103515625, 11.404541015625, 11.69873046875, 11.992919921875, 12.287109375, 12.581298828125, 12.87548828125, 13.169677734375, 13.4638671875, 13.758056640625, 14.05224609375, 14.346435546875, 14.640625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 5.0, 11.0, 30.0, 28.0, 53.0, 62.0, 84.0, 89.0, 114.0, 117.0, 104.0, 82.0, 72.0, 55.0, 49.0, 17.0, 25.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54345703125, -0.49910736083984375, -0.4547576904296875, -0.41040802001953125, -0.366058349609375, -0.32170867919921875, -0.2773590087890625, -0.23300933837890625, -0.18865966796875, -0.14430999755859375, -0.0999603271484375, -0.05561065673828125, -0.011260986328125, 0.03308868408203125, 0.0774383544921875, 0.12178802490234375, 0.1661376953125, 0.21048736572265625, 0.2548370361328125, 0.29918670654296875, 0.343536376953125, 0.38788604736328125, 0.4322357177734375, 0.47658538818359375, 0.52093505859375, 0.5652847290039062, 0.6096343994140625, 0.6539840698242188, 0.698333740234375, 0.7426834106445312, 0.7870330810546875, 0.8313827514648438, 0.875732421875, 0.9200820922851562, 0.9644317626953125, 1.0087814331054688, 1.053131103515625, 1.0974807739257812, 1.1418304443359375, 1.1861801147460938, 1.23052978515625, 1.2748794555664062, 1.3192291259765625, 1.3635787963867188, 1.407928466796875, 1.4522781372070312, 1.4966278076171875, 1.5409774780273438, 1.5853271484375, 1.6296768188476562, 1.6740264892578125, 1.7183761596679688, 1.762725830078125, 1.8070755004882812, 1.8514251708984375, 1.8957748413085938, 1.94012451171875, 1.9844741821289062, 2.0288238525390625, 2.0731735229492188, 2.117523193359375, 2.1618728637695312, 2.2062225341796875, 2.2505722045898438, 2.294921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 10.0, 14.0, 33.0, 64.0, 123.0, 228.0, 473.0, 1390.0, 6813.0, 123379.0, 3998353.0, 56458.0, 4826.0, 1196.0, 438.0, 195.0, 132.0, 73.0, 29.0, 21.0, 11.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2265625, -10.7845458984375, -10.342529296875, -9.9005126953125, -9.45849609375, -9.0164794921875, -8.574462890625, -8.1324462890625, -7.6904296875, -7.2484130859375, -6.806396484375, -6.3643798828125, -5.92236328125, -5.4803466796875, -5.038330078125, -4.5963134765625, -4.154296875, -3.7122802734375, -3.270263671875, -2.8282470703125, -2.38623046875, -1.9442138671875, -1.502197265625, -1.0601806640625, -0.6181640625, -0.1761474609375, 0.265869140625, 0.7078857421875, 1.14990234375, 1.5919189453125, 2.033935546875, 2.4759521484375, 2.91796875, 3.3599853515625, 3.802001953125, 4.2440185546875, 4.68603515625, 5.1280517578125, 5.570068359375, 6.0120849609375, 6.4541015625, 6.8961181640625, 7.338134765625, 7.7801513671875, 8.22216796875, 8.6641845703125, 9.106201171875, 9.5482177734375, 9.990234375, 10.4322509765625, 10.874267578125, 11.3162841796875, 11.75830078125, 12.2003173828125, 12.642333984375, 13.0843505859375, 13.5263671875, 13.9683837890625, 14.410400390625, 14.8524169921875, 15.29443359375, 15.7364501953125, 16.178466796875, 16.6204833984375, 17.0625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 6.0, 10.0, 5.0, 20.0, 24.0, 48.0, 81.0, 161.0, 385.0, 1798.0, 977.0, 271.0, 119.0, 58.0, 41.0, 22.0, 10.0, 16.0, 3.0, 9.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.605712890625, -2.51220703125, -2.418701171875, -2.3251953125, -2.231689453125, -2.13818359375, -2.044677734375, -1.951171875, -1.857666015625, -1.76416015625, -1.670654296875, -1.5771484375, -1.483642578125, -1.39013671875, -1.296630859375, -1.203125, -1.109619140625, -1.01611328125, -0.922607421875, -0.8291015625, -0.735595703125, -0.64208984375, -0.548583984375, -0.455078125, -0.361572265625, -0.26806640625, -0.174560546875, -0.0810546875, 0.012451171875, 0.10595703125, 0.199462890625, 0.29296875, 0.386474609375, 0.47998046875, 0.573486328125, 0.6669921875, 0.760498046875, 0.85400390625, 0.947509765625, 1.041015625, 1.134521484375, 1.22802734375, 1.321533203125, 1.4150390625, 1.508544921875, 1.60205078125, 1.695556640625, 1.7890625, 1.882568359375, 1.97607421875, 2.069580078125, 2.1630859375, 2.256591796875, 2.35009765625, 2.443603515625, 2.537109375, 2.630615234375, 2.72412109375, 2.817626953125, 2.9111328125, 3.004638671875, 3.09814453125, 3.191650390625, 3.28515625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 6.0, 22.0, 54.0, 81.0, 164.0, 265.0, 209.0, 114.0, 46.0, 18.0, 9.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.306617736816406, -30.49951171875, -29.692405700683594, -28.885299682617188, -28.07819175720215, -27.271085739135742, -26.463979721069336, -25.65687370300293, -24.84976577758789, -24.042659759521484, -23.235553741455078, -22.428447723388672, -21.621339797973633, -20.814233779907227, -20.00712776184082, -19.200021743774414, -18.392915725708008, -17.5858097076416, -16.778703689575195, -15.971596717834473, -15.16448974609375, -14.357383728027344, -13.550277709960938, -12.743171691894531, -11.936064720153809, -11.128958702087402, -10.32185173034668, -9.514745712280273, -8.707639694213867, -7.9005327224731445, -7.093426704406738, -6.286320209503174, -5.479213714599609, -4.672107219696045, -3.8650009632110596, -3.057894706726074, -2.2507882118225098, -1.4436817169189453, -0.6365756988525391, 0.1705307960510254, 0.9776372909545898, 1.7847436666488647, 2.5918500423431396, 3.398956298828125, 4.2060627937316895, 5.013169288635254, 5.82027530670166, 6.627381801605225, 7.434488296508789, 8.241594314575195, 9.048701286315918, 9.855807304382324, 10.662914276123047, 11.470020294189453, 12.27712631225586, 13.084232330322266, 13.891339302062988, 14.698445320129395, 15.505552291870117, 16.312658309936523, 17.11976432800293, 17.92687225341797, 18.733978271484375, 19.54108428955078, 20.348190307617188]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 6.0, 4.0, 9.0, 10.0, 19.0, 24.0, 30.0, 42.0, 39.0, 36.0, 48.0, 61.0, 53.0, 53.0, 66.0, 69.0, 84.0, 56.0, 37.0, 50.0, 42.0, 37.0, 31.0, 24.0, 20.0, 6.0, 18.0, 8.0, 12.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.033018112182617, -8.729249000549316, -8.425479888916016, -8.121710777282715, -7.817941665649414, -7.514172554016113, -7.210403919219971, -6.90663480758667, -6.602865695953369, -6.299096584320068, -5.995327472686768, -5.691558361053467, -5.387789726257324, -5.084020614624023, -4.780251502990723, -4.476482391357422, -4.172713279724121, -3.8689441680908203, -3.5651750564575195, -3.261406183242798, -2.957637071609497, -2.6538679599761963, -2.3500990867614746, -2.046329975128174, -1.742560863494873, -1.4387917518615723, -1.135022759437561, -0.831253707408905, -0.527484655380249, -0.22371554374694824, 0.08005344867706299, 0.3838224411010742, 0.6875925064086914, 0.9913615584373474, 1.2951306104660034, 1.5988996028900146, 1.9026687145233154, 2.206437826156616, 2.510206699371338, 2.8139758110046387, 3.1177449226379395, 3.4215140342712402, 3.725283145904541, 4.029052257537842, 4.332820892333984, 4.636590003967285, 4.940359115600586, 5.244128227233887, 5.5478973388671875, 5.851666450500488, 6.155435562133789, 6.45920467376709, 6.762973785400391, 7.066742897033691, 7.370511531829834, 7.674280643463135, 7.9780497550964355, 8.281818389892578, 8.585587501525879, 8.88935661315918, 9.19312572479248, 9.496894836425781, 9.800663948059082, 10.104433059692383, 10.408202171325684]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 5.0, 14.0, 32.0, 47.0, 53.0, 87.0, 177.0, 344.0, 843.0, 2771.0, 11204.0, 59660.0, 358772.0, 506636.0, 86597.0, 15603.0, 3619.0, 1124.0, 414.0, 204.0, 121.0, 65.0, 44.0, 32.0, 16.0, 15.0, 3.0, 8.0, 4.0, 8.0, 1.0, 3.0, 1.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.81640625, -6.58221435546875, -6.3480224609375, -6.11383056640625, -5.879638671875, -5.64544677734375, -5.4112548828125, -5.17706298828125, -4.94287109375, -4.70867919921875, -4.4744873046875, -4.24029541015625, -4.006103515625, -3.77191162109375, -3.5377197265625, -3.30352783203125, -3.0693359375, -2.83514404296875, -2.6009521484375, -2.36676025390625, -2.132568359375, -1.89837646484375, -1.6641845703125, -1.42999267578125, -1.19580078125, -0.96160888671875, -0.7274169921875, -0.49322509765625, -0.259033203125, -0.02484130859375, 0.2093505859375, 0.44354248046875, 0.677734375, 0.91192626953125, 1.1461181640625, 1.38031005859375, 1.614501953125, 1.84869384765625, 2.0828857421875, 2.31707763671875, 2.55126953125, 2.78546142578125, 3.0196533203125, 3.25384521484375, 3.488037109375, 3.72222900390625, 3.9564208984375, 4.19061279296875, 4.4248046875, 4.65899658203125, 4.8931884765625, 5.12738037109375, 5.361572265625, 5.59576416015625, 5.8299560546875, 6.06414794921875, 6.29833984375, 6.53253173828125, 6.7667236328125, 7.00091552734375, 7.235107421875, 7.46929931640625, 7.7034912109375, 7.93768310546875, 8.171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 10.0, 11.0, 11.0, 21.0, 32.0, 38.0, 65.0, 66.0, 89.0, 102.0, 114.0, 101.0, 80.0, 72.0, 67.0, 44.0, 34.0, 26.0, 6.0, 7.0, 9.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.5852737426757812, -0.5450592041015625, -0.5048446655273438, -0.464630126953125, -0.42441558837890625, -0.3842010498046875, -0.34398651123046875, -0.30377197265625, -0.26355743408203125, -0.2233428955078125, -0.18312835693359375, -0.142913818359375, -0.10269927978515625, -0.0624847412109375, -0.02227020263671875, 0.0179443359375, 0.05815887451171875, 0.0983734130859375, 0.13858795166015625, 0.178802490234375, 0.21901702880859375, 0.2592315673828125, 0.29944610595703125, 0.33966064453125, 0.37987518310546875, 0.4200897216796875, 0.46030426025390625, 0.500518798828125, 0.5407333374023438, 0.5809478759765625, 0.6211624145507812, 0.661376953125, 0.7015914916992188, 0.7418060302734375, 0.7820205688476562, 0.822235107421875, 0.8624496459960938, 0.9026641845703125, 0.9428787231445312, 0.98309326171875, 1.0233078002929688, 1.0635223388671875, 1.1037368774414062, 1.143951416015625, 1.1841659545898438, 1.2243804931640625, 1.2645950317382812, 1.3048095703125, 1.3450241088867188, 1.3852386474609375, 1.4254531860351562, 1.465667724609375, 1.5058822631835938, 1.5460968017578125, 1.5863113403320312, 1.62652587890625, 1.6667404174804688, 1.7069549560546875, 1.7471694946289062, 1.787384033203125, 1.8275985717773438, 1.8678131103515625, 1.9080276489257812, 1.9482421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 5.0, 14.0, 13.0, 14.0, 35.0, 48.0, 110.0, 177.0, 355.0, 648.0, 1539.0, 4415.0, 13630.0, 51806.0, 227085.0, 537307.0, 157731.0, 37296.0, 10397.0, 3449.0, 1290.0, 547.0, 283.0, 152.0, 80.0, 37.0, 33.0, 20.0, 16.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.04754638671875, -3.8880615234375, -3.72857666015625, -3.569091796875, -3.40960693359375, -3.2501220703125, -3.09063720703125, -2.93115234375, -2.77166748046875, -2.6121826171875, -2.45269775390625, -2.293212890625, -2.13372802734375, -1.9742431640625, -1.81475830078125, -1.6552734375, -1.49578857421875, -1.3363037109375, -1.17681884765625, -1.017333984375, -0.85784912109375, -0.6983642578125, -0.53887939453125, -0.37939453125, -0.21990966796875, -0.0604248046875, 0.09906005859375, 0.258544921875, 0.41802978515625, 0.5775146484375, 0.73699951171875, 0.896484375, 1.05596923828125, 1.2154541015625, 1.37493896484375, 1.534423828125, 1.69390869140625, 1.8533935546875, 2.01287841796875, 2.17236328125, 2.33184814453125, 2.4913330078125, 2.65081787109375, 2.810302734375, 2.96978759765625, 3.1292724609375, 3.28875732421875, 3.4482421875, 3.60772705078125, 3.7672119140625, 3.92669677734375, 4.086181640625, 4.24566650390625, 4.4051513671875, 4.56463623046875, 4.72412109375, 4.88360595703125, 5.0430908203125, 5.20257568359375, 5.362060546875, 5.52154541015625, 5.6810302734375, 5.84051513671875, 6.0]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 5.0, 4.0, 11.0, 8.0, 15.0, 12.0, 13.0, 17.0, 22.0, 29.0, 21.0, 24.0, 42.0, 46.0, 50.0, 47.0, 56.0, 46.0, 63.0, 40.0, 59.0, 51.0, 42.0, 42.0, 23.0, 36.0, 27.0, 27.0, 19.0, 17.0, 20.0, 13.0, 15.0, 7.0, 11.0, 4.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15625, -3.050628662109375, -2.94500732421875, -2.839385986328125, -2.7337646484375, -2.628143310546875, -2.52252197265625, -2.416900634765625, -2.311279296875, -2.205657958984375, -2.10003662109375, -1.994415283203125, -1.8887939453125, -1.783172607421875, -1.67755126953125, -1.571929931640625, -1.46630859375, -1.360687255859375, -1.25506591796875, -1.149444580078125, -1.0438232421875, -0.938201904296875, -0.83258056640625, -0.726959228515625, -0.621337890625, -0.515716552734375, -0.41009521484375, -0.304473876953125, -0.1988525390625, -0.093231201171875, 0.01239013671875, 0.118011474609375, 0.2236328125, 0.329254150390625, 0.43487548828125, 0.540496826171875, 0.6461181640625, 0.751739501953125, 0.85736083984375, 0.962982177734375, 1.068603515625, 1.174224853515625, 1.27984619140625, 1.385467529296875, 1.4910888671875, 1.596710205078125, 1.70233154296875, 1.807952880859375, 1.91357421875, 2.019195556640625, 2.12481689453125, 2.230438232421875, 2.3360595703125, 2.441680908203125, 2.54730224609375, 2.652923583984375, 2.758544921875, 2.864166259765625, 2.96978759765625, 3.075408935546875, 3.1810302734375, 3.286651611328125, 3.39227294921875, 3.497894287109375, 3.603515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 14.0, 16.0, 19.0, 27.0, 36.0, 55.0, 125.0, 143.0, 253.0, 427.0, 890.0, 1524.0, 3398.0, 7760.0, 19752.0, 64151.0, 418169.0, 431074.0, 66053.0, 19820.0, 7892.0, 3452.0, 1537.0, 884.0, 397.0, 264.0, 148.0, 89.0, 53.0, 44.0, 28.0, 14.0, 14.0, 14.0, 7.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.205078125, -3.101715087890625, -2.99835205078125, -2.894989013671875, -2.7916259765625, -2.688262939453125, -2.58489990234375, -2.481536865234375, -2.378173828125, -2.274810791015625, -2.17144775390625, -2.068084716796875, -1.9647216796875, -1.861358642578125, -1.75799560546875, -1.654632568359375, -1.55126953125, -1.447906494140625, -1.34454345703125, -1.241180419921875, -1.1378173828125, -1.034454345703125, -0.93109130859375, -0.827728271484375, -0.724365234375, -0.621002197265625, -0.51763916015625, -0.414276123046875, -0.3109130859375, -0.207550048828125, -0.10418701171875, -0.000823974609375, 0.1025390625, 0.205902099609375, 0.30926513671875, 0.412628173828125, 0.5159912109375, 0.619354248046875, 0.72271728515625, 0.826080322265625, 0.929443359375, 1.032806396484375, 1.13616943359375, 1.239532470703125, 1.3428955078125, 1.446258544921875, 1.54962158203125, 1.652984619140625, 1.75634765625, 1.859710693359375, 1.96307373046875, 2.066436767578125, 2.1697998046875, 2.273162841796875, 2.37652587890625, 2.479888916015625, 2.583251953125, 2.686614990234375, 2.78997802734375, 2.893341064453125, 2.9967041015625, 3.100067138671875, 3.20343017578125, 3.306793212890625, 3.41015625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 8.0, 5.0, 7.0, 12.0, 11.0, 18.0, 25.0, 30.0, 40.0, 42.0, 59.0, 76.0, 111.0, 125.0, 102.0, 71.0, 59.0, 32.0, 26.0, 17.0, 19.0, 18.0, 14.0, 13.0, 14.0, 4.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00045871734619140625, -0.00044493749737739563, -0.000431157648563385, -0.0004173777997493744, -0.00040359795093536377, -0.00038981810212135315, -0.00037603825330734253, -0.0003622584044933319, -0.0003484785556793213, -0.00033469870686531067, -0.00032091885805130005, -0.00030713900923728943, -0.0002933591604232788, -0.0002795793116092682, -0.00026579946279525757, -0.00025201961398124695, -0.00023823976516723633, -0.0002244599163532257, -0.0002106800675392151, -0.00019690021872520447, -0.00018312036991119385, -0.00016934052109718323, -0.0001555606722831726, -0.000141780823469162, -0.00012800097465515137, -0.00011422112584114075, -0.00010044127702713013, -8.666142821311951e-05, -7.288157939910889e-05, -5.9101730585098267e-05, -4.5321881771087646e-05, -3.1542032957077026e-05, -1.7762184143066406e-05, -3.982335329055786e-06, 9.797513484954834e-06, 2.3577362298965454e-05, 3.7357211112976074e-05, 5.1137059926986694e-05, 6.491690874099731e-05, 7.869675755500793e-05, 9.247660636901855e-05, 0.00010625645518302917, 0.0001200363039970398, 0.00013381615281105042, 0.00014759600162506104, 0.00016137585043907166, 0.00017515569925308228, 0.0001889355480670929, 0.00020271539688110352, 0.00021649524569511414, 0.00023027509450912476, 0.00024405494332313538, 0.000257834792137146, 0.0002716146409511566, 0.00028539448976516724, 0.00029917433857917786, 0.0003129541873931885, 0.0003267340362071991, 0.0003405138850212097, 0.00035429373383522034, 0.00036807358264923096, 0.0003818534314632416, 0.0003956332802772522, 0.0004094131290912628, 0.00042319297790527344]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 9.0, 12.0, 14.0, 20.0, 20.0, 39.0, 66.0, 91.0, 175.0, 256.0, 561.0, 1051.0, 2204.0, 4480.0, 10208.0, 25227.0, 80272.0, 469761.0, 351762.0, 63886.0, 21575.0, 8831.0, 4008.0, 1834.0, 982.0, 460.0, 261.0, 144.0, 87.0, 73.0, 48.0, 37.0, 30.0, 19.0, 14.0, 5.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-3.369140625, -3.27264404296875, -3.1761474609375, -3.07965087890625, -2.983154296875, -2.88665771484375, -2.7901611328125, -2.69366455078125, -2.59716796875, -2.50067138671875, -2.4041748046875, -2.30767822265625, -2.211181640625, -2.11468505859375, -2.0181884765625, -1.92169189453125, -1.8251953125, -1.72869873046875, -1.6322021484375, -1.53570556640625, -1.439208984375, -1.34271240234375, -1.2462158203125, -1.14971923828125, -1.05322265625, -0.95672607421875, -0.8602294921875, -0.76373291015625, -0.667236328125, -0.57073974609375, -0.4742431640625, -0.37774658203125, -0.28125, -0.18475341796875, -0.0882568359375, 0.00823974609375, 0.104736328125, 0.20123291015625, 0.2977294921875, 0.39422607421875, 0.49072265625, 0.58721923828125, 0.6837158203125, 0.78021240234375, 0.876708984375, 0.97320556640625, 1.0697021484375, 1.16619873046875, 1.2626953125, 1.35919189453125, 1.4556884765625, 1.55218505859375, 1.648681640625, 1.74517822265625, 1.8416748046875, 1.93817138671875, 2.03466796875, 2.13116455078125, 2.2276611328125, 2.32415771484375, 2.420654296875, 2.51715087890625, 2.6136474609375, 2.71014404296875, 2.806640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 5.0, 4.0, 2.0, 5.0, 2.0, 8.0, 12.0, 6.0, 7.0, 10.0, 14.0, 19.0, 23.0, 24.0, 29.0, 44.0, 59.0, 77.0, 88.0, 120.0, 89.0, 80.0, 60.0, 47.0, 34.0, 17.0, 20.0, 16.0, 12.0, 8.0, 10.0, 1.0, 6.0, 7.0, 5.0, 4.0, 6.0, 6.0, 1.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8408203125, -1.782562255859375, -1.72430419921875, -1.666046142578125, -1.6077880859375, -1.549530029296875, -1.49127197265625, -1.433013916015625, -1.374755859375, -1.316497802734375, -1.25823974609375, -1.199981689453125, -1.1417236328125, -1.083465576171875, -1.02520751953125, -0.966949462890625, -0.90869140625, -0.850433349609375, -0.79217529296875, -0.733917236328125, -0.6756591796875, -0.617401123046875, -0.55914306640625, -0.500885009765625, -0.442626953125, -0.384368896484375, -0.32611083984375, -0.267852783203125, -0.2095947265625, -0.151336669921875, -0.09307861328125, -0.034820556640625, 0.0234375, 0.081695556640625, 0.13995361328125, 0.198211669921875, 0.2564697265625, 0.314727783203125, 0.37298583984375, 0.431243896484375, 0.489501953125, 0.547760009765625, 0.60601806640625, 0.664276123046875, 0.7225341796875, 0.780792236328125, 0.83905029296875, 0.897308349609375, 0.95556640625, 1.013824462890625, 1.07208251953125, 1.130340576171875, 1.1885986328125, 1.246856689453125, 1.30511474609375, 1.363372802734375, 1.421630859375, 1.479888916015625, 1.53814697265625, 1.596405029296875, 1.6546630859375, 1.712921142578125, 1.77117919921875, 1.829437255859375, 1.8876953125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 21.0, 22.0, 33.0, 72.0, 126.0, 140.0, 187.0, 171.0, 99.0, 58.0, 45.0, 11.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.832401275634766, -28.50882339477539, -27.185243606567383, -25.861665725708008, -24.5380859375, -23.214508056640625, -21.89093017578125, -20.567352294921875, -19.243772506713867, -17.920194625854492, -16.596614837646484, -15.27303695678711, -13.949458122253418, -12.625879287719727, -11.302301406860352, -9.97872257232666, -8.655143737792969, -7.331564903259277, -6.007986545562744, -4.684408187866211, -3.3608293533325195, -2.037250518798828, -0.7136721611022949, 0.6099061965942383, 1.9334850311279297, 3.257063627243042, 4.580642223358154, 5.9042205810546875, 7.227799415588379, 8.55137825012207, 9.874956130981445, 11.198534965515137, 12.522117614746094, 13.845696449279785, 15.169275283813477, 16.49285316467285, 17.81643295288086, 19.140010833740234, 20.46358871459961, 21.787166595458984, 23.110746383666992, 24.434324264526367, 25.757904052734375, 27.08148193359375, 28.405059814453125, 29.728639602661133, 31.052217483520508, 32.375797271728516, 33.69937515258789, 35.022953033447266, 36.34653091430664, 37.67011260986328, 38.993690490722656, 40.31726837158203, 41.640846252441406, 42.96442413330078, 44.288002014160156, 45.61157989501953, 46.935157775878906, 48.25873947143555, 49.58231735229492, 50.9058952331543, 52.22947311401367, 53.55305099487305, 54.87663269042969]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 6.0, 10.0, 12.0, 10.0, 13.0, 22.0, 24.0, 26.0, 24.0, 38.0, 47.0, 38.0, 37.0, 47.0, 59.0, 33.0, 39.0, 43.0, 42.0, 47.0, 60.0, 45.0, 39.0, 39.0, 34.0, 34.0, 28.0, 14.0, 15.0, 18.0, 12.0, 6.0, 5.0, 7.0, 4.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0], "bins": [-24.094623565673828, -23.49248504638672, -22.890344619750977, -22.288206100463867, -21.686065673828125, -21.083927154541016, -20.481786727905273, -19.879648208618164, -19.277507781982422, -18.675369262695312, -18.07322883605957, -17.47109031677246, -16.86894989013672, -16.26681137084961, -15.664671897888184, -15.062532424926758, -14.460393905639648, -13.858254432678223, -13.256114959716797, -12.653975486755371, -12.051836013793945, -11.449697494506836, -10.84755802154541, -10.245418548583984, -9.643279075622559, -9.041139602661133, -8.439000129699707, -7.8368611335754395, -7.234721660614014, -6.632582187652588, -6.03044319152832, -5.4283037185668945, -4.826164245605469, -4.224024772644043, -3.6218855381011963, -3.0197463035583496, -2.417606830596924, -1.815467357635498, -1.2133281230926514, -0.6111888885498047, -0.009049415588378906, 0.5930899381637573, 1.1952292919158936, 1.7973686456680298, 2.399507999420166, 3.001647472381592, 3.6037867069244385, 4.205925941467285, 4.808065414428711, 5.410204887390137, 6.0123443603515625, 6.61448335647583, 7.216622829437256, 7.818762302398682, 8.42090129852295, 9.023040771484375, 9.6251802444458, 10.227319717407227, 10.829459190368652, 11.431598663330078, 12.033737182617188, 12.63587760925293, 13.238016128540039, 13.840155601501465, 14.44229507446289]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 7.0, 4.0, 7.0, 12.0, 16.0, 20.0, 33.0, 44.0, 99.0, 200.0, 406.0, 1067.0, 3508.0, 15590.0, 152087.0, 3930342.0, 76418.0, 10250.0, 2436.0, 855.0, 364.0, 171.0, 105.0, 63.0, 54.0, 28.0, 17.0, 26.0, 7.0, 11.0, 4.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1796875, -6.88525390625, -6.5908203125, -6.29638671875, -6.001953125, -5.70751953125, -5.4130859375, -5.11865234375, -4.82421875, -4.52978515625, -4.2353515625, -3.94091796875, -3.646484375, -3.35205078125, -3.0576171875, -2.76318359375, -2.46875, -2.17431640625, -1.8798828125, -1.58544921875, -1.291015625, -0.99658203125, -0.7021484375, -0.40771484375, -0.11328125, 0.18115234375, 0.4755859375, 0.77001953125, 1.064453125, 1.35888671875, 1.6533203125, 1.94775390625, 2.2421875, 2.53662109375, 2.8310546875, 3.12548828125, 3.419921875, 3.71435546875, 4.0087890625, 4.30322265625, 4.59765625, 4.89208984375, 5.1865234375, 5.48095703125, 5.775390625, 6.06982421875, 6.3642578125, 6.65869140625, 6.953125, 7.24755859375, 7.5419921875, 7.83642578125, 8.130859375, 8.42529296875, 8.7197265625, 9.01416015625, 9.30859375, 9.60302734375, 9.8974609375, 10.19189453125, 10.486328125, 10.78076171875, 11.0751953125, 11.36962890625, 11.6640625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 7.0, 3.0, 6.0, 7.0, 11.0, 13.0, 17.0, 20.0, 33.0, 30.0, 48.0, 48.0, 66.0, 66.0, 68.0, 59.0, 77.0, 77.0, 68.0, 66.0, 50.0, 33.0, 32.0, 31.0, 24.0, 24.0, 7.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59521484375, -0.5638656616210938, -0.5325164794921875, -0.5011672973632812, -0.469818115234375, -0.43846893310546875, -0.4071197509765625, -0.37577056884765625, -0.34442138671875, -0.31307220458984375, -0.2817230224609375, -0.25037384033203125, -0.219024658203125, -0.18767547607421875, -0.1563262939453125, -0.12497711181640625, -0.0936279296875, -0.06227874755859375, -0.0309295654296875, 0.00041961669921875, 0.031768798828125, 0.06311798095703125, 0.0944671630859375, 0.12581634521484375, 0.15716552734375, 0.18851470947265625, 0.2198638916015625, 0.25121307373046875, 0.282562255859375, 0.31391143798828125, 0.3452606201171875, 0.37660980224609375, 0.407958984375, 0.43930816650390625, 0.4706573486328125, 0.5020065307617188, 0.533355712890625, 0.5647048950195312, 0.5960540771484375, 0.6274032592773438, 0.65875244140625, 0.6901016235351562, 0.7214508056640625, 0.7527999877929688, 0.784149169921875, 0.8154983520507812, 0.8468475341796875, 0.8781967163085938, 0.9095458984375, 0.9408950805664062, 0.9722442626953125, 1.0035934448242188, 1.034942626953125, 1.0662918090820312, 1.0976409912109375, 1.1289901733398438, 1.16033935546875, 1.1916885375976562, 1.2230377197265625, 1.2543869018554688, 1.285736083984375, 1.3170852661132812, 1.3484344482421875, 1.3797836303710938, 1.4111328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 8.0, 2.0, 5.0, 12.0, 10.0, 24.0, 29.0, 30.0, 54.0, 75.0, 95.0, 143.0, 238.0, 465.0, 1116.0, 2774.0, 8100.0, 29868.0, 172135.0, 3585722.0, 331938.0, 44319.0, 11015.0, 3609.0, 1260.0, 513.0, 297.0, 150.0, 75.0, 61.0, 39.0, 21.0, 22.0, 13.0, 16.0, 7.0, 7.0, 7.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66015625, -6.46783447265625, -6.2755126953125, -6.08319091796875, -5.890869140625, -5.69854736328125, -5.5062255859375, -5.31390380859375, -5.12158203125, -4.92926025390625, -4.7369384765625, -4.54461669921875, -4.352294921875, -4.15997314453125, -3.9676513671875, -3.77532958984375, -3.5830078125, -3.39068603515625, -3.1983642578125, -3.00604248046875, -2.813720703125, -2.62139892578125, -2.4290771484375, -2.23675537109375, -2.04443359375, -1.85211181640625, -1.6597900390625, -1.46746826171875, -1.275146484375, -1.08282470703125, -0.8905029296875, -0.69818115234375, -0.505859375, -0.31353759765625, -0.1212158203125, 0.07110595703125, 0.263427734375, 0.45574951171875, 0.6480712890625, 0.84039306640625, 1.03271484375, 1.22503662109375, 1.4173583984375, 1.60968017578125, 1.802001953125, 1.99432373046875, 2.1866455078125, 2.37896728515625, 2.5712890625, 2.76361083984375, 2.9559326171875, 3.14825439453125, 3.340576171875, 3.53289794921875, 3.7252197265625, 3.91754150390625, 4.10986328125, 4.30218505859375, 4.4945068359375, 4.68682861328125, 4.879150390625, 5.07147216796875, 5.2637939453125, 5.45611572265625, 5.6484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 11.0, 7.0, 14.0, 16.0, 17.0, 38.0, 52.0, 48.0, 140.0, 249.0, 821.0, 1837.0, 358.0, 186.0, 94.0, 60.0, 41.0, 28.0, 13.0, 16.0, 9.0, 4.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.615234375, -2.5517578125, -2.48828125, -2.4248046875, -2.361328125, -2.2978515625, -2.234375, -2.1708984375, -2.107421875, -2.0439453125, -1.98046875, -1.9169921875, -1.853515625, -1.7900390625, -1.7265625, -1.6630859375, -1.599609375, -1.5361328125, -1.47265625, -1.4091796875, -1.345703125, -1.2822265625, -1.21875, -1.1552734375, -1.091796875, -1.0283203125, -0.96484375, -0.9013671875, -0.837890625, -0.7744140625, -0.7109375, -0.6474609375, -0.583984375, -0.5205078125, -0.45703125, -0.3935546875, -0.330078125, -0.2666015625, -0.203125, -0.1396484375, -0.076171875, -0.0126953125, 0.05078125, 0.1142578125, 0.177734375, 0.2412109375, 0.3046875, 0.3681640625, 0.431640625, 0.4951171875, 0.55859375, 0.6220703125, 0.685546875, 0.7490234375, 0.8125, 0.8759765625, 0.939453125, 1.0029296875, 1.06640625, 1.1298828125, 1.193359375, 1.2568359375, 1.3203125, 1.3837890625, 1.447265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 18.0, 45.0, 71.0, 95.0, 131.0, 151.0, 151.0, 116.0, 79.0, 65.0, 37.0, 20.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.044439315795898, -9.604722023010254, -9.16500473022461, -8.725286483764648, -8.285569190979004, -7.845851898193359, -7.406134605407715, -6.966416835784912, -6.526699066162109, -6.086981773376465, -5.647264003753662, -5.207546710968018, -4.767828941345215, -4.32811164855957, -3.8883941173553467, -3.448676586151123, -3.0089592933654785, -2.569241762161255, -2.1295242309570312, -1.6898068189620972, -1.2500892877578735, -0.8103718757629395, -0.3706543445587158, 0.06906318664550781, 0.5087807178497314, 0.9484982490539551, 1.3882157802581787, 1.8279331922531128, 2.267650604248047, 2.7073681354522705, 3.147085666656494, 3.5868031978607178, 4.026520729064941, 4.466238021850586, 4.905955791473389, 5.345673084259033, 5.785390853881836, 6.2251081466674805, 6.664825439453125, 7.104543209075928, 7.5442609786987305, 7.983978271484375, 8.42369556427002, 8.86341381072998, 9.303131103515625, 9.74284839630127, 10.182565689086914, 10.622283935546875, 11.062000274658203, 11.501717567443848, 11.941434860229492, 12.381153106689453, 12.820870399475098, 13.260587692260742, 13.700304985046387, 14.140022277832031, 14.579740524291992, 15.019457817077637, 15.459175109863281, 15.898893356323242, 16.33860969543457, 16.77832794189453, 17.218046188354492, 17.65776252746582, 18.09748077392578]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 4.0, 6.0, 4.0, 8.0, 11.0, 16.0, 23.0, 18.0, 30.0, 37.0, 25.0, 24.0, 31.0, 34.0, 38.0, 40.0, 45.0, 36.0, 47.0, 41.0, 37.0, 33.0, 37.0, 43.0, 33.0, 41.0, 45.0, 31.0, 26.0, 20.0, 23.0, 20.0, 17.0, 12.0, 9.0, 11.0, 8.0, 8.0, 4.0, 3.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.109746932983398, -4.942172527313232, -4.774598598480225, -4.607024192810059, -4.439450263977051, -4.271875858306885, -4.104301452636719, -3.936727523803711, -3.769153118133545, -3.601578950881958, -3.434004783630371, -3.266430377960205, -3.098856210708618, -2.9312820434570312, -2.7637078762054443, -2.5961337089538574, -2.4285595417022705, -2.2609853744506836, -2.0934112071990967, -1.9258369207382202, -1.7582626342773438, -1.5906884670257568, -1.42311429977417, -1.2555400133132935, -1.0879658460617065, -0.9203916192054749, -0.7528173923492432, -0.5852432250976562, -0.41766899824142456, -0.25009477138519287, -0.08252060413360596, 0.08505368232727051, 0.2526278495788574, 0.4202020764350891, 0.5877763032913208, 0.7553504705429077, 0.9229246973991394, 1.090498924255371, 1.258073091506958, 1.4256473779678345, 1.5932215452194214, 1.7607957124710083, 1.9283699989318848, 2.0959441661834717, 2.2635183334350586, 2.4310927391052246, 2.5986666679382324, 2.7662410736083984, 2.9338152408599854, 3.1013894081115723, 3.268963575363159, 3.436537742614746, 3.604112148284912, 3.771686315536499, 3.939260482788086, 4.106834888458252, 4.27440881729126, 4.441983222961426, 4.609557151794434, 4.7771315574646, 4.944705486297607, 5.112279891967773, 5.279853820800781, 5.447428226470947, 5.615002632141113]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 4.0, 11.0, 15.0, 21.0, 35.0, 51.0, 73.0, 152.0, 275.0, 564.0, 1299.0, 3258.0, 9106.0, 28616.0, 94507.0, 302541.0, 405220.0, 139947.0, 42006.0, 13054.0, 4493.0, 1740.0, 750.0, 303.0, 190.0, 106.0, 65.0, 44.0, 29.0, 17.0, 16.0, 11.0, 8.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.08984375, -5.92144775390625, -5.7530517578125, -5.58465576171875, -5.416259765625, -5.24786376953125, -5.0794677734375, -4.91107177734375, -4.74267578125, -4.57427978515625, -4.4058837890625, -4.23748779296875, -4.069091796875, -3.90069580078125, -3.7322998046875, -3.56390380859375, -3.3955078125, -3.22711181640625, -3.0587158203125, -2.89031982421875, -2.721923828125, -2.55352783203125, -2.3851318359375, -2.21673583984375, -2.04833984375, -1.87994384765625, -1.7115478515625, -1.54315185546875, -1.374755859375, -1.20635986328125, -1.0379638671875, -0.86956787109375, -0.701171875, -0.53277587890625, -0.3643798828125, -0.19598388671875, -0.027587890625, 0.14080810546875, 0.3092041015625, 0.47760009765625, 0.64599609375, 0.81439208984375, 0.9827880859375, 1.15118408203125, 1.319580078125, 1.48797607421875, 1.6563720703125, 1.82476806640625, 1.9931640625, 2.16156005859375, 2.3299560546875, 2.49835205078125, 2.666748046875, 2.83514404296875, 3.0035400390625, 3.17193603515625, 3.34033203125, 3.50872802734375, 3.6771240234375, 3.84552001953125, 4.013916015625, 4.18231201171875, 4.3507080078125, 4.51910400390625, 4.6875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 11.0, 14.0, 14.0, 17.0, 23.0, 29.0, 26.0, 33.0, 54.0, 56.0, 53.0, 63.0, 65.0, 69.0, 74.0, 69.0, 63.0, 55.0, 42.0, 47.0, 30.0, 26.0, 25.0, 20.0, 8.0, 7.0, 4.0, 1.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.626953125, -0.595062255859375, -0.56317138671875, -0.531280517578125, -0.4993896484375, -0.467498779296875, -0.43560791015625, -0.403717041015625, -0.371826171875, -0.339935302734375, -0.30804443359375, -0.276153564453125, -0.2442626953125, -0.212371826171875, -0.18048095703125, -0.148590087890625, -0.11669921875, -0.084808349609375, -0.05291748046875, -0.021026611328125, 0.0108642578125, 0.042755126953125, 0.07464599609375, 0.106536865234375, 0.138427734375, 0.170318603515625, 0.20220947265625, 0.234100341796875, 0.2659912109375, 0.297882080078125, 0.32977294921875, 0.361663818359375, 0.3935546875, 0.425445556640625, 0.45733642578125, 0.489227294921875, 0.5211181640625, 0.553009033203125, 0.58489990234375, 0.616790771484375, 0.648681640625, 0.680572509765625, 0.71246337890625, 0.744354248046875, 0.7762451171875, 0.808135986328125, 0.84002685546875, 0.871917724609375, 0.90380859375, 0.935699462890625, 0.96759033203125, 0.999481201171875, 1.0313720703125, 1.063262939453125, 1.09515380859375, 1.127044677734375, 1.158935546875, 1.190826416015625, 1.22271728515625, 1.254608154296875, 1.2864990234375, 1.318389892578125, 1.35028076171875, 1.382171630859375, 1.4140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 8.0, 17.0, 10.0, 20.0, 23.0, 47.0, 56.0, 69.0, 98.0, 152.0, 260.0, 385.0, 608.0, 1187.0, 2465.0, 5921.0, 16826.0, 50586.0, 159782.0, 414898.0, 264254.0, 86677.0, 27442.0, 9594.0, 3535.0, 1602.0, 766.0, 421.0, 256.0, 199.0, 133.0, 62.0, 53.0, 38.0, 24.0, 19.0, 26.0, 16.0, 7.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6796875, -3.555908203125, -3.43212890625, -3.308349609375, -3.1845703125, -3.060791015625, -2.93701171875, -2.813232421875, -2.689453125, -2.565673828125, -2.44189453125, -2.318115234375, -2.1943359375, -2.070556640625, -1.94677734375, -1.822998046875, -1.69921875, -1.575439453125, -1.45166015625, -1.327880859375, -1.2041015625, -1.080322265625, -0.95654296875, -0.832763671875, -0.708984375, -0.585205078125, -0.46142578125, -0.337646484375, -0.2138671875, -0.090087890625, 0.03369140625, 0.157470703125, 0.28125, 0.405029296875, 0.52880859375, 0.652587890625, 0.7763671875, 0.900146484375, 1.02392578125, 1.147705078125, 1.271484375, 1.395263671875, 1.51904296875, 1.642822265625, 1.7666015625, 1.890380859375, 2.01416015625, 2.137939453125, 2.26171875, 2.385498046875, 2.50927734375, 2.633056640625, 2.7568359375, 2.880615234375, 3.00439453125, 3.128173828125, 3.251953125, 3.375732421875, 3.49951171875, 3.623291015625, 3.7470703125, 3.870849609375, 3.99462890625, 4.118408203125, 4.2421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 4.0, 7.0, 5.0, 9.0, 5.0, 7.0, 13.0, 24.0, 23.0, 22.0, 27.0, 43.0, 36.0, 26.0, 31.0, 44.0, 39.0, 52.0, 59.0, 44.0, 44.0, 41.0, 43.0, 44.0, 43.0, 41.0, 39.0, 34.0, 28.0, 19.0, 16.0, 19.0, 14.0, 10.0, 12.0, 10.0, 4.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.927734375, -3.819183349609375, -3.71063232421875, -3.602081298828125, -3.4935302734375, -3.384979248046875, -3.27642822265625, -3.167877197265625, -3.059326171875, -2.950775146484375, -2.84222412109375, -2.733673095703125, -2.6251220703125, -2.516571044921875, -2.40802001953125, -2.299468994140625, -2.19091796875, -2.082366943359375, -1.97381591796875, -1.865264892578125, -1.7567138671875, -1.648162841796875, -1.53961181640625, -1.431060791015625, -1.322509765625, -1.213958740234375, -1.10540771484375, -0.996856689453125, -0.8883056640625, -0.779754638671875, -0.67120361328125, -0.562652587890625, -0.4541015625, -0.345550537109375, -0.23699951171875, -0.128448486328125, -0.0198974609375, 0.088653564453125, 0.19720458984375, 0.305755615234375, 0.414306640625, 0.522857666015625, 0.63140869140625, 0.739959716796875, 0.8485107421875, 0.957061767578125, 1.06561279296875, 1.174163818359375, 1.28271484375, 1.391265869140625, 1.49981689453125, 1.608367919921875, 1.7169189453125, 1.825469970703125, 1.93402099609375, 2.042572021484375, 2.151123046875, 2.259674072265625, 2.36822509765625, 2.476776123046875, 2.5853271484375, 2.693878173828125, 2.80242919921875, 2.910980224609375, 3.01953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 5.0, 3.0, 11.0, 13.0, 13.0, 20.0, 37.0, 50.0, 78.0, 126.0, 201.0, 327.0, 772.0, 1712.0, 4742.0, 25781.0, 831392.0, 167607.0, 10423.0, 2821.0, 1154.0, 508.0, 286.0, 156.0, 94.0, 59.0, 49.0, 28.0, 20.0, 20.0, 13.0, 7.0, 6.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0], "bins": [-11.6015625, -11.3238525390625, -11.046142578125, -10.7684326171875, -10.49072265625, -10.2130126953125, -9.935302734375, -9.6575927734375, -9.3798828125, -9.1021728515625, -8.824462890625, -8.5467529296875, -8.26904296875, -7.9913330078125, -7.713623046875, -7.4359130859375, -7.158203125, -6.8804931640625, -6.602783203125, -6.3250732421875, -6.04736328125, -5.7696533203125, -5.491943359375, -5.2142333984375, -4.9365234375, -4.6588134765625, -4.381103515625, -4.1033935546875, -3.82568359375, -3.5479736328125, -3.270263671875, -2.9925537109375, -2.71484375, -2.4371337890625, -2.159423828125, -1.8817138671875, -1.60400390625, -1.3262939453125, -1.048583984375, -0.7708740234375, -0.4931640625, -0.2154541015625, 0.062255859375, 0.3399658203125, 0.61767578125, 0.8953857421875, 1.173095703125, 1.4508056640625, 1.728515625, 2.0062255859375, 2.283935546875, 2.5616455078125, 2.83935546875, 3.1170654296875, 3.394775390625, 3.6724853515625, 3.9501953125, 4.2279052734375, 4.505615234375, 4.7833251953125, 5.06103515625, 5.3387451171875, 5.616455078125, 5.8941650390625, 6.171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 3.0, 3.0, 5.0, 8.0, 12.0, 12.0, 22.0, 25.0, 41.0, 72.0, 91.0, 147.0, 183.0, 114.0, 78.0, 60.0, 31.0, 19.0, 10.0, 15.0, 8.0, 7.0, 6.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0010347366333007812, -0.0010084658861160278, -0.0009821951389312744, -0.000955924391746521, -0.0009296536445617676, -0.0009033828973770142, -0.0008771121501922607, -0.0008508414030075073, -0.0008245706558227539, -0.0007982999086380005, -0.0007720291614532471, -0.0007457584142684937, -0.0007194876670837402, -0.0006932169198989868, -0.0006669461727142334, -0.00064067542552948, -0.0006144046783447266, -0.0005881339311599731, -0.0005618631839752197, -0.0005355924367904663, -0.0005093216896057129, -0.00048305094242095947, -0.00045678019523620605, -0.00043050944805145264, -0.0004042387008666992, -0.0003779679536819458, -0.0003516972064971924, -0.00032542645931243896, -0.00029915571212768555, -0.00027288496494293213, -0.0002466142177581787, -0.0002203434705734253, -0.00019407272338867188, -0.00016780197620391846, -0.00014153122901916504, -0.00011526048183441162, -8.89897346496582e-05, -6.271898746490479e-05, -3.644824028015137e-05, -1.017749309539795e-05, 1.609325408935547e-05, 4.236400127410889e-05, 6.86347484588623e-05, 9.490549564361572e-05, 0.00012117624282836914, 0.00014744699001312256, 0.00017371773719787598, 0.0001999884843826294, 0.0002262592315673828, 0.00025252997875213623, 0.00027880072593688965, 0.00030507147312164307, 0.0003313422203063965, 0.0003576129674911499, 0.0003838837146759033, 0.00041015446186065674, 0.00043642520904541016, 0.0004626959562301636, 0.000488966703414917, 0.0005152374505996704, 0.0005415081977844238, 0.0005677789449691772, 0.0005940496921539307, 0.0006203204393386841, 0.0006465911865234375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 12.0, 9.0, 11.0, 15.0, 20.0, 36.0, 48.0, 57.0, 107.0, 175.0, 234.0, 437.0, 716.0, 1209.0, 2188.0, 4555.0, 11874.0, 47836.0, 595601.0, 332736.0, 32785.0, 9409.0, 3894.0, 1891.0, 1067.0, 614.0, 364.0, 234.0, 141.0, 91.0, 50.0, 42.0, 26.0, 24.0, 11.0, 11.0, 8.0, 9.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.61749267578125, -4.4576416015625, -4.29779052734375, -4.137939453125, -3.97808837890625, -3.8182373046875, -3.65838623046875, -3.49853515625, -3.33868408203125, -3.1788330078125, -3.01898193359375, -2.859130859375, -2.69927978515625, -2.5394287109375, -2.37957763671875, -2.2197265625, -2.05987548828125, -1.9000244140625, -1.74017333984375, -1.580322265625, -1.42047119140625, -1.2606201171875, -1.10076904296875, -0.94091796875, -0.78106689453125, -0.6212158203125, -0.46136474609375, -0.301513671875, -0.14166259765625, 0.0181884765625, 0.17803955078125, 0.337890625, 0.49774169921875, 0.6575927734375, 0.81744384765625, 0.977294921875, 1.13714599609375, 1.2969970703125, 1.45684814453125, 1.61669921875, 1.77655029296875, 1.9364013671875, 2.09625244140625, 2.256103515625, 2.41595458984375, 2.5758056640625, 2.73565673828125, 2.8955078125, 3.05535888671875, 3.2152099609375, 3.37506103515625, 3.534912109375, 3.69476318359375, 3.8546142578125, 4.01446533203125, 4.17431640625, 4.33416748046875, 4.4940185546875, 4.65386962890625, 4.813720703125, 4.97357177734375, 5.1334228515625, 5.29327392578125, 5.453125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 3.0, 5.0, 7.0, 13.0, 16.0, 31.0, 39.0, 87.0, 142.0, 219.0, 175.0, 109.0, 65.0, 25.0, 11.0, 10.0, 7.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.51953125, -4.381103515625, -4.24267578125, -4.104248046875, -3.9658203125, -3.827392578125, -3.68896484375, -3.550537109375, -3.412109375, -3.273681640625, -3.13525390625, -2.996826171875, -2.8583984375, -2.719970703125, -2.58154296875, -2.443115234375, -2.3046875, -2.166259765625, -2.02783203125, -1.889404296875, -1.7509765625, -1.612548828125, -1.47412109375, -1.335693359375, -1.197265625, -1.058837890625, -0.92041015625, -0.781982421875, -0.6435546875, -0.505126953125, -0.36669921875, -0.228271484375, -0.08984375, 0.048583984375, 0.18701171875, 0.325439453125, 0.4638671875, 0.602294921875, 0.74072265625, 0.879150390625, 1.017578125, 1.156005859375, 1.29443359375, 1.432861328125, 1.5712890625, 1.709716796875, 1.84814453125, 1.986572265625, 2.125, 2.263427734375, 2.40185546875, 2.540283203125, 2.6787109375, 2.817138671875, 2.95556640625, 3.093994140625, 3.232421875, 3.370849609375, 3.50927734375, 3.647705078125, 3.7861328125, 3.924560546875, 4.06298828125, 4.201416015625, 4.33984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 8.0, 23.0, 34.0, 30.0, 57.0, 81.0, 108.0, 100.0, 122.0, 127.0, 85.0, 65.0, 51.0, 42.0, 28.0, 16.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-31.422992706298828, -30.345224380493164, -29.2674560546875, -28.189685821533203, -27.11191749572754, -26.034149169921875, -24.956378936767578, -23.878610610961914, -22.80084228515625, -21.723073959350586, -20.645305633544922, -19.567535400390625, -18.48976707458496, -17.411998748779297, -16.334228515625, -15.256460189819336, -14.178691864013672, -13.100923538208008, -12.023154258728027, -10.945384979248047, -9.867616653442383, -8.789848327636719, -7.712079048156738, -6.634310245513916, -5.556541442871094, -4.4787726402282715, -3.401003837585449, -2.323235034942627, -1.2454662322998047, -0.16769742965698242, 0.9100713729858398, 1.987840175628662, 3.06561279296875, 4.143381595611572, 5.2211503982543945, 6.298919200897217, 7.376688003540039, 8.454456329345703, 9.532225608825684, 10.609994888305664, 11.687763214111328, 12.765531539916992, 13.843300819396973, 14.921070098876953, 15.998838424682617, 17.07660675048828, 18.154376983642578, 19.232145309448242, 20.309913635253906, 21.38768196105957, 22.465450286865234, 23.54322052001953, 24.620988845825195, 25.69875717163086, 26.776527404785156, 27.85429573059082, 28.932064056396484, 30.00983238220215, 31.087600708007812, 32.16537094116211, 33.243141174316406, 34.32090759277344, 35.398677825927734, 36.476444244384766, 37.55421447753906]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 6.0, 4.0, 9.0, 13.0, 11.0, 13.0, 17.0, 19.0, 18.0, 23.0, 26.0, 28.0, 35.0, 21.0, 43.0, 39.0, 35.0, 41.0, 41.0, 43.0, 47.0, 36.0, 52.0, 40.0, 42.0, 35.0, 34.0, 29.0, 26.0, 20.0, 23.0, 18.0, 14.0, 11.0, 10.0, 11.0, 10.0, 10.0, 8.0, 9.0, 7.0, 6.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.867626190185547, -18.272266387939453, -17.676908493041992, -17.0815486907959, -16.486188888549805, -15.890830039978027, -15.29547119140625, -14.700111389160156, -14.104751586914062, -13.509392738342285, -12.914032936096191, -12.318674087524414, -11.72331428527832, -11.127955436706543, -10.532596588134766, -9.937236785888672, -9.341877937316895, -8.746519088745117, -8.151159286499023, -7.555800437927246, -6.960440635681152, -6.365081787109375, -5.7697224617004395, -5.174363136291504, -4.579003810882568, -3.983644485473633, -3.3882851600646973, -2.792926073074341, -2.1975667476654053, -1.6022074222564697, -1.0068483352661133, -0.41148900985717773, 0.1838703155517578, 0.7792295813560486, 1.3745888471603394, 1.9699480533599854, 2.565307378768921, 3.1606667041778564, 3.756025791168213, 4.351385116577148, 4.946744441986084, 5.5421037673950195, 6.137463092803955, 6.732822418212891, 7.328181266784668, 7.923541069030762, 8.518899917602539, 9.114259719848633, 9.70961856842041, 10.304977416992188, 10.900337219238281, 11.495696067810059, 12.091055870056152, 12.68641471862793, 13.281774520874023, 13.8771333694458, 14.472492218017578, 15.067851066589355, 15.66321086883545, 16.258569717407227, 16.85392951965332, 17.449289321899414, 18.044647216796875, 18.64000701904297, 19.235366821289062]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 14.0, 25.0, 44.0, 63.0, 133.0, 286.0, 702.0, 1842.0, 5553.0, 21098.0, 100660.0, 3020652.0, 942304.0, 75911.0, 17062.0, 4801.0, 1621.0, 652.0, 333.0, 181.0, 112.0, 65.0, 41.0, 27.0, 22.0, 12.0, 17.0, 10.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.721405029296875, -3.53460693359375, -3.347808837890625, -3.1610107421875, -2.974212646484375, -2.78741455078125, -2.600616455078125, -2.413818359375, -2.227020263671875, -2.04022216796875, -1.853424072265625, -1.6666259765625, -1.479827880859375, -1.29302978515625, -1.106231689453125, -0.91943359375, -0.732635498046875, -0.54583740234375, -0.359039306640625, -0.1722412109375, 0.014556884765625, 0.20135498046875, 0.388153076171875, 0.574951171875, 0.761749267578125, 0.94854736328125, 1.135345458984375, 1.3221435546875, 1.508941650390625, 1.69573974609375, 1.882537841796875, 2.0693359375, 2.256134033203125, 2.44293212890625, 2.629730224609375, 2.8165283203125, 3.003326416015625, 3.19012451171875, 3.376922607421875, 3.563720703125, 3.750518798828125, 3.93731689453125, 4.124114990234375, 4.3109130859375, 4.497711181640625, 4.68450927734375, 4.871307373046875, 5.05810546875, 5.244903564453125, 5.43170166015625, 5.618499755859375, 5.8052978515625, 5.992095947265625, 6.17889404296875, 6.365692138671875, 6.552490234375, 6.739288330078125, 6.92608642578125, 7.112884521484375, 7.2996826171875, 7.486480712890625, 7.67327880859375, 7.860076904296875, 8.046875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 11.0, 11.0, 8.0, 19.0, 29.0, 26.0, 27.0, 32.0, 42.0, 51.0, 56.0, 55.0, 55.0, 63.0, 66.0, 54.0, 46.0, 58.0, 38.0, 49.0, 44.0, 43.0, 28.0, 22.0, 18.0, 11.0, 17.0, 8.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80419921875, -0.7748031616210938, -0.7454071044921875, -0.7160110473632812, -0.686614990234375, -0.6572189331054688, -0.6278228759765625, -0.5984268188476562, -0.56903076171875, -0.5396347045898438, -0.5102386474609375, -0.48084259033203125, -0.451446533203125, -0.42205047607421875, -0.3926544189453125, -0.36325836181640625, -0.3338623046875, -0.30446624755859375, -0.2750701904296875, -0.24567413330078125, -0.216278076171875, -0.18688201904296875, -0.1574859619140625, -0.12808990478515625, -0.09869384765625, -0.06929779052734375, -0.0399017333984375, -0.01050567626953125, 0.018890380859375, 0.04828643798828125, 0.0776824951171875, 0.10707855224609375, 0.136474609375, 0.16587066650390625, 0.1952667236328125, 0.22466278076171875, 0.254058837890625, 0.28345489501953125, 0.3128509521484375, 0.34224700927734375, 0.37164306640625, 0.40103912353515625, 0.4304351806640625, 0.45983123779296875, 0.489227294921875, 0.5186233520507812, 0.5480194091796875, 0.5774154663085938, 0.6068115234375, 0.6362075805664062, 0.6656036376953125, 0.6949996948242188, 0.724395751953125, 0.7537918090820312, 0.7831878662109375, 0.8125839233398438, 0.84197998046875, 0.8713760375976562, 0.9007720947265625, 0.9301681518554688, 0.959564208984375, 0.9889602661132812, 1.0183563232421875, 1.0477523803710938, 1.0771484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 4.0, 4.0, 21.0, 33.0, 61.0, 134.0, 256.0, 612.0, 1718.0, 5785.0, 24779.0, 168973.0, 3541064.0, 396524.0, 41360.0, 8849.0, 2454.0, 937.0, 379.0, 177.0, 66.0, 38.0, 14.0, 11.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.25, -7.02099609375, -6.7919921875, -6.56298828125, -6.333984375, -6.10498046875, -5.8759765625, -5.64697265625, -5.41796875, -5.18896484375, -4.9599609375, -4.73095703125, -4.501953125, -4.27294921875, -4.0439453125, -3.81494140625, -3.5859375, -3.35693359375, -3.1279296875, -2.89892578125, -2.669921875, -2.44091796875, -2.2119140625, -1.98291015625, -1.75390625, -1.52490234375, -1.2958984375, -1.06689453125, -0.837890625, -0.60888671875, -0.3798828125, -0.15087890625, 0.078125, 0.30712890625, 0.5361328125, 0.76513671875, 0.994140625, 1.22314453125, 1.4521484375, 1.68115234375, 1.91015625, 2.13916015625, 2.3681640625, 2.59716796875, 2.826171875, 3.05517578125, 3.2841796875, 3.51318359375, 3.7421875, 3.97119140625, 4.2001953125, 4.42919921875, 4.658203125, 4.88720703125, 5.1162109375, 5.34521484375, 5.57421875, 5.80322265625, 6.0322265625, 6.26123046875, 6.490234375, 6.71923828125, 6.9482421875, 7.17724609375, 7.40625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 7.0, 12.0, 14.0, 18.0, 17.0, 33.0, 40.0, 51.0, 96.0, 163.0, 238.0, 481.0, 1524.0, 591.0, 319.0, 158.0, 95.0, 55.0, 35.0, 33.0, 22.0, 12.0, 16.0, 10.0, 10.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.990234375, -1.923065185546875, -1.85589599609375, -1.788726806640625, -1.7215576171875, -1.654388427734375, -1.58721923828125, -1.520050048828125, -1.452880859375, -1.385711669921875, -1.31854248046875, -1.251373291015625, -1.1842041015625, -1.117034912109375, -1.04986572265625, -0.982696533203125, -0.91552734375, -0.848358154296875, -0.78118896484375, -0.714019775390625, -0.6468505859375, -0.579681396484375, -0.51251220703125, -0.445343017578125, -0.378173828125, -0.311004638671875, -0.24383544921875, -0.176666259765625, -0.1094970703125, -0.042327880859375, 0.02484130859375, 0.092010498046875, 0.1591796875, 0.226348876953125, 0.29351806640625, 0.360687255859375, 0.4278564453125, 0.495025634765625, 0.56219482421875, 0.629364013671875, 0.696533203125, 0.763702392578125, 0.83087158203125, 0.898040771484375, 0.9652099609375, 1.032379150390625, 1.09954833984375, 1.166717529296875, 1.23388671875, 1.301055908203125, 1.36822509765625, 1.435394287109375, 1.5025634765625, 1.569732666015625, 1.63690185546875, 1.704071044921875, 1.771240234375, 1.838409423828125, 1.90557861328125, 1.972747802734375, 2.0399169921875, 2.107086181640625, 2.17425537109375, 2.241424560546875, 2.30859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 8.0, 44.0, 148.0, 281.0, 306.0, 165.0, 48.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.93492126464844, -64.61772918701172, -63.300537109375, -61.98334503173828, -60.66615295410156, -59.348960876464844, -58.031768798828125, -56.714576721191406, -55.39738464355469, -54.08019256591797, -52.76300048828125, -51.44580841064453, -50.12861633300781, -48.811424255371094, -47.494232177734375, -46.177040100097656, -44.85984802246094, -43.54265594482422, -42.2254638671875, -40.90827178955078, -39.59107971191406, -38.273887634277344, -36.956695556640625, -35.639503479003906, -34.32231521606445, -33.005123138427734, -31.687931060791016, -30.370738983154297, -29.053546905517578, -27.73635482788086, -26.41916275024414, -25.101970672607422, -23.784780502319336, -22.467588424682617, -21.1503963470459, -19.83320426940918, -18.51601219177246, -17.198820114135742, -15.88162899017334, -14.564436912536621, -13.247244834899902, -11.930052757263184, -10.612860679626465, -9.295669555664062, -7.9784770011901855, -6.661284923553467, -5.344093322753906, -4.0269012451171875, -2.7097091674804688, -1.3925172090530396, -0.07532525062561035, 1.2418665885925293, 2.559058666229248, 3.876250743865967, 5.193442344665527, 6.510634422302246, 7.827826499938965, 9.145018577575684, 10.462210655212402, 11.779401779174805, 13.096593856811523, 14.413785934448242, 15.730978012084961, 17.04817008972168, 18.3653621673584]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 6.0, 13.0, 8.0, 10.0, 4.0, 14.0, 22.0, 15.0, 17.0, 28.0, 39.0, 20.0, 43.0, 39.0, 38.0, 45.0, 45.0, 47.0, 34.0, 36.0, 50.0, 40.0, 36.0, 49.0, 37.0, 31.0, 28.0, 20.0, 30.0, 20.0, 19.0, 24.0, 12.0, 8.0, 9.0, 11.0, 8.0, 3.0, 7.0, 4.0, 7.0, 5.0, 3.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.958847999572754, -6.753422737121582, -6.54799747467041, -6.3425726890563965, -6.137147426605225, -5.931722164154053, -5.726297378540039, -5.520872116088867, -5.315446853637695, -5.110021591186523, -4.904596328735352, -4.699171543121338, -4.493746280670166, -4.288321018218994, -4.0828962326049805, -3.8774709701538086, -3.6720457077026367, -3.466620445251465, -3.261195421218872, -3.0557703971862793, -2.8503451347351074, -2.6449198722839355, -2.4394948482513428, -2.23406982421875, -2.028644561767578, -1.8232194185256958, -1.6177942752838135, -1.4123691320419312, -1.2069439888000488, -1.0015188455581665, -0.7960937023162842, -0.5906685590744019, -0.38524341583251953, -0.1798182725906372, 0.025606870651245117, 0.23103201389312744, 0.43645715713500977, 0.6418823003768921, 0.8473074436187744, 1.0527325868606567, 1.258157730102539, 1.4635828733444214, 1.6690080165863037, 1.874433159828186, 2.0798583030700684, 2.2852835655212402, 2.490708589553833, 2.696133613586426, 2.9015588760375977, 3.1069841384887695, 3.3124091625213623, 3.517834186553955, 3.723259449005127, 3.928684711456299, 4.1341094970703125, 4.339534759521484, 4.544960021972656, 4.750385284423828, 4.955810546875, 5.161235332489014, 5.3666605949401855, 5.572085857391357, 5.777510643005371, 5.982935905456543, 6.188361167907715]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 8.0, 4.0, 15.0, 27.0, 35.0, 58.0, 81.0, 175.0, 327.0, 589.0, 1157.0, 2441.0, 5195.0, 11261.0, 26068.0, 65384.0, 211557.0, 485579.0, 148978.0, 51291.0, 20865.0, 9091.0, 4203.0, 1952.0, 1012.0, 528.0, 268.0, 166.0, 97.0, 46.0, 33.0, 29.0, 13.0, 8.0, 9.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.509765625, -3.376678466796875, -3.24359130859375, -3.110504150390625, -2.9774169921875, -2.844329833984375, -2.71124267578125, -2.578155517578125, -2.445068359375, -2.311981201171875, -2.17889404296875, -2.045806884765625, -1.9127197265625, -1.779632568359375, -1.64654541015625, -1.513458251953125, -1.38037109375, -1.247283935546875, -1.11419677734375, -0.981109619140625, -0.8480224609375, -0.714935302734375, -0.58184814453125, -0.448760986328125, -0.315673828125, -0.182586669921875, -0.04949951171875, 0.083587646484375, 0.2166748046875, 0.349761962890625, 0.48284912109375, 0.615936279296875, 0.7490234375, 0.882110595703125, 1.01519775390625, 1.148284912109375, 1.2813720703125, 1.414459228515625, 1.54754638671875, 1.680633544921875, 1.813720703125, 1.946807861328125, 2.07989501953125, 2.212982177734375, 2.3460693359375, 2.479156494140625, 2.61224365234375, 2.745330810546875, 2.87841796875, 3.011505126953125, 3.14459228515625, 3.277679443359375, 3.4107666015625, 3.543853759765625, 3.67694091796875, 3.810028076171875, 3.943115234375, 4.076202392578125, 4.20928955078125, 4.342376708984375, 4.4754638671875, 4.608551025390625, 4.74163818359375, 4.874725341796875, 5.0078125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 10.0, 5.0, 2.0, 9.0, 16.0, 14.0, 24.0, 22.0, 24.0, 34.0, 41.0, 18.0, 40.0, 40.0, 36.0, 55.0, 51.0, 49.0, 41.0, 49.0, 46.0, 47.0, 51.0, 37.0, 34.0, 42.0, 37.0, 21.0, 27.0, 22.0, 12.0, 12.0, 8.0, 8.0, 7.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.62939453125, -0.6044387817382812, -0.5794830322265625, -0.5545272827148438, -0.529571533203125, -0.5046157836914062, -0.4796600341796875, -0.45470428466796875, -0.42974853515625, -0.40479278564453125, -0.3798370361328125, -0.35488128662109375, -0.329925537109375, -0.30496978759765625, -0.2800140380859375, -0.25505828857421875, -0.2301025390625, -0.20514678955078125, -0.1801910400390625, -0.15523529052734375, -0.130279541015625, -0.10532379150390625, -0.0803680419921875, -0.05541229248046875, -0.03045654296875, -0.00550079345703125, 0.0194549560546875, 0.04441070556640625, 0.069366455078125, 0.09432220458984375, 0.1192779541015625, 0.14423370361328125, 0.169189453125, 0.19414520263671875, 0.2191009521484375, 0.24405670166015625, 0.269012451171875, 0.29396820068359375, 0.3189239501953125, 0.34387969970703125, 0.36883544921875, 0.39379119873046875, 0.4187469482421875, 0.44370269775390625, 0.468658447265625, 0.49361419677734375, 0.5185699462890625, 0.5435256958007812, 0.5684814453125, 0.5934371948242188, 0.6183929443359375, 0.6433486938476562, 0.668304443359375, 0.6932601928710938, 0.7182159423828125, 0.7431716918945312, 0.76812744140625, 0.7930831909179688, 0.8180389404296875, 0.8429946899414062, 0.867950439453125, 0.8929061889648438, 0.9178619384765625, 0.9428176879882812, 0.9677734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 10.0, 19.0, 9.0, 22.0, 35.0, 62.0, 65.0, 117.0, 161.0, 290.0, 523.0, 1075.0, 2340.0, 6616.0, 23202.0, 95501.0, 599074.0, 252307.0, 47501.0, 12445.0, 3920.0, 1533.0, 717.0, 336.0, 231.0, 137.0, 73.0, 77.0, 46.0, 30.0, 19.0, 14.0, 13.0, 11.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19921875, -5.03021240234375, -4.8612060546875, -4.69219970703125, -4.523193359375, -4.35418701171875, -4.1851806640625, -4.01617431640625, -3.84716796875, -3.67816162109375, -3.5091552734375, -3.34014892578125, -3.171142578125, -3.00213623046875, -2.8331298828125, -2.66412353515625, -2.4951171875, -2.32611083984375, -2.1571044921875, -1.98809814453125, -1.819091796875, -1.65008544921875, -1.4810791015625, -1.31207275390625, -1.14306640625, -0.97406005859375, -0.8050537109375, -0.63604736328125, -0.467041015625, -0.29803466796875, -0.1290283203125, 0.03997802734375, 0.208984375, 0.37799072265625, 0.5469970703125, 0.71600341796875, 0.885009765625, 1.05401611328125, 1.2230224609375, 1.39202880859375, 1.56103515625, 1.73004150390625, 1.8990478515625, 2.06805419921875, 2.237060546875, 2.40606689453125, 2.5750732421875, 2.74407958984375, 2.9130859375, 3.08209228515625, 3.2510986328125, 3.42010498046875, 3.589111328125, 3.75811767578125, 3.9271240234375, 4.09613037109375, 4.26513671875, 4.43414306640625, 4.6031494140625, 4.77215576171875, 4.941162109375, 5.11016845703125, 5.2791748046875, 5.44818115234375, 5.6171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 6.0, 6.0, 7.0, 11.0, 14.0, 10.0, 11.0, 8.0, 23.0, 21.0, 27.0, 32.0, 42.0, 58.0, 45.0, 46.0, 60.0, 52.0, 46.0, 43.0, 43.0, 39.0, 53.0, 38.0, 34.0, 42.0, 35.0, 29.0, 24.0, 18.0, 21.0, 11.0, 13.0, 12.0, 6.0, 4.0, 7.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.609375, -3.49969482421875, -3.3900146484375, -3.28033447265625, -3.170654296875, -3.06097412109375, -2.9512939453125, -2.84161376953125, -2.73193359375, -2.62225341796875, -2.5125732421875, -2.40289306640625, -2.293212890625, -2.18353271484375, -2.0738525390625, -1.96417236328125, -1.8544921875, -1.74481201171875, -1.6351318359375, -1.52545166015625, -1.415771484375, -1.30609130859375, -1.1964111328125, -1.08673095703125, -0.97705078125, -0.86737060546875, -0.7576904296875, -0.64801025390625, -0.538330078125, -0.42864990234375, -0.3189697265625, -0.20928955078125, -0.099609375, 0.01007080078125, 0.1197509765625, 0.22943115234375, 0.339111328125, 0.44879150390625, 0.5584716796875, 0.66815185546875, 0.77783203125, 0.88751220703125, 0.9971923828125, 1.10687255859375, 1.216552734375, 1.32623291015625, 1.4359130859375, 1.54559326171875, 1.6552734375, 1.76495361328125, 1.8746337890625, 1.98431396484375, 2.093994140625, 2.20367431640625, 2.3133544921875, 2.42303466796875, 2.53271484375, 2.64239501953125, 2.7520751953125, 2.86175537109375, 2.971435546875, 3.08111572265625, 3.1907958984375, 3.30047607421875, 3.41015625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 9.0, 11.0, 8.0, 16.0, 24.0, 33.0, 58.0, 94.0, 147.0, 264.0, 520.0, 1168.0, 2719.0, 6781.0, 19254.0, 61528.0, 425852.0, 435684.0, 62788.0, 19498.0, 6922.0, 2737.0, 1150.0, 566.0, 321.0, 166.0, 85.0, 54.0, 33.0, 27.0, 13.0, 6.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.5546875, -3.455963134765625, -3.35723876953125, -3.258514404296875, -3.1597900390625, -3.061065673828125, -2.96234130859375, -2.863616943359375, -2.764892578125, -2.666168212890625, -2.56744384765625, -2.468719482421875, -2.3699951171875, -2.271270751953125, -2.17254638671875, -2.073822021484375, -1.97509765625, -1.876373291015625, -1.77764892578125, -1.678924560546875, -1.5802001953125, -1.481475830078125, -1.38275146484375, -1.284027099609375, -1.185302734375, -1.086578369140625, -0.98785400390625, -0.889129638671875, -0.7904052734375, -0.691680908203125, -0.59295654296875, -0.494232177734375, -0.3955078125, -0.296783447265625, -0.19805908203125, -0.099334716796875, -0.0006103515625, 0.098114013671875, 0.19683837890625, 0.295562744140625, 0.394287109375, 0.493011474609375, 0.59173583984375, 0.690460205078125, 0.7891845703125, 0.887908935546875, 0.98663330078125, 1.085357666015625, 1.18408203125, 1.282806396484375, 1.38153076171875, 1.480255126953125, 1.5789794921875, 1.677703857421875, 1.77642822265625, 1.875152587890625, 1.973876953125, 2.072601318359375, 2.17132568359375, 2.270050048828125, 2.3687744140625, 2.467498779296875, 2.56622314453125, 2.664947509765625, 2.763671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 9.0, 3.0, 13.0, 13.0, 21.0, 26.0, 36.0, 50.0, 186.0, 344.0, 140.0, 52.0, 25.0, 24.0, 22.0, 13.0, 10.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009131431579589844, -0.0008771345019340515, -0.0008411258459091187, -0.0008051171898841858, -0.0007691085338592529, -0.0007330998778343201, -0.0006970912218093872, -0.0006610825657844543, -0.0006250739097595215, -0.0005890652537345886, -0.0005530565977096558, -0.0005170479416847229, -0.00048103928565979004, -0.0004450306296348572, -0.0004090219736099243, -0.00037301331758499146, -0.0003370046615600586, -0.00030099600553512573, -0.00026498734951019287, -0.00022897869348526, -0.00019297003746032715, -0.0001569613814353943, -0.00012095272541046143, -8.494406938552856e-05, -4.89354133605957e-05, -1.2926757335662842e-05, 2.308189868927002e-05, 5.909055471420288e-05, 9.509921073913574e-05, 0.0001311078667640686, 0.00016711652278900146, 0.00020312517881393433, 0.0002391338348388672, 0.00027514249086380005, 0.0003111511468887329, 0.00034715980291366577, 0.00038316845893859863, 0.0004191771149635315, 0.00045518577098846436, 0.0004911944270133972, 0.0005272030830383301, 0.0005632117390632629, 0.0005992203950881958, 0.0006352290511131287, 0.0006712377071380615, 0.0007072463631629944, 0.0007432550191879272, 0.0007792636752128601, 0.000815272331237793, 0.0008512809872627258, 0.0008872896432876587, 0.0009232982993125916, 0.0009593069553375244, 0.0009953156113624573, 0.0010313242673873901, 0.001067332923412323, 0.0011033415794372559, 0.0011393502354621887, 0.0011753588914871216, 0.0012113675475120544, 0.0012473762035369873, 0.0012833848595619202, 0.001319393515586853, 0.0013554021716117859, 0.0013914108276367188]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 5.0, 5.0, 15.0, 26.0, 33.0, 35.0, 67.0, 97.0, 176.0, 269.0, 434.0, 807.0, 1611.0, 3716.0, 10013.0, 30050.0, 97817.0, 647350.0, 185417.0, 45777.0, 15012.0, 5328.0, 2210.0, 943.0, 522.0, 265.0, 168.0, 129.0, 78.0, 49.0, 42.0, 20.0, 17.0, 13.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.638671875, -2.543365478515625, -2.44805908203125, -2.352752685546875, -2.2574462890625, -2.162139892578125, -2.06683349609375, -1.971527099609375, -1.876220703125, -1.780914306640625, -1.68560791015625, -1.590301513671875, -1.4949951171875, -1.399688720703125, -1.30438232421875, -1.209075927734375, -1.11376953125, -1.018463134765625, -0.92315673828125, -0.827850341796875, -0.7325439453125, -0.637237548828125, -0.54193115234375, -0.446624755859375, -0.351318359375, -0.256011962890625, -0.16070556640625, -0.065399169921875, 0.0299072265625, 0.125213623046875, 0.22052001953125, 0.315826416015625, 0.4111328125, 0.506439208984375, 0.60174560546875, 0.697052001953125, 0.7923583984375, 0.887664794921875, 0.98297119140625, 1.078277587890625, 1.173583984375, 1.268890380859375, 1.36419677734375, 1.459503173828125, 1.5548095703125, 1.650115966796875, 1.74542236328125, 1.840728759765625, 1.93603515625, 2.031341552734375, 2.12664794921875, 2.221954345703125, 2.3172607421875, 2.412567138671875, 2.50787353515625, 2.603179931640625, 2.698486328125, 2.793792724609375, 2.88909912109375, 2.984405517578125, 3.0797119140625, 3.175018310546875, 3.27032470703125, 3.365631103515625, 3.4609375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 8.0, 11.0, 8.0, 11.0, 13.0, 14.0, 22.0, 27.0, 30.0, 50.0, 112.0, 168.0, 187.0, 118.0, 54.0, 44.0, 23.0, 21.0, 13.0, 10.0, 17.0, 10.0, 13.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.34088134765625, -2.2481689453125, -2.15545654296875, -2.062744140625, -1.97003173828125, -1.8773193359375, -1.78460693359375, -1.69189453125, -1.59918212890625, -1.5064697265625, -1.41375732421875, -1.321044921875, -1.22833251953125, -1.1356201171875, -1.04290771484375, -0.9501953125, -0.85748291015625, -0.7647705078125, -0.67205810546875, -0.579345703125, -0.48663330078125, -0.3939208984375, -0.30120849609375, -0.20849609375, -0.11578369140625, -0.0230712890625, 0.06964111328125, 0.162353515625, 0.25506591796875, 0.3477783203125, 0.44049072265625, 0.533203125, 0.62591552734375, 0.7186279296875, 0.81134033203125, 0.904052734375, 0.99676513671875, 1.0894775390625, 1.18218994140625, 1.27490234375, 1.36761474609375, 1.4603271484375, 1.55303955078125, 1.645751953125, 1.73846435546875, 1.8311767578125, 1.92388916015625, 2.0166015625, 2.10931396484375, 2.2020263671875, 2.29473876953125, 2.387451171875, 2.48016357421875, 2.5728759765625, 2.66558837890625, 2.75830078125, 2.85101318359375, 2.9437255859375, 3.03643798828125, 3.129150390625, 3.22186279296875, 3.3145751953125, 3.40728759765625, 3.5]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 18.0, 72.0, 186.0, 246.0, 270.0, 125.0, 53.0, 24.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-102.9625244140625, -100.8171615600586, -98.67179870605469, -96.52643585205078, -94.38107299804688, -92.2357177734375, -90.09034729003906, -87.94499206542969, -85.79962921142578, -83.65426635742188, -81.50890350341797, -79.36354064941406, -77.21817779541016, -75.07281494140625, -72.92745971679688, -70.78209686279297, -68.63673400878906, -66.49137115478516, -64.34600830078125, -62.200645446777344, -60.0552864074707, -57.9099235534668, -55.76456069946289, -53.619197845458984, -51.47383117675781, -49.328468322753906, -47.18310546875, -45.037742614746094, -42.89238357543945, -40.74702072143555, -38.60165786743164, -36.456295013427734, -34.310935974121094, -32.16557312011719, -30.020212173461914, -27.874849319458008, -25.729488372802734, -23.584125518798828, -21.438762664794922, -19.293399810791016, -17.148038864135742, -15.002676963806152, -12.857315063476562, -10.711952209472656, -8.566590309143066, -6.421228408813477, -4.27586555480957, -2.1305036544799805, 0.014858245849609375, 2.1602203845977783, 4.305582523345947, 6.450944900512695, 8.596306800842285, 10.741668701171875, 12.887031555175781, 15.032393455505371, 17.17775535583496, 19.323118209838867, 21.46847915649414, 23.613842010498047, 25.759204864501953, 27.904565811157227, 30.049928665161133, 32.195289611816406, 34.34065246582031]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 7.0, 12.0, 11.0, 13.0, 9.0, 17.0, 16.0, 21.0, 22.0, 34.0, 26.0, 36.0, 27.0, 40.0, 40.0, 36.0, 35.0, 44.0, 42.0, 31.0, 35.0, 37.0, 44.0, 28.0, 37.0, 31.0, 31.0, 21.0, 29.0, 21.0, 24.0, 25.0, 15.0, 14.0, 19.0, 10.0, 7.0, 8.0, 10.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-15.189441680908203, -14.715103149414062, -14.240764617919922, -13.766426086425781, -13.292086601257324, -12.817748069763184, -12.343409538269043, -11.869071006774902, -11.394731521606445, -10.920392990112305, -10.446054458618164, -9.971715927124023, -9.497376441955566, -9.023037910461426, -8.548699378967285, -8.074360847473145, -7.600022315979004, -7.125683784484863, -6.6513447761535645, -6.177006244659424, -5.702667236328125, -5.228328704833984, -4.753990173339844, -4.279651641845703, -3.8053126335144043, -3.3309738636016846, -2.856635093688965, -2.382296562194824, -1.9079577922821045, -1.4336190223693848, -0.9592804908752441, -0.4849417209625244, -0.010602951049804688, 0.46373575925827026, 0.9380744695663452, 1.4124131202697754, 1.8867518901824951, 2.361090660095215, 2.8354291915893555, 3.309767961502075, 3.784106731414795, 4.2584452629089355, 4.732784271240234, 5.207122802734375, 5.681461334228516, 6.1558003425598145, 6.630138874053955, 7.104477882385254, 7.5788164138793945, 8.053154945373535, 8.527493476867676, 9.001832962036133, 9.476171493530273, 9.950510025024414, 10.424848556518555, 10.899187088012695, 11.373525619506836, 11.847864151000977, 12.322202682495117, 12.796541213989258, 13.270880699157715, 13.745219230651855, 14.219557762145996, 14.693896293640137, 15.168235778808594]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 12.0, 20.0, 31.0, 50.0, 97.0, 182.0, 381.0, 821.0, 1793.0, 4684.0, 13752.0, 49649.0, 350975.0, 3600468.0, 128837.0, 27960.0, 8680.0, 3243.0, 1347.0, 585.0, 281.0, 155.0, 86.0, 48.0, 33.0, 26.0, 22.0, 10.0, 10.0, 6.0, 8.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7578125, -5.5543212890625, -5.350830078125, -5.1473388671875, -4.94384765625, -4.7403564453125, -4.536865234375, -4.3333740234375, -4.1298828125, -3.9263916015625, -3.722900390625, -3.5194091796875, -3.31591796875, -3.1124267578125, -2.908935546875, -2.7054443359375, -2.501953125, -2.2984619140625, -2.094970703125, -1.8914794921875, -1.68798828125, -1.4844970703125, -1.281005859375, -1.0775146484375, -0.8740234375, -0.6705322265625, -0.467041015625, -0.2635498046875, -0.06005859375, 0.1434326171875, 0.346923828125, 0.5504150390625, 0.75390625, 0.9573974609375, 1.160888671875, 1.3643798828125, 1.56787109375, 1.7713623046875, 1.974853515625, 2.1783447265625, 2.3818359375, 2.5853271484375, 2.788818359375, 2.9923095703125, 3.19580078125, 3.3992919921875, 3.602783203125, 3.8062744140625, 4.009765625, 4.2132568359375, 4.416748046875, 4.6202392578125, 4.82373046875, 5.0272216796875, 5.230712890625, 5.4342041015625, 5.6376953125, 5.8411865234375, 6.044677734375, 6.2481689453125, 6.45166015625, 6.6551513671875, 6.858642578125, 7.0621337890625, 7.265625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 7.0, 9.0, 9.0, 13.0, 13.0, 19.0, 18.0, 24.0, 34.0, 37.0, 32.0, 33.0, 48.0, 43.0, 49.0, 44.0, 52.0, 31.0, 55.0, 26.0, 47.0, 33.0, 36.0, 35.0, 31.0, 34.0, 30.0, 31.0, 27.0, 18.0, 15.0, 10.0, 14.0, 7.0, 6.0, 7.0, 5.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7817306518554688, -0.7563323974609375, -0.7309341430664062, -0.705535888671875, -0.6801376342773438, -0.6547393798828125, -0.6293411254882812, -0.60394287109375, -0.5785446166992188, -0.5531463623046875, -0.5277481079101562, -0.502349853515625, -0.47695159912109375, -0.4515533447265625, -0.42615509033203125, -0.4007568359375, -0.37535858154296875, -0.3499603271484375, -0.32456207275390625, -0.299163818359375, -0.27376556396484375, -0.2483673095703125, -0.22296905517578125, -0.19757080078125, -0.17217254638671875, -0.1467742919921875, -0.12137603759765625, -0.095977783203125, -0.07057952880859375, -0.0451812744140625, -0.01978302001953125, 0.005615234375, 0.03101348876953125, 0.0564117431640625, 0.08180999755859375, 0.107208251953125, 0.13260650634765625, 0.1580047607421875, 0.18340301513671875, 0.20880126953125, 0.23419952392578125, 0.2595977783203125, 0.28499603271484375, 0.310394287109375, 0.33579254150390625, 0.3611907958984375, 0.38658905029296875, 0.4119873046875, 0.43738555908203125, 0.4627838134765625, 0.48818206787109375, 0.513580322265625, 0.5389785766601562, 0.5643768310546875, 0.5897750854492188, 0.61517333984375, 0.6405715942382812, 0.6659698486328125, 0.6913681030273438, 0.716766357421875, 0.7421646118164062, 0.7675628662109375, 0.7929611206054688, 0.818359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 11.0, 10.0, 14.0, 17.0, 19.0, 42.0, 54.0, 74.0, 129.0, 234.0, 404.0, 800.0, 1695.0, 4027.0, 11133.0, 38322.0, 220172.0, 3534355.0, 314371.0, 46813.0, 13029.0, 4612.0, 1934.0, 887.0, 461.0, 243.0, 144.0, 106.0, 44.0, 40.0, 31.0, 12.0, 14.0, 8.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01953125, -5.8226318359375, -5.625732421875, -5.4288330078125, -5.23193359375, -5.0350341796875, -4.838134765625, -4.6412353515625, -4.4443359375, -4.2474365234375, -4.050537109375, -3.8536376953125, -3.65673828125, -3.4598388671875, -3.262939453125, -3.0660400390625, -2.869140625, -2.6722412109375, -2.475341796875, -2.2784423828125, -2.08154296875, -1.8846435546875, -1.687744140625, -1.4908447265625, -1.2939453125, -1.0970458984375, -0.900146484375, -0.7032470703125, -0.50634765625, -0.3094482421875, -0.112548828125, 0.0843505859375, 0.28125, 0.4781494140625, 0.675048828125, 0.8719482421875, 1.06884765625, 1.2657470703125, 1.462646484375, 1.6595458984375, 1.8564453125, 2.0533447265625, 2.250244140625, 2.4471435546875, 2.64404296875, 2.8409423828125, 3.037841796875, 3.2347412109375, 3.431640625, 3.6285400390625, 3.825439453125, 4.0223388671875, 4.21923828125, 4.4161376953125, 4.613037109375, 4.8099365234375, 5.0068359375, 5.2037353515625, 5.400634765625, 5.5975341796875, 5.79443359375, 5.9913330078125, 6.188232421875, 6.3851318359375, 6.58203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 22.0, 8.0, 27.0, 28.0, 45.0, 81.0, 152.0, 302.0, 1051.0, 1558.0, 339.0, 170.0, 98.0, 52.0, 38.0, 18.0, 15.0, 14.0, 8.0, 5.0, 4.0, 8.0, 5.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.452392578125, -2.37353515625, -2.294677734375, -2.2158203125, -2.136962890625, -2.05810546875, -1.979248046875, -1.900390625, -1.821533203125, -1.74267578125, -1.663818359375, -1.5849609375, -1.506103515625, -1.42724609375, -1.348388671875, -1.26953125, -1.190673828125, -1.11181640625, -1.032958984375, -0.9541015625, -0.875244140625, -0.79638671875, -0.717529296875, -0.638671875, -0.559814453125, -0.48095703125, -0.402099609375, -0.3232421875, -0.244384765625, -0.16552734375, -0.086669921875, -0.0078125, 0.071044921875, 0.14990234375, 0.228759765625, 0.3076171875, 0.386474609375, 0.46533203125, 0.544189453125, 0.623046875, 0.701904296875, 0.78076171875, 0.859619140625, 0.9384765625, 1.017333984375, 1.09619140625, 1.175048828125, 1.25390625, 1.332763671875, 1.41162109375, 1.490478515625, 1.5693359375, 1.648193359375, 1.72705078125, 1.805908203125, 1.884765625, 1.963623046875, 2.04248046875, 2.121337890625, 2.2001953125, 2.279052734375, 2.35791015625, 2.436767578125, 2.515625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 22.0, 44.0, 105.0, 196.0, 209.0, 175.0, 119.0, 45.0, 38.0, 20.0, 7.0, 9.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.82302474975586, -34.0769157409668, -33.330806732177734, -32.58469772338867, -31.838590621948242, -31.09248161315918, -30.346372604370117, -29.600263595581055, -28.854156494140625, -28.108047485351562, -27.3619384765625, -26.615829467773438, -25.869722366333008, -25.123613357543945, -24.377504348754883, -23.63139533996582, -22.885286331176758, -22.139177322387695, -21.393068313598633, -20.646961212158203, -19.90085220336914, -19.154743194580078, -18.408634185791016, -17.662525177001953, -16.91641616821289, -16.170307159423828, -15.424199104309082, -14.67809009552002, -13.931982040405273, -13.185873031616211, -12.439764022827148, -11.693655014038086, -10.947547912597656, -10.201438903808594, -9.455330848693848, -8.709221839904785, -7.963113307952881, -7.217004776000977, -6.470895767211914, -5.72478723526001, -4.9786787033081055, -4.232570171356201, -3.4864614009857178, -2.7403526306152344, -1.99424409866333, -1.2481355667114258, -0.5020265579223633, 0.24408197402954102, 0.9901905059814453, 1.7362991571426392, 2.482407808303833, 3.2285165786743164, 3.9746251106262207, 4.720733642578125, 5.4668426513671875, 6.212951183319092, 6.959059715270996, 7.7051682472229, 8.451276779174805, 9.197385787963867, 9.94349479675293, 10.689602851867676, 11.435711860656738, 12.181819915771484, 12.927928924560547]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 6.0, 8.0, 8.0, 14.0, 9.0, 14.0, 22.0, 11.0, 19.0, 20.0, 27.0, 29.0, 34.0, 36.0, 43.0, 39.0, 39.0, 37.0, 44.0, 38.0, 38.0, 53.0, 47.0, 41.0, 36.0, 29.0, 28.0, 36.0, 22.0, 29.0, 18.0, 16.0, 16.0, 13.0, 17.0, 8.0, 9.0, 5.0, 7.0, 2.0, 8.0, 6.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.94080924987793, -5.745716094970703, -5.550622940063477, -5.355530261993408, -5.160437107086182, -4.965343952178955, -4.770251274108887, -4.57515811920166, -4.380064964294434, -4.184971809387207, -3.9898788928985596, -3.794785976409912, -3.5996928215026855, -3.404599666595459, -3.2095067501068115, -3.014413833618164, -2.8193206787109375, -2.624227523803711, -2.4291346073150635, -2.234041690826416, -2.0389485359191895, -1.8438555002212524, -1.6487624645233154, -1.4536694288253784, -1.2585763931274414, -1.0634833574295044, -0.8683903217315674, -0.6732972860336304, -0.47820425033569336, -0.28311121463775635, -0.08801817893981934, 0.10707485675811768, 0.3021674156188965, 0.4972604513168335, 0.6923534870147705, 0.8874465227127075, 1.0825395584106445, 1.2776325941085815, 1.4727256298065186, 1.6678186655044556, 1.8629117012023926, 2.058004856109619, 2.2530977725982666, 2.448190689086914, 2.6432838439941406, 2.838376998901367, 3.0334699153900146, 3.228562831878662, 3.4236559867858887, 3.6187491416931152, 3.8138420581817627, 4.00893497467041, 4.204028129577637, 4.399121284484863, 4.59421443939209, 4.789307117462158, 4.984400272369385, 5.179493427276611, 5.37458610534668, 5.569679260253906, 5.764772415161133, 5.959865570068359, 6.154958724975586, 6.350051403045654, 6.545144557952881]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 8.0, 7.0, 19.0, 25.0, 33.0, 71.0, 82.0, 148.0, 264.0, 440.0, 906.0, 1758.0, 3867.0, 8046.0, 17132.0, 36414.0, 90963.0, 348913.0, 371095.0, 96247.0, 38182.0, 17764.0, 8378.0, 3821.0, 1871.0, 925.0, 459.0, 272.0, 167.0, 78.0, 64.0, 42.0, 24.0, 23.0, 13.0, 8.0, 8.0, 4.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.61328125, -3.500457763671875, -3.38763427734375, -3.274810791015625, -3.1619873046875, -3.049163818359375, -2.93634033203125, -2.823516845703125, -2.710693359375, -2.597869873046875, -2.48504638671875, -2.372222900390625, -2.2593994140625, -2.146575927734375, -2.03375244140625, -1.920928955078125, -1.80810546875, -1.695281982421875, -1.58245849609375, -1.469635009765625, -1.3568115234375, -1.243988037109375, -1.13116455078125, -1.018341064453125, -0.905517578125, -0.792694091796875, -0.67987060546875, -0.567047119140625, -0.4542236328125, -0.341400146484375, -0.22857666015625, -0.115753173828125, -0.0029296875, 0.109893798828125, 0.22271728515625, 0.335540771484375, 0.4483642578125, 0.561187744140625, 0.67401123046875, 0.786834716796875, 0.899658203125, 1.012481689453125, 1.12530517578125, 1.238128662109375, 1.3509521484375, 1.463775634765625, 1.57659912109375, 1.689422607421875, 1.80224609375, 1.915069580078125, 2.02789306640625, 2.140716552734375, 2.2535400390625, 2.366363525390625, 2.47918701171875, 2.592010498046875, 2.704833984375, 2.817657470703125, 2.93048095703125, 3.043304443359375, 3.1561279296875, 3.268951416015625, 3.38177490234375, 3.494598388671875, 3.607421875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 6.0, 9.0, 12.0, 12.0, 26.0, 30.0, 27.0, 30.0, 19.0, 33.0, 60.0, 37.0, 45.0, 52.0, 56.0, 48.0, 45.0, 47.0, 38.0, 29.0, 35.0, 54.0, 35.0, 34.0, 34.0, 31.0, 17.0, 14.0, 22.0, 16.0, 6.0, 10.0, 4.0, 7.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71142578125, -0.6832046508789062, -0.6549835205078125, -0.6267623901367188, -0.598541259765625, -0.5703201293945312, -0.5420989990234375, -0.5138778686523438, -0.48565673828125, -0.45743560791015625, -0.4292144775390625, -0.40099334716796875, -0.372772216796875, -0.34455108642578125, -0.3163299560546875, -0.28810882568359375, -0.2598876953125, -0.23166656494140625, -0.2034454345703125, -0.17522430419921875, -0.147003173828125, -0.11878204345703125, -0.0905609130859375, -0.06233978271484375, -0.03411865234375, -0.00589752197265625, 0.0223236083984375, 0.05054473876953125, 0.078765869140625, 0.10698699951171875, 0.1352081298828125, 0.16342926025390625, 0.191650390625, 0.21987152099609375, 0.2480926513671875, 0.27631378173828125, 0.304534912109375, 0.33275604248046875, 0.3609771728515625, 0.38919830322265625, 0.41741943359375, 0.44564056396484375, 0.4738616943359375, 0.5020828247070312, 0.530303955078125, 0.5585250854492188, 0.5867462158203125, 0.6149673461914062, 0.6431884765625, 0.6714096069335938, 0.6996307373046875, 0.7278518676757812, 0.756072998046875, 0.7842941284179688, 0.8125152587890625, 0.8407363891601562, 0.86895751953125, 0.8971786499023438, 0.9253997802734375, 0.9536209106445312, 0.981842041015625, 1.0100631713867188, 1.0382843017578125, 1.0665054321289062, 1.0947265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 14.0, 6.0, 11.0, 13.0, 17.0, 23.0, 39.0, 63.0, 78.0, 128.0, 178.0, 289.0, 540.0, 1078.0, 2459.0, 5854.0, 14579.0, 37466.0, 129429.0, 644775.0, 145044.0, 39654.0, 15428.0, 6121.0, 2615.0, 1171.0, 539.0, 344.0, 173.0, 136.0, 81.0, 50.0, 33.0, 31.0, 21.0, 21.0, 10.0, 5.0, 9.0, 8.0, 5.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.93359375, -3.79071044921875, -3.6478271484375, -3.50494384765625, -3.362060546875, -3.21917724609375, -3.0762939453125, -2.93341064453125, -2.79052734375, -2.64764404296875, -2.5047607421875, -2.36187744140625, -2.218994140625, -2.07611083984375, -1.9332275390625, -1.79034423828125, -1.6474609375, -1.50457763671875, -1.3616943359375, -1.21881103515625, -1.075927734375, -0.93304443359375, -0.7901611328125, -0.64727783203125, -0.50439453125, -0.36151123046875, -0.2186279296875, -0.07574462890625, 0.067138671875, 0.21002197265625, 0.3529052734375, 0.49578857421875, 0.638671875, 0.78155517578125, 0.9244384765625, 1.06732177734375, 1.210205078125, 1.35308837890625, 1.4959716796875, 1.63885498046875, 1.78173828125, 1.92462158203125, 2.0675048828125, 2.21038818359375, 2.353271484375, 2.49615478515625, 2.6390380859375, 2.78192138671875, 2.9248046875, 3.06768798828125, 3.2105712890625, 3.35345458984375, 3.496337890625, 3.63922119140625, 3.7821044921875, 3.92498779296875, 4.06787109375, 4.21075439453125, 4.3536376953125, 4.49652099609375, 4.639404296875, 4.78228759765625, 4.9251708984375, 5.06805419921875, 5.2109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 6.0, 10.0, 16.0, 6.0, 7.0, 16.0, 18.0, 21.0, 26.0, 33.0, 41.0, 61.0, 49.0, 62.0, 51.0, 56.0, 58.0, 52.0, 55.0, 51.0, 51.0, 47.0, 36.0, 32.0, 28.0, 28.0, 6.0, 16.0, 11.0, 15.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.50390625, -4.35760498046875, -4.2113037109375, -4.06500244140625, -3.918701171875, -3.77239990234375, -3.6260986328125, -3.47979736328125, -3.33349609375, -3.18719482421875, -3.0408935546875, -2.89459228515625, -2.748291015625, -2.60198974609375, -2.4556884765625, -2.30938720703125, -2.1630859375, -2.01678466796875, -1.8704833984375, -1.72418212890625, -1.577880859375, -1.43157958984375, -1.2852783203125, -1.13897705078125, -0.99267578125, -0.84637451171875, -0.7000732421875, -0.55377197265625, -0.407470703125, -0.26116943359375, -0.1148681640625, 0.03143310546875, 0.177734375, 0.32403564453125, 0.4703369140625, 0.61663818359375, 0.762939453125, 0.90924072265625, 1.0555419921875, 1.20184326171875, 1.34814453125, 1.49444580078125, 1.6407470703125, 1.78704833984375, 1.933349609375, 2.07965087890625, 2.2259521484375, 2.37225341796875, 2.5185546875, 2.66485595703125, 2.8111572265625, 2.95745849609375, 3.103759765625, 3.25006103515625, 3.3963623046875, 3.54266357421875, 3.68896484375, 3.83526611328125, 3.9815673828125, 4.12786865234375, 4.274169921875, 4.42047119140625, 4.5667724609375, 4.71307373046875, 4.859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 10.0, 7.0, 8.0, 21.0, 32.0, 46.0, 52.0, 88.0, 131.0, 274.0, 399.0, 654.0, 1094.0, 2071.0, 4213.0, 9409.0, 25737.0, 129456.0, 774558.0, 67288.0, 18254.0, 7297.0, 3407.0, 1704.0, 935.0, 503.0, 326.0, 222.0, 126.0, 71.0, 55.0, 38.0, 32.0, 19.0, 3.0, 5.0, 4.0, 1.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.66015625, -4.531951904296875, -4.40374755859375, -4.275543212890625, -4.1473388671875, -4.019134521484375, -3.89093017578125, -3.762725830078125, -3.634521484375, -3.506317138671875, -3.37811279296875, -3.249908447265625, -3.1217041015625, -2.993499755859375, -2.86529541015625, -2.737091064453125, -2.60888671875, -2.480682373046875, -2.35247802734375, -2.224273681640625, -2.0960693359375, -1.967864990234375, -1.83966064453125, -1.711456298828125, -1.583251953125, -1.455047607421875, -1.32684326171875, -1.198638916015625, -1.0704345703125, -0.942230224609375, -0.81402587890625, -0.685821533203125, -0.5576171875, -0.429412841796875, -0.30120849609375, -0.173004150390625, -0.0447998046875, 0.083404541015625, 0.21160888671875, 0.339813232421875, 0.468017578125, 0.596221923828125, 0.72442626953125, 0.852630615234375, 0.9808349609375, 1.109039306640625, 1.23724365234375, 1.365447998046875, 1.49365234375, 1.621856689453125, 1.75006103515625, 1.878265380859375, 2.0064697265625, 2.134674072265625, 2.26287841796875, 2.391082763671875, 2.519287109375, 2.647491455078125, 2.77569580078125, 2.903900146484375, 3.0321044921875, 3.160308837890625, 3.28851318359375, 3.416717529296875, 3.544921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 10.0, 14.0, 8.0, 8.0, 12.0, 23.0, 32.0, 80.0, 290.0, 292.0, 88.0, 39.0, 22.0, 20.0, 14.0, 9.0, 8.0, 5.0, 7.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.001308441162109375, -0.0012740567326545715, -0.001239672303199768, -0.0012052878737449646, -0.0011709034442901611, -0.0011365190148353577, -0.0011021345853805542, -0.0010677501559257507, -0.0010333657264709473, -0.0009989812970161438, -0.0009645968675613403, -0.0009302124381065369, -0.0008958280086517334, -0.0008614435791969299, -0.0008270591497421265, -0.000792674720287323, -0.0007582902908325195, -0.0007239058613777161, -0.0006895214319229126, -0.0006551370024681091, -0.0006207525730133057, -0.0005863681435585022, -0.0005519837141036987, -0.0005175992846488953, -0.0004832148551940918, -0.00044883042573928833, -0.00041444599628448486, -0.0003800615668296814, -0.00034567713737487793, -0.00031129270792007446, -0.000276908278465271, -0.00024252384901046753, -0.00020813941955566406, -0.0001737549901008606, -0.00013937056064605713, -0.00010498613119125366, -7.06017017364502e-05, -3.621727228164673e-05, -1.8328428268432617e-06, 3.2551586627960205e-05, 6.693601608276367e-05, 0.00010132044553756714, 0.0001357048749923706, 0.00017008930444717407, 0.00020447373390197754, 0.000238858163356781, 0.00027324259281158447, 0.00030762702226638794, 0.0003420114517211914, 0.0003763958811759949, 0.00041078031063079834, 0.0004451647400856018, 0.0004795491695404053, 0.0005139335989952087, 0.0005483180284500122, 0.0005827024579048157, 0.0006170868873596191, 0.0006514713168144226, 0.0006858557462692261, 0.0007202401757240295, 0.000754624605178833, 0.0007890090346336365, 0.0008233934640884399, 0.0008577778935432434, 0.0008921623229980469]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 17.0, 25.0, 68.0, 151.0, 438.0, 1753.0, 11375.0, 962912.0, 66320.0, 4109.0, 902.0, 274.0, 100.0, 49.0, 23.0, 12.0, 4.0, 7.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -11.9969482421875, -11.548583984375, -11.1002197265625, -10.65185546875, -10.2034912109375, -9.755126953125, -9.3067626953125, -8.8583984375, -8.4100341796875, -7.961669921875, -7.5133056640625, -7.06494140625, -6.6165771484375, -6.168212890625, -5.7198486328125, -5.271484375, -4.8231201171875, -4.374755859375, -3.9263916015625, -3.47802734375, -3.0296630859375, -2.581298828125, -2.1329345703125, -1.6845703125, -1.2362060546875, -0.787841796875, -0.3394775390625, 0.10888671875, 0.5572509765625, 1.005615234375, 1.4539794921875, 1.90234375, 2.3507080078125, 2.799072265625, 3.2474365234375, 3.69580078125, 4.1441650390625, 4.592529296875, 5.0408935546875, 5.4892578125, 5.9376220703125, 6.385986328125, 6.8343505859375, 7.28271484375, 7.7310791015625, 8.179443359375, 8.6278076171875, 9.076171875, 9.5245361328125, 9.972900390625, 10.4212646484375, 10.86962890625, 11.3179931640625, 11.766357421875, 12.2147216796875, 12.6630859375, 13.1114501953125, 13.559814453125, 14.0081787109375, 14.45654296875, 14.9049072265625, 15.353271484375, 15.8016357421875, 16.25]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 8.0, 3.0, 11.0, 17.0, 19.0, 36.0, 87.0, 253.0, 338.0, 108.0, 49.0, 27.0, 13.0, 9.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.25634765625, -6.0556640625, -5.85498046875, -5.654296875, -5.45361328125, -5.2529296875, -5.05224609375, -4.8515625, -4.65087890625, -4.4501953125, -4.24951171875, -4.048828125, -3.84814453125, -3.6474609375, -3.44677734375, -3.24609375, -3.04541015625, -2.8447265625, -2.64404296875, -2.443359375, -2.24267578125, -2.0419921875, -1.84130859375, -1.640625, -1.43994140625, -1.2392578125, -1.03857421875, -0.837890625, -0.63720703125, -0.4365234375, -0.23583984375, -0.03515625, 0.16552734375, 0.3662109375, 0.56689453125, 0.767578125, 0.96826171875, 1.1689453125, 1.36962890625, 1.5703125, 1.77099609375, 1.9716796875, 2.17236328125, 2.373046875, 2.57373046875, 2.7744140625, 2.97509765625, 3.17578125, 3.37646484375, 3.5771484375, 3.77783203125, 3.978515625, 4.17919921875, 4.3798828125, 4.58056640625, 4.78125, 4.98193359375, 5.1826171875, 5.38330078125, 5.583984375, 5.78466796875, 5.9853515625, 6.18603515625, 6.38671875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 20.0, 47.0, 105.0, 239.0, 286.0, 195.0, 76.0, 30.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.8776092529297, -130.07093811035156, -127.2642593383789, -124.45758056640625, -121.6509017944336, -118.84422302246094, -116.03755187988281, -113.23087310791016, -110.4241943359375, -107.61751556396484, -104.81084442138672, -102.00416564941406, -99.1974868774414, -96.39080810546875, -93.58413696289062, -90.77745819091797, -87.97077941894531, -85.16410064697266, -82.35742950439453, -79.55075073242188, -76.74407196044922, -73.93739318847656, -71.13072204589844, -68.32404327392578, -65.51737213134766, -62.710697174072266, -59.90401840209961, -57.09734344482422, -54.29066467285156, -51.48398971557617, -48.67731475830078, -45.870635986328125, -43.06395721435547, -40.25728225708008, -37.45060348510742, -34.64392852783203, -31.837249755859375, -29.030574798583984, -26.22389793395996, -23.417221069335938, -20.610544204711914, -17.80386734008789, -14.997190475463867, -12.19051456451416, -9.383837699890137, -6.577160835266113, -3.7704849243164062, -0.9638080596923828, 1.8428688049316406, 4.649545669555664, 7.456222057342529, 10.262898445129395, 13.069575309753418, 15.876252174377441, 18.68292808532715, 21.489604949951172, 24.296281814575195, 27.10295867919922, 29.909635543823242, 32.716312408447266, 35.522987365722656, 38.32966613769531, 41.1363410949707, 43.943016052246094, 46.74969482421875]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 4.0, 3.0, 8.0, 5.0, 19.0, 18.0, 21.0, 21.0, 13.0, 21.0, 25.0, 29.0, 30.0, 31.0, 33.0, 39.0, 42.0, 33.0, 40.0, 39.0, 40.0, 47.0, 42.0, 33.0, 26.0, 47.0, 29.0, 36.0, 32.0, 19.0, 24.0, 16.0, 19.0, 19.0, 13.0, 15.0, 14.0, 11.0, 9.0, 8.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0], "bins": [-22.060283660888672, -21.46369743347168, -20.867111206054688, -20.270523071289062, -19.67393684387207, -19.077350616455078, -18.480762481689453, -17.88417625427246, -17.28759002685547, -16.691003799438477, -16.094417572021484, -15.49782943725586, -14.901243209838867, -14.304656982421875, -13.708069801330566, -13.111482620239258, -12.514896392822266, -11.918310165405273, -11.321722984313965, -10.725135803222656, -10.128549575805664, -9.531963348388672, -8.935376167297363, -8.338788986206055, -7.7422027587890625, -7.145616054534912, -6.549029350280762, -5.952442646026611, -5.355855941772461, -4.7592692375183105, -4.16268253326416, -3.5660958290100098, -2.9695072174072266, -2.372920513153076, -1.7763338088989258, -1.1797471046447754, -0.583160400390625, 0.01342630386352539, 0.6100130081176758, 1.2065997123718262, 1.8031864166259766, 2.399773120880127, 2.9963598251342773, 3.5929465293884277, 4.189533233642578, 4.7861199378967285, 5.382706642150879, 5.979293346405029, 6.57588005065918, 7.17246675491333, 7.7690534591674805, 8.365640640258789, 8.962226867675781, 9.558813095092773, 10.155400276184082, 10.75198745727539, 11.348573684692383, 11.945159912109375, 12.541747093200684, 13.138334274291992, 13.734920501708984, 14.331506729125977, 14.928093910217285, 15.524681091308594, 16.121267318725586]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 6.0, 9.0, 7.0, 16.0, 20.0, 41.0, 65.0, 102.0, 166.0, 307.0, 531.0, 1137.0, 2279.0, 4656.0, 10650.0, 26827.0, 80080.0, 443264.0, 3367755.0, 176970.0, 47268.0, 17471.0, 7383.0, 3436.0, 1681.0, 928.0, 487.0, 277.0, 154.0, 99.0, 61.0, 53.0, 35.0, 17.0, 16.0, 6.0, 5.0, 7.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.359375, -5.182373046875, -5.00537109375, -4.828369140625, -4.6513671875, -4.474365234375, -4.29736328125, -4.120361328125, -3.943359375, -3.766357421875, -3.58935546875, -3.412353515625, -3.2353515625, -3.058349609375, -2.88134765625, -2.704345703125, -2.52734375, -2.350341796875, -2.17333984375, -1.996337890625, -1.8193359375, -1.642333984375, -1.46533203125, -1.288330078125, -1.111328125, -0.934326171875, -0.75732421875, -0.580322265625, -0.4033203125, -0.226318359375, -0.04931640625, 0.127685546875, 0.3046875, 0.481689453125, 0.65869140625, 0.835693359375, 1.0126953125, 1.189697265625, 1.36669921875, 1.543701171875, 1.720703125, 1.897705078125, 2.07470703125, 2.251708984375, 2.4287109375, 2.605712890625, 2.78271484375, 2.959716796875, 3.13671875, 3.313720703125, 3.49072265625, 3.667724609375, 3.8447265625, 4.021728515625, 4.19873046875, 4.375732421875, 4.552734375, 4.729736328125, 4.90673828125, 5.083740234375, 5.2607421875, 5.437744140625, 5.61474609375, 5.791748046875, 5.96875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 9.0, 7.0, 17.0, 6.0, 14.0, 20.0, 19.0, 21.0, 40.0, 22.0, 39.0, 40.0, 43.0, 32.0, 40.0, 38.0, 47.0, 56.0, 45.0, 40.0, 34.0, 44.0, 34.0, 34.0, 27.0, 22.0, 30.0, 25.0, 22.0, 25.0, 22.0, 13.0, 9.0, 14.0, 19.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8310546875, -0.8024673461914062, -0.7738800048828125, -0.7452926635742188, -0.716705322265625, -0.6881179809570312, -0.6595306396484375, -0.6309432983398438, -0.60235595703125, -0.5737686157226562, -0.5451812744140625, -0.5165939331054688, -0.488006591796875, -0.45941925048828125, -0.4308319091796875, -0.40224456787109375, -0.3736572265625, -0.34506988525390625, -0.3164825439453125, -0.28789520263671875, -0.259307861328125, -0.23072052001953125, -0.2021331787109375, -0.17354583740234375, -0.14495849609375, -0.11637115478515625, -0.0877838134765625, -0.05919647216796875, -0.030609130859375, -0.00202178955078125, 0.0265655517578125, 0.05515289306640625, 0.083740234375, 0.11232757568359375, 0.1409149169921875, 0.16950225830078125, 0.198089599609375, 0.22667694091796875, 0.2552642822265625, 0.28385162353515625, 0.31243896484375, 0.34102630615234375, 0.3696136474609375, 0.39820098876953125, 0.426788330078125, 0.45537567138671875, 0.4839630126953125, 0.5125503540039062, 0.5411376953125, 0.5697250366210938, 0.5983123779296875, 0.6268997192382812, 0.655487060546875, 0.6840744018554688, 0.7126617431640625, 0.7412490844726562, 0.76983642578125, 0.7984237670898438, 0.8270111083984375, 0.8555984497070312, 0.884185791015625, 0.9127731323242188, 0.9413604736328125, 0.9699478149414062, 0.99853515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 5.0, 5.0, 12.0, 20.0, 29.0, 37.0, 45.0, 49.0, 77.0, 132.0, 177.0, 262.0, 535.0, 1125.0, 2910.0, 9914.0, 44857.0, 410362.0, 3567276.0, 125639.0, 21736.0, 5501.0, 1770.0, 759.0, 364.0, 208.0, 144.0, 96.0, 51.0, 40.0, 45.0, 26.0, 21.0, 14.0, 12.0, 3.0, 3.0, 6.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.671875, -11.331298828125, -10.99072265625, -10.650146484375, -10.3095703125, -9.968994140625, -9.62841796875, -9.287841796875, -8.947265625, -8.606689453125, -8.26611328125, -7.925537109375, -7.5849609375, -7.244384765625, -6.90380859375, -6.563232421875, -6.22265625, -5.882080078125, -5.54150390625, -5.200927734375, -4.8603515625, -4.519775390625, -4.17919921875, -3.838623046875, -3.498046875, -3.157470703125, -2.81689453125, -2.476318359375, -2.1357421875, -1.795166015625, -1.45458984375, -1.114013671875, -0.7734375, -0.432861328125, -0.09228515625, 0.248291015625, 0.5888671875, 0.929443359375, 1.27001953125, 1.610595703125, 1.951171875, 2.291748046875, 2.63232421875, 2.972900390625, 3.3134765625, 3.654052734375, 3.99462890625, 4.335205078125, 4.67578125, 5.016357421875, 5.35693359375, 5.697509765625, 6.0380859375, 6.378662109375, 6.71923828125, 7.059814453125, 7.400390625, 7.740966796875, 8.08154296875, 8.422119140625, 8.7626953125, 9.103271484375, 9.44384765625, 9.784423828125, 10.125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 8.0, 10.0, 14.0, 17.0, 27.0, 56.0, 99.0, 167.0, 440.0, 2281.0, 507.0, 202.0, 106.0, 46.0, 37.0, 12.0, 14.0, 12.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.98828125, -4.8480224609375, -4.707763671875, -4.5675048828125, -4.42724609375, -4.2869873046875, -4.146728515625, -4.0064697265625, -3.8662109375, -3.7259521484375, -3.585693359375, -3.4454345703125, -3.30517578125, -3.1649169921875, -3.024658203125, -2.8843994140625, -2.744140625, -2.6038818359375, -2.463623046875, -2.3233642578125, -2.18310546875, -2.0428466796875, -1.902587890625, -1.7623291015625, -1.6220703125, -1.4818115234375, -1.341552734375, -1.2012939453125, -1.06103515625, -0.9207763671875, -0.780517578125, -0.6402587890625, -0.5, -0.3597412109375, -0.219482421875, -0.0792236328125, 0.06103515625, 0.2012939453125, 0.341552734375, 0.4818115234375, 0.6220703125, 0.7623291015625, 0.902587890625, 1.0428466796875, 1.18310546875, 1.3233642578125, 1.463623046875, 1.6038818359375, 1.744140625, 1.8843994140625, 2.024658203125, 2.1649169921875, 2.30517578125, 2.4454345703125, 2.585693359375, 2.7259521484375, 2.8662109375, 3.0064697265625, 3.146728515625, 3.2869873046875, 3.42724609375, 3.5675048828125, 3.707763671875, 3.8480224609375, 3.98828125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 17.0, 33.0, 74.0, 141.0, 189.0, 215.0, 157.0, 79.0, 50.0, 20.0, 6.0, 12.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.639741897583008, -23.57823371887207, -22.516725540161133, -21.455217361450195, -20.393707275390625, -19.332199096679688, -18.27069091796875, -17.209182739257812, -16.147674560546875, -15.086166381835938, -14.024658203125, -12.963149070739746, -11.901640892028809, -10.840132713317871, -9.778623580932617, -8.71711540222168, -7.655607223510742, -6.594099044799805, -5.532590389251709, -4.471081733703613, -3.409573554992676, -2.3480653762817383, -1.2865567207336426, -0.22504806518554688, 0.8364601135253906, 1.8979685306549072, 2.959476947784424, 4.0209856033325195, 5.082493782043457, 6.1440019607543945, 7.20551061630249, 8.267019271850586, 9.328529357910156, 10.390037536621094, 11.451545715332031, 12.513054847717285, 13.574563026428223, 14.63607120513916, 15.697580337524414, 16.75908851623535, 17.82059669494629, 18.882104873657227, 19.943613052368164, 21.0051212310791, 22.066631317138672, 23.12813949584961, 24.189647674560547, 25.251155853271484, 26.312664031982422, 27.37417221069336, 28.435680389404297, 29.497188568115234, 30.558696746826172, 31.62020492553711, 32.68171310424805, 33.74322509765625, 34.80473327636719, 35.866241455078125, 36.92774963378906, 37.9892578125, 39.05076599121094, 40.112274169921875, 41.17378234863281, 42.23529052734375, 43.29679870605469]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 10.0, 8.0, 7.0, 12.0, 11.0, 6.0, 15.0, 15.0, 13.0, 21.0, 20.0, 26.0, 29.0, 30.0, 33.0, 33.0, 47.0, 36.0, 60.0, 33.0, 40.0, 53.0, 50.0, 40.0, 46.0, 34.0, 41.0, 26.0, 33.0, 24.0, 20.0, 19.0, 19.0, 17.0, 16.0, 18.0, 5.0, 8.0, 10.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.576252937316895, -11.25664234161377, -10.937032699584961, -10.617422103881836, -10.297812461853027, -9.978201866149902, -9.658592224121094, -9.338981628417969, -9.019371032714844, -8.699760437011719, -8.38015079498291, -8.060540199279785, -7.740930557250977, -7.421319961547852, -7.101709842681885, -6.782099723815918, -6.462490081787109, -6.142879962921143, -5.823269844055176, -5.503659725189209, -5.184049606323242, -4.864439010620117, -4.54482889175415, -4.225218772888184, -3.905608654022217, -3.58599853515625, -3.266388416290283, -2.9467780590057373, -2.6271679401397705, -2.3075578212738037, -1.9879475831985474, -1.668337345123291, -1.3487262725830078, -1.029116153717041, -0.7095059156417847, -0.3898957371711731, -0.07028555870056152, 0.24932456016540527, 0.5689347982406616, 0.888545036315918, 1.2081551551818848, 1.5277652740478516, 1.847375512123108, 2.1669857501983643, 2.486595869064331, 2.806205987930298, 3.1258163452148438, 3.4454264640808105, 3.7650365829467773, 4.084646701812744, 4.404256820678711, 4.723866939544678, 5.0434770584106445, 5.3630876541137695, 5.682697772979736, 6.002307891845703, 6.32191801071167, 6.641528129577637, 6.9611382484436035, 7.28074836730957, 7.600358963012695, 7.919968605041504, 8.239579200744629, 8.559188842773438, 8.878799438476562]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 7.0, 8.0, 3.0, 8.0, 6.0, 16.0, 21.0, 33.0, 37.0, 74.0, 93.0, 168.0, 257.0, 394.0, 753.0, 1318.0, 2574.0, 4947.0, 9457.0, 18617.0, 37344.0, 73092.0, 149720.0, 307943.0, 229025.0, 105165.0, 52841.0, 26382.0, 13500.0, 6682.0, 3536.0, 1919.0, 1055.0, 589.0, 366.0, 211.0, 141.0, 68.0, 53.0, 36.0, 35.0, 22.0, 8.0, 10.0, 9.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.494140625, -3.384124755859375, -3.27410888671875, -3.164093017578125, -3.0540771484375, -2.944061279296875, -2.83404541015625, -2.724029541015625, -2.614013671875, -2.503997802734375, -2.39398193359375, -2.283966064453125, -2.1739501953125, -2.063934326171875, -1.95391845703125, -1.843902587890625, -1.73388671875, -1.623870849609375, -1.51385498046875, -1.403839111328125, -1.2938232421875, -1.183807373046875, -1.07379150390625, -0.963775634765625, -0.853759765625, -0.743743896484375, -0.63372802734375, -0.523712158203125, -0.4136962890625, -0.303680419921875, -0.19366455078125, -0.083648681640625, 0.0263671875, 0.136383056640625, 0.24639892578125, 0.356414794921875, 0.4664306640625, 0.576446533203125, 0.68646240234375, 0.796478271484375, 0.906494140625, 1.016510009765625, 1.12652587890625, 1.236541748046875, 1.3465576171875, 1.456573486328125, 1.56658935546875, 1.676605224609375, 1.78662109375, 1.896636962890625, 2.00665283203125, 2.116668701171875, 2.2266845703125, 2.336700439453125, 2.44671630859375, 2.556732177734375, 2.666748046875, 2.776763916015625, 2.88677978515625, 2.996795654296875, 3.1068115234375, 3.216827392578125, 3.32684326171875, 3.436859130859375, 3.546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 5.0, 10.0, 13.0, 14.0, 19.0, 18.0, 22.0, 12.0, 22.0, 29.0, 37.0, 35.0, 46.0, 47.0, 44.0, 30.0, 53.0, 39.0, 54.0, 42.0, 35.0, 32.0, 36.0, 36.0, 38.0, 33.0, 27.0, 30.0, 17.0, 12.0, 13.0, 14.0, 11.0, 10.0, 9.0, 10.0, 9.0, 5.0, 5.0, 2.0, 5.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0406646728515625, -1.006134033203125, -0.9716033935546875, -0.93707275390625, -0.9025421142578125, -0.868011474609375, -0.8334808349609375, -0.7989501953125, -0.7644195556640625, -0.729888916015625, -0.6953582763671875, -0.66082763671875, -0.6262969970703125, -0.591766357421875, -0.5572357177734375, -0.522705078125, -0.4881744384765625, -0.453643798828125, -0.4191131591796875, -0.38458251953125, -0.3500518798828125, -0.315521240234375, -0.2809906005859375, -0.2464599609375, -0.2119293212890625, -0.177398681640625, -0.1428680419921875, -0.10833740234375, -0.0738067626953125, -0.039276123046875, -0.0047454833984375, 0.02978515625, 0.0643157958984375, 0.098846435546875, 0.1333770751953125, 0.16790771484375, 0.2024383544921875, 0.236968994140625, 0.2714996337890625, 0.3060302734375, 0.3405609130859375, 0.375091552734375, 0.4096221923828125, 0.44415283203125, 0.4786834716796875, 0.513214111328125, 0.5477447509765625, 0.582275390625, 0.6168060302734375, 0.651336669921875, 0.6858673095703125, 0.72039794921875, 0.7549285888671875, 0.789459228515625, 0.8239898681640625, 0.8585205078125, 0.8930511474609375, 0.927581787109375, 0.9621124267578125, 0.99664306640625, 1.0311737060546875, 1.065704345703125, 1.1002349853515625, 1.134765625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 5.0, 8.0, 16.0, 14.0, 28.0, 37.0, 41.0, 69.0, 86.0, 104.0, 161.0, 213.0, 329.0, 511.0, 815.0, 1504.0, 3273.0, 9077.0, 30877.0, 118306.0, 522897.0, 264458.0, 66632.0, 18110.0, 5664.0, 2266.0, 1086.0, 592.0, 433.0, 306.0, 180.0, 105.0, 87.0, 69.0, 54.0, 33.0, 23.0, 21.0, 13.0, 13.0, 12.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.93359375, -6.7083740234375, -6.483154296875, -6.2579345703125, -6.03271484375, -5.8074951171875, -5.582275390625, -5.3570556640625, -5.1318359375, -4.9066162109375, -4.681396484375, -4.4561767578125, -4.23095703125, -4.0057373046875, -3.780517578125, -3.5552978515625, -3.330078125, -3.1048583984375, -2.879638671875, -2.6544189453125, -2.42919921875, -2.2039794921875, -1.978759765625, -1.7535400390625, -1.5283203125, -1.3031005859375, -1.077880859375, -0.8526611328125, -0.62744140625, -0.4022216796875, -0.177001953125, 0.0482177734375, 0.2734375, 0.4986572265625, 0.723876953125, 0.9490966796875, 1.17431640625, 1.3995361328125, 1.624755859375, 1.8499755859375, 2.0751953125, 2.3004150390625, 2.525634765625, 2.7508544921875, 2.97607421875, 3.2012939453125, 3.426513671875, 3.6517333984375, 3.876953125, 4.1021728515625, 4.327392578125, 4.5526123046875, 4.77783203125, 5.0030517578125, 5.228271484375, 5.4534912109375, 5.6787109375, 5.9039306640625, 6.129150390625, 6.3543701171875, 6.57958984375, 6.8048095703125, 7.030029296875, 7.2552490234375, 7.48046875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 6.0, 7.0, 9.0, 5.0, 9.0, 10.0, 8.0, 15.0, 18.0, 22.0, 17.0, 28.0, 28.0, 47.0, 46.0, 49.0, 53.0, 54.0, 59.0, 43.0, 53.0, 64.0, 48.0, 38.0, 38.0, 28.0, 35.0, 26.0, 18.0, 22.0, 15.0, 12.0, 17.0, 5.0, 7.0, 6.0, 0.0, 5.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.68359375, -6.4620361328125, -6.240478515625, -6.0189208984375, -5.79736328125, -5.5758056640625, -5.354248046875, -5.1326904296875, -4.9111328125, -4.6895751953125, -4.468017578125, -4.2464599609375, -4.02490234375, -3.8033447265625, -3.581787109375, -3.3602294921875, -3.138671875, -2.9171142578125, -2.695556640625, -2.4739990234375, -2.25244140625, -2.0308837890625, -1.809326171875, -1.5877685546875, -1.3662109375, -1.1446533203125, -0.923095703125, -0.7015380859375, -0.47998046875, -0.2584228515625, -0.036865234375, 0.1846923828125, 0.40625, 0.6278076171875, 0.849365234375, 1.0709228515625, 1.29248046875, 1.5140380859375, 1.735595703125, 1.9571533203125, 2.1787109375, 2.4002685546875, 2.621826171875, 2.8433837890625, 3.06494140625, 3.2864990234375, 3.508056640625, 3.7296142578125, 3.951171875, 4.1727294921875, 4.394287109375, 4.6158447265625, 4.83740234375, 5.0589599609375, 5.280517578125, 5.5020751953125, 5.7236328125, 5.9451904296875, 6.166748046875, 6.3883056640625, 6.60986328125, 6.8314208984375, 7.052978515625, 7.2745361328125, 7.49609375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 11.0, 17.0, 29.0, 33.0, 84.0, 131.0, 246.0, 583.0, 2096.0, 13773.0, 591153.0, 424864.0, 12488.0, 1923.0, 558.0, 247.0, 121.0, 76.0, 48.0, 17.0, 19.0, 7.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.96875, -15.4844970703125, -15.000244140625, -14.5159912109375, -14.03173828125, -13.5474853515625, -13.063232421875, -12.5789794921875, -12.0947265625, -11.6104736328125, -11.126220703125, -10.6419677734375, -10.15771484375, -9.6734619140625, -9.189208984375, -8.7049560546875, -8.220703125, -7.7364501953125, -7.252197265625, -6.7679443359375, -6.28369140625, -5.7994384765625, -5.315185546875, -4.8309326171875, -4.3466796875, -3.8624267578125, -3.378173828125, -2.8939208984375, -2.40966796875, -1.9254150390625, -1.441162109375, -0.9569091796875, -0.47265625, 0.0115966796875, 0.495849609375, 0.9801025390625, 1.46435546875, 1.9486083984375, 2.432861328125, 2.9171142578125, 3.4013671875, 3.8856201171875, 4.369873046875, 4.8541259765625, 5.33837890625, 5.8226318359375, 6.306884765625, 6.7911376953125, 7.275390625, 7.7596435546875, 8.243896484375, 8.7281494140625, 9.21240234375, 9.6966552734375, 10.180908203125, 10.6651611328125, 11.1494140625, 11.6336669921875, 12.117919921875, 12.6021728515625, 13.08642578125, 13.5706787109375, 14.054931640625, 14.5391845703125, 15.0234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 6.0, 6.0, 12.0, 17.0, 34.0, 45.0, 59.0, 92.0, 124.0, 271.0, 105.0, 73.0, 54.0, 35.0, 20.0, 15.0, 9.0, 2.0, 6.0, 9.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019397735595703125, -0.0018835067749023438, -0.001827239990234375, -0.0017709732055664062, -0.0017147064208984375, -0.0016584396362304688, -0.0016021728515625, -0.0015459060668945312, -0.0014896392822265625, -0.0014333724975585938, -0.001377105712890625, -0.0013208389282226562, -0.0012645721435546875, -0.0012083053588867188, -0.00115203857421875, -0.0010957717895507812, -0.0010395050048828125, -0.0009832382202148438, -0.000926971435546875, -0.0008707046508789062, -0.0008144378662109375, -0.0007581710815429688, -0.000701904296875, -0.0006456375122070312, -0.0005893707275390625, -0.0005331039428710938, -0.000476837158203125, -0.00042057037353515625, -0.0003643035888671875, -0.00030803680419921875, -0.00025177001953125, -0.00019550323486328125, -0.0001392364501953125, -8.296966552734375e-05, -2.6702880859375e-05, 2.956390380859375e-05, 8.58306884765625e-05, 0.00014209747314453125, 0.0001983642578125, 0.00025463104248046875, 0.0003108978271484375, 0.00036716461181640625, 0.000423431396484375, 0.00047969818115234375, 0.0005359649658203125, 0.0005922317504882812, 0.00064849853515625, 0.0007047653198242188, 0.0007610321044921875, 0.0008172988891601562, 0.000873565673828125, 0.0009298324584960938, 0.0009860992431640625, 0.0010423660278320312, 0.0010986328125, 0.0011548995971679688, 0.0012111663818359375, 0.0012674331665039062, 0.001323699951171875, 0.0013799667358398438, 0.0014362335205078125, 0.0014925003051757812, 0.00154876708984375, 0.0016050338745117188, 0.0016613006591796875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 5.0, 5.0, 17.0, 34.0, 35.0, 68.0, 132.0, 246.0, 491.0, 1212.0, 3422.0, 16476.0, 235279.0, 744876.0, 37456.0, 5662.0, 1707.0, 679.0, 345.0, 158.0, 80.0, 65.0, 29.0, 21.0, 11.0, 7.0, 3.0, 4.0, 8.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.640625, -12.2813720703125, -11.922119140625, -11.5628662109375, -11.20361328125, -10.8443603515625, -10.485107421875, -10.1258544921875, -9.7666015625, -9.4073486328125, -9.048095703125, -8.6888427734375, -8.32958984375, -7.9703369140625, -7.611083984375, -7.2518310546875, -6.892578125, -6.5333251953125, -6.174072265625, -5.8148193359375, -5.45556640625, -5.0963134765625, -4.737060546875, -4.3778076171875, -4.0185546875, -3.6593017578125, -3.300048828125, -2.9407958984375, -2.58154296875, -2.2222900390625, -1.863037109375, -1.5037841796875, -1.14453125, -0.7852783203125, -0.426025390625, -0.0667724609375, 0.29248046875, 0.6517333984375, 1.010986328125, 1.3702392578125, 1.7294921875, 2.0887451171875, 2.447998046875, 2.8072509765625, 3.16650390625, 3.5257568359375, 3.885009765625, 4.2442626953125, 4.603515625, 4.9627685546875, 5.322021484375, 5.6812744140625, 6.04052734375, 6.3997802734375, 6.759033203125, 7.1182861328125, 7.4775390625, 7.8367919921875, 8.196044921875, 8.5552978515625, 8.91455078125, 9.2738037109375, 9.633056640625, 9.9923095703125, 10.3515625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 11.0, 1.0, 6.0, 18.0, 22.0, 20.0, 48.0, 70.0, 109.0, 197.0, 175.0, 127.0, 55.0, 43.0, 29.0, 21.0, 15.0, 11.0, 7.0, 9.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.946044921875, -7.68896484375, -7.431884765625, -7.1748046875, -6.917724609375, -6.66064453125, -6.403564453125, -6.146484375, -5.889404296875, -5.63232421875, -5.375244140625, -5.1181640625, -4.861083984375, -4.60400390625, -4.346923828125, -4.08984375, -3.832763671875, -3.57568359375, -3.318603515625, -3.0615234375, -2.804443359375, -2.54736328125, -2.290283203125, -2.033203125, -1.776123046875, -1.51904296875, -1.261962890625, -1.0048828125, -0.747802734375, -0.49072265625, -0.233642578125, 0.0234375, 0.280517578125, 0.53759765625, 0.794677734375, 1.0517578125, 1.308837890625, 1.56591796875, 1.822998046875, 2.080078125, 2.337158203125, 2.59423828125, 2.851318359375, 3.1083984375, 3.365478515625, 3.62255859375, 3.879638671875, 4.13671875, 4.393798828125, 4.65087890625, 4.907958984375, 5.1650390625, 5.422119140625, 5.67919921875, 5.936279296875, 6.193359375, 6.450439453125, 6.70751953125, 6.964599609375, 7.2216796875, 7.478759765625, 7.73583984375, 7.992919921875, 8.25]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 12.0, 19.0, 35.0, 68.0, 101.0, 165.0, 180.0, 147.0, 114.0, 70.0, 40.0, 26.0, 11.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.69821548461914, -34.01953887939453, -31.34086036682129, -28.662181854248047, -25.983505249023438, -23.304826736450195, -20.626148223876953, -17.947471618652344, -15.268793106079102, -12.590115547180176, -9.91143798828125, -7.232759475708008, -4.554081916809082, -1.8754043579101562, 0.8032741546630859, 3.4819507598876953, 6.1606292724609375, 8.839306831359863, 11.517984390258789, 14.196662902832031, 16.87533950805664, 19.554018020629883, 22.232696533203125, 24.911373138427734, 27.590051651000977, 30.26873016357422, 32.94740676879883, 35.62608337402344, 38.30476379394531, 40.98344039916992, 43.66211700439453, 46.340797424316406, 49.01947784423828, 51.69815444946289, 54.376834869384766, 57.055511474609375, 59.734188079833984, 62.412864685058594, 65.09154510498047, 67.77021789550781, 70.44889831542969, 73.12757873535156, 75.8062515258789, 78.48493194580078, 81.16361236572266, 83.84228515625, 86.52096557617188, 89.19964599609375, 91.87832641601562, 94.5570068359375, 97.23567962646484, 99.91436004638672, 102.5930404663086, 105.27171325683594, 107.95039367675781, 110.62907409667969, 113.30774688720703, 115.9864273071289, 118.66510009765625, 121.34378051757812, 124.0224609375, 126.70113372802734, 129.37982177734375, 132.05848693847656, 134.73716735839844]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 12.0, 14.0, 18.0, 18.0, 15.0, 24.0, 26.0, 27.0, 21.0, 33.0, 52.0, 34.0, 48.0, 39.0, 53.0, 51.0, 38.0, 51.0, 43.0, 43.0, 53.0, 41.0, 33.0, 30.0, 21.0, 22.0, 25.0, 27.0, 15.0, 9.0, 10.0, 10.0, 8.0, 5.0, 4.0, 6.0, 3.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.68611526489258, -39.48493957519531, -38.28376770019531, -37.08259201049805, -35.88142013549805, -34.68024444580078, -33.47907257080078, -32.277896881103516, -31.076723098754883, -29.87554931640625, -28.674375534057617, -27.473201751708984, -26.27202606201172, -25.07085418701172, -23.869678497314453, -22.66850471496582, -21.467330932617188, -20.266157150268555, -19.064983367919922, -17.86380958557129, -16.662635803222656, -15.461461067199707, -14.260286331176758, -13.059112548828125, -11.857938766479492, -10.65676498413086, -9.455591201782227, -8.254416465759277, -7.0532426834106445, -5.852068901062012, -4.650894641876221, -3.4497203826904297, -2.2485504150390625, -1.0473763942718506, 0.15379762649536133, 1.3549716472625732, 2.556145668029785, 3.757319450378418, 4.958493709564209, 6.15966796875, 7.360841751098633, 8.562015533447266, 9.763189315795898, 10.964364051818848, 12.16553783416748, 13.366711616516113, 14.567886352539062, 15.769060134887695, 16.970233917236328, 18.17140769958496, 19.372581481933594, 20.573755264282227, 21.77492904663086, 22.976104736328125, 24.177278518676758, 25.37845230102539, 26.579626083374023, 27.780799865722656, 28.98197364807129, 30.183147430419922, 31.384323120117188, 32.58549499511719, 33.78667068481445, 34.98784637451172, 36.18901824951172]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 10.0, 15.0, 31.0, 26.0, 50.0, 77.0, 147.0, 200.0, 409.0, 799.0, 1540.0, 3260.0, 7400.0, 17449.0, 47226.0, 178921.0, 3079218.0, 701355.0, 101387.0, 31339.0, 12455.0, 5408.0, 2635.0, 1275.0, 675.0, 355.0, 211.0, 135.0, 96.0, 50.0, 38.0, 29.0, 18.0, 10.0, 13.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.6099853515625, -5.415283203125, -5.2205810546875, -5.02587890625, -4.8311767578125, -4.636474609375, -4.4417724609375, -4.2470703125, -4.0523681640625, -3.857666015625, -3.6629638671875, -3.46826171875, -3.2735595703125, -3.078857421875, -2.8841552734375, -2.689453125, -2.4947509765625, -2.300048828125, -2.1053466796875, -1.91064453125, -1.7159423828125, -1.521240234375, -1.3265380859375, -1.1318359375, -0.9371337890625, -0.742431640625, -0.5477294921875, -0.35302734375, -0.1583251953125, 0.036376953125, 0.2310791015625, 0.42578125, 0.6204833984375, 0.815185546875, 1.0098876953125, 1.20458984375, 1.3992919921875, 1.593994140625, 1.7886962890625, 1.9833984375, 2.1781005859375, 2.372802734375, 2.5675048828125, 2.76220703125, 2.9569091796875, 3.151611328125, 3.3463134765625, 3.541015625, 3.7357177734375, 3.930419921875, 4.1251220703125, 4.31982421875, 4.5145263671875, 4.709228515625, 4.9039306640625, 5.0986328125, 5.2933349609375, 5.488037109375, 5.6827392578125, 5.87744140625, 6.0721435546875, 6.266845703125, 6.4615478515625, 6.65625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 7.0, 8.0, 14.0, 13.0, 13.0, 21.0, 21.0, 23.0, 24.0, 42.0, 28.0, 36.0, 47.0, 43.0, 46.0, 58.0, 35.0, 38.0, 45.0, 45.0, 40.0, 45.0, 33.0, 32.0, 26.0, 26.0, 24.0, 20.0, 27.0, 16.0, 18.0, 15.0, 14.0, 13.0, 5.0, 5.0, 7.0, 7.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1845703125, -1.1458282470703125, -1.107086181640625, -1.0683441162109375, -1.02960205078125, -0.9908599853515625, -0.952117919921875, -0.9133758544921875, -0.8746337890625, -0.8358917236328125, -0.797149658203125, -0.7584075927734375, -0.71966552734375, -0.6809234619140625, -0.642181396484375, -0.6034393310546875, -0.564697265625, -0.5259552001953125, -0.487213134765625, -0.4484710693359375, -0.40972900390625, -0.3709869384765625, -0.332244873046875, -0.2935028076171875, -0.2547607421875, -0.2160186767578125, -0.177276611328125, -0.1385345458984375, -0.09979248046875, -0.0610504150390625, -0.022308349609375, 0.0164337158203125, 0.05517578125, 0.0939178466796875, 0.132659912109375, 0.1714019775390625, 0.21014404296875, 0.2488861083984375, 0.287628173828125, 0.3263702392578125, 0.3651123046875, 0.4038543701171875, 0.442596435546875, 0.4813385009765625, 0.52008056640625, 0.5588226318359375, 0.597564697265625, 0.6363067626953125, 0.675048828125, 0.7137908935546875, 0.752532958984375, 0.7912750244140625, 0.83001708984375, 0.8687591552734375, 0.907501220703125, 0.9462432861328125, 0.9849853515625, 1.0237274169921875, 1.062469482421875, 1.1012115478515625, 1.13995361328125, 1.1786956787109375, 1.217437744140625, 1.2561798095703125, 1.294921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 13.0, 11.0, 12.0, 20.0, 12.0, 31.0, 33.0, 38.0, 60.0, 110.0, 127.0, 189.0, 231.0, 397.0, 653.0, 1101.0, 2111.0, 4765.0, 12151.0, 38342.0, 168976.0, 2777199.0, 1027755.0, 113100.0, 28645.0, 9690.0, 3974.0, 1767.0, 1039.0, 584.0, 360.0, 214.0, 152.0, 122.0, 90.0, 51.0, 50.0, 36.0, 10.0, 22.0, 17.0, 6.0, 5.0, 5.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7734375, -7.5133056640625, -7.253173828125, -6.9930419921875, -6.73291015625, -6.4727783203125, -6.212646484375, -5.9525146484375, -5.6923828125, -5.4322509765625, -5.172119140625, -4.9119873046875, -4.65185546875, -4.3917236328125, -4.131591796875, -3.8714599609375, -3.611328125, -3.3511962890625, -3.091064453125, -2.8309326171875, -2.57080078125, -2.3106689453125, -2.050537109375, -1.7904052734375, -1.5302734375, -1.2701416015625, -1.010009765625, -0.7498779296875, -0.48974609375, -0.2296142578125, 0.030517578125, 0.2906494140625, 0.55078125, 0.8109130859375, 1.071044921875, 1.3311767578125, 1.59130859375, 1.8514404296875, 2.111572265625, 2.3717041015625, 2.6318359375, 2.8919677734375, 3.152099609375, 3.4122314453125, 3.67236328125, 3.9324951171875, 4.192626953125, 4.4527587890625, 4.712890625, 4.9730224609375, 5.233154296875, 5.4932861328125, 5.75341796875, 6.0135498046875, 6.273681640625, 6.5338134765625, 6.7939453125, 7.0540771484375, 7.314208984375, 7.5743408203125, 7.83447265625, 8.0946044921875, 8.354736328125, 8.6148681640625, 8.875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 9.0, 8.0, 6.0, 26.0, 38.0, 46.0, 93.0, 179.0, 438.0, 1805.0, 832.0, 284.0, 138.0, 70.0, 34.0, 26.0, 13.0, 8.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.44720458984375, -7.2498779296875, -7.05255126953125, -6.855224609375, -6.65789794921875, -6.4605712890625, -6.26324462890625, -6.06591796875, -5.86859130859375, -5.6712646484375, -5.47393798828125, -5.276611328125, -5.07928466796875, -4.8819580078125, -4.68463134765625, -4.4873046875, -4.28997802734375, -4.0926513671875, -3.89532470703125, -3.697998046875, -3.50067138671875, -3.3033447265625, -3.10601806640625, -2.90869140625, -2.71136474609375, -2.5140380859375, -2.31671142578125, -2.119384765625, -1.92205810546875, -1.7247314453125, -1.52740478515625, -1.330078125, -1.13275146484375, -0.9354248046875, -0.73809814453125, -0.540771484375, -0.34344482421875, -0.1461181640625, 0.05120849609375, 0.24853515625, 0.44586181640625, 0.6431884765625, 0.84051513671875, 1.037841796875, 1.23516845703125, 1.4324951171875, 1.62982177734375, 1.8271484375, 2.02447509765625, 2.2218017578125, 2.41912841796875, 2.616455078125, 2.81378173828125, 3.0111083984375, 3.20843505859375, 3.40576171875, 3.60308837890625, 3.8004150390625, 3.99774169921875, 4.195068359375, 4.39239501953125, 4.5897216796875, 4.78704833984375, 4.984375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 15.0, 104.0, 304.0, 395.0, 149.0, 32.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.40753173828125, -133.38243103027344, -130.35731506347656, -127.33221435546875, -124.3071060180664, -121.28199768066406, -118.25688934326172, -115.23178100585938, -112.20667266845703, -109.18156433105469, -106.15645599365234, -103.13134765625, -100.10624694824219, -97.08113861083984, -94.0560302734375, -91.03092193603516, -88.00581359863281, -84.98070526123047, -81.95559692382812, -78.93049621582031, -75.90538787841797, -72.88027954101562, -69.85517120361328, -66.83006286621094, -63.804962158203125, -60.77985382080078, -57.7547492980957, -54.72964096069336, -51.704532623291016, -48.67942810058594, -45.654319763183594, -42.62921142578125, -39.60410690307617, -36.57899856567383, -33.55389404296875, -30.528785705566406, -27.503677368164062, -24.47857093811035, -21.45346450805664, -18.428356170654297, -15.403249740600586, -12.378142356872559, -9.353034973144531, -6.32792854309082, -3.302821159362793, -0.2777137756347656, 2.7473926544189453, 5.772500991821289, 8.797607421875, 11.822714805603027, 14.847822189331055, 17.872928619384766, 20.89803695678711, 23.92314338684082, 26.94824981689453, 29.973358154296875, 32.99846649169922, 36.02357482910156, 39.04867935180664, 42.073787689208984, 45.09889602661133, 48.124000549316406, 51.14910888671875, 54.174217224121094, 57.19932174682617]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 8.0, 10.0, 17.0, 18.0, 14.0, 25.0, 30.0, 30.0, 40.0, 45.0, 41.0, 59.0, 56.0, 48.0, 64.0, 57.0, 58.0, 47.0, 36.0, 45.0, 51.0, 32.0, 31.0, 34.0, 25.0, 9.0, 23.0, 9.0, 10.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.324492454528809, -12.765583038330078, -12.206673622131348, -11.647764205932617, -11.088855743408203, -10.529945373535156, -9.971036911010742, -9.412127494812012, -8.853218078613281, -8.29430866241455, -7.73539924621582, -7.176490306854248, -6.617580890655518, -6.058671474456787, -5.499762535095215, -4.940853118896484, -4.381943702697754, -3.8230342864990234, -3.264125108718872, -2.7052159309387207, -2.1463065147399902, -1.5873970985412598, -1.0284879207611084, -0.46957874298095703, 0.08933067321777344, 0.6482399702072144, 1.2071492671966553, 1.7660585641860962, 2.324967861175537, 2.8838772773742676, 3.442786455154419, 4.00169563293457, 4.560604095458984, 5.119513511657715, 5.678422927856445, 6.237331867218018, 6.796241283416748, 7.3551506996154785, 7.914059638977051, 8.472969055175781, 9.031878471374512, 9.590787887573242, 10.149697303771973, 10.708606719970703, 11.267515182495117, 11.826425552368164, 12.385334014892578, 12.944243431091309, 13.503152847290039, 14.06206226348877, 14.6209716796875, 15.17988109588623, 15.738790512084961, 16.297698974609375, 16.856609344482422, 17.415517807006836, 17.97442626953125, 18.533334732055664, 19.09224510192871, 19.651153564453125, 20.210063934326172, 20.768972396850586, 21.327882766723633, 21.886791229248047, 22.445701599121094]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 11.0, 9.0, 20.0, 37.0, 47.0, 57.0, 104.0, 146.0, 231.0, 400.0, 583.0, 953.0, 1602.0, 2751.0, 4760.0, 7821.0, 14287.0, 25142.0, 46109.0, 84653.0, 152210.0, 224717.0, 203884.0, 124565.0, 68114.0, 37084.0, 20520.0, 11515.0, 6574.0, 3791.0, 2233.0, 1361.0, 852.0, 515.0, 303.0, 200.0, 133.0, 80.0, 62.0, 36.0, 29.0, 18.0, 9.0, 3.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.912109375, -2.814453125, -2.716796875, -2.619140625, -2.521484375, -2.423828125, -2.326171875, -2.228515625, -2.130859375, -2.033203125, -1.935546875, -1.837890625, -1.740234375, -1.642578125, -1.544921875, -1.447265625, -1.349609375, -1.251953125, -1.154296875, -1.056640625, -0.958984375, -0.861328125, -0.763671875, -0.666015625, -0.568359375, -0.470703125, -0.373046875, -0.275390625, -0.177734375, -0.080078125, 0.017578125, 0.115234375, 0.212890625, 0.310546875, 0.408203125, 0.505859375, 0.603515625, 0.701171875, 0.798828125, 0.896484375, 0.994140625, 1.091796875, 1.189453125, 1.287109375, 1.384765625, 1.482421875, 1.580078125, 1.677734375, 1.775390625, 1.873046875, 1.970703125, 2.068359375, 2.166015625, 2.263671875, 2.361328125, 2.458984375, 2.556640625, 2.654296875, 2.751953125, 2.849609375, 2.947265625, 3.044921875, 3.142578125, 3.240234375, 3.337890625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 6.0, 3.0, 9.0, 11.0, 24.0, 15.0, 16.0, 16.0, 29.0, 21.0, 46.0, 33.0, 37.0, 51.0, 57.0, 52.0, 59.0, 59.0, 56.0, 45.0, 44.0, 36.0, 35.0, 30.0, 33.0, 35.0, 20.0, 19.0, 22.0, 14.0, 17.0, 12.0, 7.0, 11.0, 5.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6416015625, -1.5913238525390625, -1.541046142578125, -1.4907684326171875, -1.44049072265625, -1.3902130126953125, -1.339935302734375, -1.2896575927734375, -1.2393798828125, -1.1891021728515625, -1.138824462890625, -1.0885467529296875, -1.03826904296875, -0.9879913330078125, -0.937713623046875, -0.8874359130859375, -0.837158203125, -0.7868804931640625, -0.736602783203125, -0.6863250732421875, -0.63604736328125, -0.5857696533203125, -0.535491943359375, -0.4852142333984375, -0.4349365234375, -0.3846588134765625, -0.334381103515625, -0.2841033935546875, -0.23382568359375, -0.1835479736328125, -0.133270263671875, -0.0829925537109375, -0.03271484375, 0.0175628662109375, 0.067840576171875, 0.1181182861328125, 0.16839599609375, 0.2186737060546875, 0.268951416015625, 0.3192291259765625, 0.3695068359375, 0.4197845458984375, 0.470062255859375, 0.5203399658203125, 0.57061767578125, 0.6208953857421875, 0.671173095703125, 0.7214508056640625, 0.771728515625, 0.8220062255859375, 0.872283935546875, 0.9225616455078125, 0.97283935546875, 1.0231170654296875, 1.073394775390625, 1.1236724853515625, 1.1739501953125, 1.2242279052734375, 1.274505615234375, 1.3247833251953125, 1.37506103515625, 1.4253387451171875, 1.475616455078125, 1.5258941650390625, 1.576171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 9.0, 8.0, 7.0, 7.0, 13.0, 9.0, 14.0, 32.0, 27.0, 56.0, 71.0, 64.0, 99.0, 155.0, 176.0, 268.0, 337.0, 547.0, 839.0, 1510.0, 3197.0, 7941.0, 22469.0, 73299.0, 250638.0, 436368.0, 172537.0, 49961.0, 16098.0, 5629.0, 2503.0, 1250.0, 706.0, 436.0, 343.0, 232.0, 153.0, 143.0, 94.0, 67.0, 44.0, 44.0, 31.0, 36.0, 25.0, 20.0, 16.0, 9.0, 9.0, 3.0, 6.0, 4.0, 3.0, 1.0], "bins": [-6.8515625, -6.65771484375, -6.4638671875, -6.27001953125, -6.076171875, -5.88232421875, -5.6884765625, -5.49462890625, -5.30078125, -5.10693359375, -4.9130859375, -4.71923828125, -4.525390625, -4.33154296875, -4.1376953125, -3.94384765625, -3.75, -3.55615234375, -3.3623046875, -3.16845703125, -2.974609375, -2.78076171875, -2.5869140625, -2.39306640625, -2.19921875, -2.00537109375, -1.8115234375, -1.61767578125, -1.423828125, -1.22998046875, -1.0361328125, -0.84228515625, -0.6484375, -0.45458984375, -0.2607421875, -0.06689453125, 0.126953125, 0.32080078125, 0.5146484375, 0.70849609375, 0.90234375, 1.09619140625, 1.2900390625, 1.48388671875, 1.677734375, 1.87158203125, 2.0654296875, 2.25927734375, 2.453125, 2.64697265625, 2.8408203125, 3.03466796875, 3.228515625, 3.42236328125, 3.6162109375, 3.81005859375, 4.00390625, 4.19775390625, 4.3916015625, 4.58544921875, 4.779296875, 4.97314453125, 5.1669921875, 5.36083984375, 5.5546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 10.0, 7.0, 13.0, 9.0, 7.0, 10.0, 10.0, 15.0, 21.0, 25.0, 22.0, 23.0, 26.0, 26.0, 35.0, 34.0, 36.0, 40.0, 31.0, 43.0, 46.0, 39.0, 51.0, 39.0, 36.0, 34.0, 35.0, 36.0, 21.0, 26.0, 35.0, 12.0, 17.0, 18.0, 15.0, 18.0, 16.0, 12.0, 7.0, 3.0, 8.0, 5.0, 7.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-8.015625, -7.77813720703125, -7.5406494140625, -7.30316162109375, -7.065673828125, -6.82818603515625, -6.5906982421875, -6.35321044921875, -6.11572265625, -5.87823486328125, -5.6407470703125, -5.40325927734375, -5.165771484375, -4.92828369140625, -4.6907958984375, -4.45330810546875, -4.2158203125, -3.97833251953125, -3.7408447265625, -3.50335693359375, -3.265869140625, -3.02838134765625, -2.7908935546875, -2.55340576171875, -2.31591796875, -2.07843017578125, -1.8409423828125, -1.60345458984375, -1.365966796875, -1.12847900390625, -0.8909912109375, -0.65350341796875, -0.416015625, -0.17852783203125, 0.0589599609375, 0.29644775390625, 0.533935546875, 0.77142333984375, 1.0089111328125, 1.24639892578125, 1.48388671875, 1.72137451171875, 1.9588623046875, 2.19635009765625, 2.433837890625, 2.67132568359375, 2.9088134765625, 3.14630126953125, 3.3837890625, 3.62127685546875, 3.8587646484375, 4.09625244140625, 4.333740234375, 4.57122802734375, 4.8087158203125, 5.04620361328125, 5.28369140625, 5.52117919921875, 5.7586669921875, 5.99615478515625, 6.233642578125, 6.47113037109375, 6.7086181640625, 6.94610595703125, 7.18359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 11.0, 17.0, 18.0, 24.0, 40.0, 64.0, 107.0, 148.0, 337.0, 657.0, 1429.0, 4095.0, 21730.0, 526168.0, 466957.0, 20081.0, 3933.0, 1400.0, 577.0, 332.0, 148.0, 97.0, 60.0, 32.0, 28.0, 16.0, 11.0, 13.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8828125, -14.490966796875, -14.09912109375, -13.707275390625, -13.3154296875, -12.923583984375, -12.53173828125, -12.139892578125, -11.748046875, -11.356201171875, -10.96435546875, -10.572509765625, -10.1806640625, -9.788818359375, -9.39697265625, -9.005126953125, -8.61328125, -8.221435546875, -7.82958984375, -7.437744140625, -7.0458984375, -6.654052734375, -6.26220703125, -5.870361328125, -5.478515625, -5.086669921875, -4.69482421875, -4.302978515625, -3.9111328125, -3.519287109375, -3.12744140625, -2.735595703125, -2.34375, -1.951904296875, -1.56005859375, -1.168212890625, -0.7763671875, -0.384521484375, 0.00732421875, 0.399169921875, 0.791015625, 1.182861328125, 1.57470703125, 1.966552734375, 2.3583984375, 2.750244140625, 3.14208984375, 3.533935546875, 3.92578125, 4.317626953125, 4.70947265625, 5.101318359375, 5.4931640625, 5.885009765625, 6.27685546875, 6.668701171875, 7.060546875, 7.452392578125, 7.84423828125, 8.236083984375, 8.6279296875, 9.019775390625, 9.41162109375, 9.803466796875, 10.1953125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 23.0, 30.0, 103.0, 258.0, 308.0, 143.0, 65.0, 34.0, 20.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00382232666015625, -0.0037223100662231445, -0.003622293472290039, -0.0035222768783569336, -0.003422260284423828, -0.0033222436904907227, -0.003222227096557617, -0.0031222105026245117, -0.0030221939086914062, -0.0029221773147583008, -0.0028221607208251953, -0.00272214412689209, -0.0026221275329589844, -0.002522110939025879, -0.0024220943450927734, -0.002322077751159668, -0.0022220611572265625, -0.002122044563293457, -0.0020220279693603516, -0.001922011375427246, -0.0018219947814941406, -0.0017219781875610352, -0.0016219615936279297, -0.0015219449996948242, -0.0014219284057617188, -0.0013219118118286133, -0.0012218952178955078, -0.0011218786239624023, -0.0010218620300292969, -0.0009218454360961914, -0.0008218288421630859, -0.0007218122482299805, -0.000621795654296875, -0.0005217790603637695, -0.00042176246643066406, -0.0003217458724975586, -0.00022172927856445312, -0.00012171268463134766, -2.1696090698242188e-05, 7.832050323486328e-05, 0.00017833709716796875, 0.0002783536911010742, 0.0003783702850341797, 0.00047838687896728516, 0.0005784034729003906, 0.0006784200668334961, 0.0007784366607666016, 0.000878453254699707, 0.0009784698486328125, 0.001078486442565918, 0.0011785030364990234, 0.001278519630432129, 0.0013785362243652344, 0.0014785528182983398, 0.0015785694122314453, 0.0016785860061645508, 0.0017786026000976562, 0.0018786191940307617, 0.001978635787963867, 0.0020786523818969727, 0.002178668975830078, 0.0022786855697631836, 0.002378702163696289, 0.0024787187576293945, 0.0025787353515625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 16.0, 21.0, 37.0, 40.0, 70.0, 130.0, 202.0, 365.0, 654.0, 1473.0, 3816.0, 12446.0, 83258.0, 712263.0, 202432.0, 21842.0, 5583.0, 1970.0, 865.0, 418.0, 259.0, 145.0, 72.0, 53.0, 31.0, 24.0, 15.0, 14.0, 8.0, 1.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2734375, -8.01220703125, -7.7509765625, -7.48974609375, -7.228515625, -6.96728515625, -6.7060546875, -6.44482421875, -6.18359375, -5.92236328125, -5.6611328125, -5.39990234375, -5.138671875, -4.87744140625, -4.6162109375, -4.35498046875, -4.09375, -3.83251953125, -3.5712890625, -3.31005859375, -3.048828125, -2.78759765625, -2.5263671875, -2.26513671875, -2.00390625, -1.74267578125, -1.4814453125, -1.22021484375, -0.958984375, -0.69775390625, -0.4365234375, -0.17529296875, 0.0859375, 0.34716796875, 0.6083984375, 0.86962890625, 1.130859375, 1.39208984375, 1.6533203125, 1.91455078125, 2.17578125, 2.43701171875, 2.6982421875, 2.95947265625, 3.220703125, 3.48193359375, 3.7431640625, 4.00439453125, 4.265625, 4.52685546875, 4.7880859375, 5.04931640625, 5.310546875, 5.57177734375, 5.8330078125, 6.09423828125, 6.35546875, 6.61669921875, 6.8779296875, 7.13916015625, 7.400390625, 7.66162109375, 7.9228515625, 8.18408203125, 8.4453125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 1.0, 6.0, 7.0, 9.0, 8.0, 16.0, 27.0, 25.0, 48.0, 61.0, 100.0, 126.0, 120.0, 126.0, 96.0, 58.0, 56.0, 29.0, 14.0, 18.0, 17.0, 12.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21875, -7.00946044921875, -6.8001708984375, -6.59088134765625, -6.381591796875, -6.17230224609375, -5.9630126953125, -5.75372314453125, -5.54443359375, -5.33514404296875, -5.1258544921875, -4.91656494140625, -4.707275390625, -4.49798583984375, -4.2886962890625, -4.07940673828125, -3.8701171875, -3.66082763671875, -3.4515380859375, -3.24224853515625, -3.032958984375, -2.82366943359375, -2.6143798828125, -2.40509033203125, -2.19580078125, -1.98651123046875, -1.7772216796875, -1.56793212890625, -1.358642578125, -1.14935302734375, -0.9400634765625, -0.73077392578125, -0.521484375, -0.31219482421875, -0.1029052734375, 0.10638427734375, 0.315673828125, 0.52496337890625, 0.7342529296875, 0.94354248046875, 1.15283203125, 1.36212158203125, 1.5714111328125, 1.78070068359375, 1.989990234375, 2.19927978515625, 2.4085693359375, 2.61785888671875, 2.8271484375, 3.03643798828125, 3.2457275390625, 3.45501708984375, 3.664306640625, 3.87359619140625, 4.0828857421875, 4.29217529296875, 4.50146484375, 4.71075439453125, 4.9200439453125, 5.12933349609375, 5.338623046875, 5.54791259765625, 5.7572021484375, 5.96649169921875, 6.17578125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 19.0, 33.0, 73.0, 99.0, 151.0, 171.0, 162.0, 114.0, 82.0, 40.0, 26.0, 10.0, 6.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.50238800048828, -82.61936950683594, -79.7363510131836, -76.85333251953125, -73.97032165527344, -71.0873031616211, -68.20428466796875, -65.3212661743164, -62.43824768066406, -59.55522918701172, -56.672210693359375, -53.7891960144043, -50.90617752075195, -48.02315902709961, -45.14014434814453, -42.25712585449219, -39.374107360839844, -36.4910888671875, -33.608070373535156, -30.725055694580078, -27.842037200927734, -24.95901870727539, -22.07600212097168, -19.19298553466797, -16.309967041015625, -13.426949501037598, -10.54393196105957, -7.660914421081543, -4.777896881103516, -1.8948793411254883, 0.9881381988525391, 3.87115478515625, 6.754180908203125, 9.637198448181152, 12.52021598815918, 15.403233528137207, 18.286251068115234, 21.169269561767578, 24.05228614807129, 26.935302734375, 29.818321228027344, 32.70133972167969, 35.58435821533203, 38.46737289428711, 41.35039138793945, 44.2334098815918, 47.116424560546875, 49.99944305419922, 52.88246154785156, 55.765480041503906, 58.64849853515625, 61.53151321411133, 64.41453552246094, 67.29754638671875, 70.1805648803711, 73.06358337402344, 75.94660186767578, 78.82962036132812, 81.71263885498047, 84.59565734863281, 87.47866821289062, 90.36168670654297, 93.24470520019531, 96.12772369384766, 99.0107421875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 13.0, 6.0, 5.0, 15.0, 10.0, 16.0, 21.0, 27.0, 23.0, 28.0, 28.0, 44.0, 46.0, 30.0, 44.0, 47.0, 47.0, 53.0, 45.0, 45.0, 63.0, 41.0, 36.0, 24.0, 27.0, 38.0, 37.0, 25.0, 24.0, 15.0, 17.0, 11.0, 11.0, 9.0, 8.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.44374084472656, -41.995845794677734, -40.54794692993164, -39.10005187988281, -37.65215301513672, -36.20425796508789, -34.75636291503906, -33.30846405029297, -31.860567092895508, -30.412670135498047, -28.964773178100586, -27.516876220703125, -26.068981170654297, -24.621082305908203, -23.173187255859375, -21.725290298461914, -20.277393341064453, -18.829496383666992, -17.38159942626953, -15.933703422546387, -14.485806465148926, -13.037909507751465, -11.59001350402832, -10.14211654663086, -8.694219589233398, -7.2463226318359375, -5.798426151275635, -4.350529670715332, -2.902632713317871, -1.4547357559204102, -0.006839752197265625, 1.4410572052001953, 2.8889541625976562, 4.336851119995117, 5.78474760055542, 7.232644081115723, 8.680541038513184, 10.128437995910645, 11.576333999633789, 13.02423095703125, 14.472127914428711, 15.920024871826172, 17.367921829223633, 18.815818786621094, 20.263713836669922, 21.711612701416016, 23.159507751464844, 24.607404708862305, 26.055301666259766, 27.503198623657227, 28.951095581054688, 30.398990631103516, 31.84688949584961, 33.29478454589844, 34.74268341064453, 36.19057846069336, 37.63847351074219, 39.086368560791016, 40.53426742553711, 41.98216247558594, 43.43006134033203, 44.87795639038086, 46.32585144042969, 47.77375030517578, 49.221649169921875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 8.0, 14.0, 10.0, 22.0, 28.0, 62.0, 70.0, 129.0, 202.0, 322.0, 540.0, 931.0, 1626.0, 3165.0, 6951.0, 19925.0, 150253.0, 3949346.0, 40042.0, 11049.0, 4445.0, 2125.0, 1199.0, 671.0, 413.0, 255.0, 172.0, 110.0, 70.0, 38.0, 26.0, 20.0, 11.0, 10.0, 9.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3671875, -10.0242919921875, -9.681396484375, -9.3385009765625, -8.99560546875, -8.6527099609375, -8.309814453125, -7.9669189453125, -7.6240234375, -7.2811279296875, -6.938232421875, -6.5953369140625, -6.25244140625, -5.9095458984375, -5.566650390625, -5.2237548828125, -4.880859375, -4.5379638671875, -4.195068359375, -3.8521728515625, -3.50927734375, -3.1663818359375, -2.823486328125, -2.4805908203125, -2.1376953125, -1.7947998046875, -1.451904296875, -1.1090087890625, -0.76611328125, -0.4232177734375, -0.080322265625, 0.2625732421875, 0.60546875, 0.9483642578125, 1.291259765625, 1.6341552734375, 1.97705078125, 2.3199462890625, 2.662841796875, 3.0057373046875, 3.3486328125, 3.6915283203125, 4.034423828125, 4.3773193359375, 4.72021484375, 5.0631103515625, 5.406005859375, 5.7489013671875, 6.091796875, 6.4346923828125, 6.777587890625, 7.1204833984375, 7.46337890625, 7.8062744140625, 8.149169921875, 8.4920654296875, 8.8349609375, 9.1778564453125, 9.520751953125, 9.8636474609375, 10.20654296875, 10.5494384765625, 10.892333984375, 11.2352294921875, 11.578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 9.0, 7.0, 9.0, 11.0, 10.0, 16.0, 22.0, 19.0, 30.0, 23.0, 29.0, 35.0, 49.0, 46.0, 44.0, 46.0, 50.0, 46.0, 36.0, 39.0, 45.0, 41.0, 48.0, 32.0, 31.0, 23.0, 29.0, 28.0, 22.0, 16.0, 12.0, 14.0, 17.0, 9.0, 11.0, 6.0, 4.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.583984375, -1.5329742431640625, -1.481964111328125, -1.4309539794921875, -1.37994384765625, -1.3289337158203125, -1.277923583984375, -1.2269134521484375, -1.1759033203125, -1.1248931884765625, -1.073883056640625, -1.0228729248046875, -0.97186279296875, -0.9208526611328125, -0.869842529296875, -0.8188323974609375, -0.767822265625, -0.7168121337890625, -0.665802001953125, -0.6147918701171875, -0.56378173828125, -0.5127716064453125, -0.461761474609375, -0.4107513427734375, -0.3597412109375, -0.3087310791015625, -0.257720947265625, -0.2067108154296875, -0.15570068359375, -0.1046905517578125, -0.053680419921875, -0.0026702880859375, 0.04833984375, 0.0993499755859375, 0.150360107421875, 0.2013702392578125, 0.25238037109375, 0.3033905029296875, 0.354400634765625, 0.4054107666015625, 0.4564208984375, 0.5074310302734375, 0.558441162109375, 0.6094512939453125, 0.66046142578125, 0.7114715576171875, 0.762481689453125, 0.8134918212890625, 0.864501953125, 0.9155120849609375, 0.966522216796875, 1.0175323486328125, 1.06854248046875, 1.1195526123046875, 1.170562744140625, 1.2215728759765625, 1.2725830078125, 1.3235931396484375, 1.374603271484375, 1.4256134033203125, 1.47662353515625, 1.5276336669921875, 1.578643798828125, 1.6296539306640625, 1.6806640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 11.0, 18.0, 29.0, 44.0, 48.0, 71.0, 105.0, 187.0, 303.0, 527.0, 941.0, 2235.0, 6024.0, 22580.0, 3374899.0, 753740.0, 22157.0, 5830.0, 2260.0, 1009.0, 530.0, 252.0, 188.0, 105.0, 61.0, 44.0, 24.0, 19.0, 9.0, 15.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.87109375, -16.2890625, -15.70703125, -15.125, -14.54296875, -13.9609375, -13.37890625, -12.796875, -12.21484375, -11.6328125, -11.05078125, -10.46875, -9.88671875, -9.3046875, -8.72265625, -8.140625, -7.55859375, -6.9765625, -6.39453125, -5.8125, -5.23046875, -4.6484375, -4.06640625, -3.484375, -2.90234375, -2.3203125, -1.73828125, -1.15625, -0.57421875, 0.0078125, 0.58984375, 1.171875, 1.75390625, 2.3359375, 2.91796875, 3.5, 4.08203125, 4.6640625, 5.24609375, 5.828125, 6.41015625, 6.9921875, 7.57421875, 8.15625, 8.73828125, 9.3203125, 9.90234375, 10.484375, 11.06640625, 11.6484375, 12.23046875, 12.8125, 13.39453125, 13.9765625, 14.55859375, 15.140625, 15.72265625, 16.3046875, 16.88671875, 17.46875, 18.05078125, 18.6328125, 19.21484375, 19.796875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 7.0, 13.0, 16.0, 23.0, 33.0, 72.0, 226.0, 3268.0, 214.0, 70.0, 45.0, 18.0, 15.0, 11.0, 3.0, 6.0, 9.0, 5.0, 8.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.203125, -3.117645263671875, -3.03216552734375, -2.946685791015625, -2.8612060546875, -2.775726318359375, -2.69024658203125, -2.604766845703125, -2.519287109375, -2.433807373046875, -2.34832763671875, -2.262847900390625, -2.1773681640625, -2.091888427734375, -2.00640869140625, -1.920928955078125, -1.83544921875, -1.749969482421875, -1.66448974609375, -1.579010009765625, -1.4935302734375, -1.408050537109375, -1.32257080078125, -1.237091064453125, -1.151611328125, -1.066131591796875, -0.98065185546875, -0.895172119140625, -0.8096923828125, -0.724212646484375, -0.63873291015625, -0.553253173828125, -0.4677734375, -0.382293701171875, -0.29681396484375, -0.211334228515625, -0.1258544921875, -0.040374755859375, 0.04510498046875, 0.130584716796875, 0.216064453125, 0.301544189453125, 0.38702392578125, 0.472503662109375, 0.5579833984375, 0.643463134765625, 0.72894287109375, 0.814422607421875, 0.89990234375, 0.985382080078125, 1.07086181640625, 1.156341552734375, 1.2418212890625, 1.327301025390625, 1.41278076171875, 1.498260498046875, 1.583740234375, 1.669219970703125, 1.75469970703125, 1.840179443359375, 1.9256591796875, 2.011138916015625, 2.09661865234375, 2.182098388671875, 2.267578125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 11.0, 22.0, 36.0, 28.0, 83.0, 99.0, 110.0, 99.0, 136.0, 112.0, 83.0, 61.0, 45.0, 28.0, 21.0, 11.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.909124374389648, -8.530203819274902, -8.151283264160156, -7.772363185882568, -7.393442630767822, -7.014522552490234, -6.635601997375488, -6.256681442260742, -5.877760887145996, -5.49884033203125, -5.119920253753662, -4.740999698638916, -4.36207914352417, -3.983158826828003, -3.604238510131836, -3.22531795501709, -2.846397876739502, -2.467477560043335, -2.088557004928589, -1.7096366882324219, -1.3307162523269653, -0.9517958164215088, -0.5728754997253418, -0.1939549446105957, 0.1849653720855713, 0.5638858079910278, 0.9428061842918396, 1.3217265605926514, 1.700646996498108, 2.0795674324035645, 2.4584877490997314, 2.8374083042144775, 3.2163286209106445, 3.5952489376068115, 3.9741694927215576, 4.353089809417725, 4.732010364532471, 5.110930442810059, 5.489850997924805, 5.868771553039551, 6.247692108154297, 6.626612663269043, 7.005532741546631, 7.384453296661377, 7.763373851776123, 8.142293930053711, 8.521214485168457, 8.900135040283203, 9.279054641723633, 9.657975196838379, 10.036895751953125, 10.415815353393555, 10.7947359085083, 11.173656463623047, 11.552577018737793, 11.931497573852539, 12.310418128967285, 12.689338684082031, 13.068259239196777, 13.447179794311523, 13.826099395751953, 14.2050199508667, 14.583940505981445, 14.962861061096191, 15.341781616210938]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 8.0, 12.0, 7.0, 18.0, 23.0, 27.0, 32.0, 30.0, 25.0, 25.0, 37.0, 25.0, 35.0, 40.0, 44.0, 48.0, 31.0, 34.0, 38.0, 54.0, 32.0, 42.0, 36.0, 36.0, 29.0, 30.0, 32.0, 27.0, 25.0, 9.0, 18.0, 23.0, 10.0, 10.0, 14.0, 2.0, 8.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.986153602600098, -4.822961330413818, -4.659769058227539, -4.49657678604126, -4.3333845138549805, -4.170192241668701, -4.006999969482422, -3.8438076972961426, -3.6806154251098633, -3.517423152923584, -3.3542308807373047, -3.1910386085510254, -3.027846336364746, -2.864654064178467, -2.7014617919921875, -2.538269519805908, -2.37507700920105, -2.2118847370147705, -2.048692464828491, -1.885500192642212, -1.7223079204559326, -1.5591156482696533, -1.3959232568740845, -1.2327309846878052, -1.0695387125015259, -0.9063464403152466, -0.7431541681289673, -0.5799618363380432, -0.4167695641517639, -0.2535772919654846, -0.09038496017456055, 0.07280731201171875, 0.23599958419799805, 0.39919185638427734, 0.5623841285705566, 0.7255764603614807, 0.88876873254776, 1.0519609451293945, 1.2151533365249634, 1.3783456087112427, 1.541537880897522, 1.7047301530838013, 1.8679224252700806, 2.0311148166656494, 2.1943070888519287, 2.357499361038208, 2.5206916332244873, 2.6838839054107666, 2.847076177597046, 3.010268449783325, 3.1734607219696045, 3.336652994155884, 3.499845266342163, 3.6630375385284424, 3.826230049133301, 3.98942232131958, 4.152614593505859, 4.315806865692139, 4.478999137878418, 4.642191410064697, 4.805383682250977, 4.968575954437256, 5.131768226623535, 5.2949604988098145, 5.458152770996094]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 0.0, 7.0, 13.0, 14.0, 17.0, 21.0, 23.0, 51.0, 75.0, 149.0, 258.0, 546.0, 1116.0, 2292.0, 5224.0, 11548.0, 25963.0, 60854.0, 146565.0, 291954.0, 274956.0, 130343.0, 53747.0, 23393.0, 10429.0, 4789.0, 2065.0, 982.0, 498.0, 263.0, 150.0, 88.0, 49.0, 40.0, 32.0, 11.0, 7.0, 8.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.23828125, -5.0792236328125, -4.920166015625, -4.7611083984375, -4.60205078125, -4.4429931640625, -4.283935546875, -4.1248779296875, -3.9658203125, -3.8067626953125, -3.647705078125, -3.4886474609375, -3.32958984375, -3.1705322265625, -3.011474609375, -2.8524169921875, -2.693359375, -2.5343017578125, -2.375244140625, -2.2161865234375, -2.05712890625, -1.8980712890625, -1.739013671875, -1.5799560546875, -1.4208984375, -1.2618408203125, -1.102783203125, -0.9437255859375, -0.78466796875, -0.6256103515625, -0.466552734375, -0.3074951171875, -0.1484375, 0.0106201171875, 0.169677734375, 0.3287353515625, 0.48779296875, 0.6468505859375, 0.805908203125, 0.9649658203125, 1.1240234375, 1.2830810546875, 1.442138671875, 1.6011962890625, 1.76025390625, 1.9193115234375, 2.078369140625, 2.2374267578125, 2.396484375, 2.5555419921875, 2.714599609375, 2.8736572265625, 3.03271484375, 3.1917724609375, 3.350830078125, 3.5098876953125, 3.6689453125, 3.8280029296875, 3.987060546875, 4.1461181640625, 4.30517578125, 4.4642333984375, 4.623291015625, 4.7823486328125, 4.94140625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 6.0, 9.0, 9.0, 17.0, 22.0, 22.0, 18.0, 23.0, 32.0, 24.0, 33.0, 41.0, 34.0, 34.0, 34.0, 52.0, 49.0, 46.0, 45.0, 47.0, 41.0, 47.0, 35.0, 40.0, 24.0, 34.0, 23.0, 21.0, 23.0, 20.0, 10.0, 12.0, 14.0, 8.0, 8.0, 4.0, 10.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7626953125, -1.7027740478515625, -1.642852783203125, -1.5829315185546875, -1.52301025390625, -1.4630889892578125, -1.403167724609375, -1.3432464599609375, -1.2833251953125, -1.2234039306640625, -1.163482666015625, -1.1035614013671875, -1.04364013671875, -0.9837188720703125, -0.923797607421875, -0.8638763427734375, -0.803955078125, -0.7440338134765625, -0.684112548828125, -0.6241912841796875, -0.56427001953125, -0.5043487548828125, -0.444427490234375, -0.3845062255859375, -0.3245849609375, -0.2646636962890625, -0.204742431640625, -0.1448211669921875, -0.08489990234375, -0.0249786376953125, 0.034942626953125, 0.0948638916015625, 0.15478515625, 0.2147064208984375, 0.274627685546875, 0.3345489501953125, 0.39447021484375, 0.4543914794921875, 0.514312744140625, 0.5742340087890625, 0.6341552734375, 0.6940765380859375, 0.753997802734375, 0.8139190673828125, 0.87384033203125, 0.9337615966796875, 0.993682861328125, 1.0536041259765625, 1.113525390625, 1.1734466552734375, 1.233367919921875, 1.2932891845703125, 1.35321044921875, 1.4131317138671875, 1.473052978515625, 1.5329742431640625, 1.5928955078125, 1.6528167724609375, 1.712738037109375, 1.7726593017578125, 1.83258056640625, 1.8925018310546875, 1.952423095703125, 2.0123443603515625, 2.072265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 6.0, 9.0, 12.0, 24.0, 35.0, 65.0, 87.0, 130.0, 206.0, 282.0, 498.0, 839.0, 1763.0, 4974.0, 19396.0, 103032.0, 592129.0, 268880.0, 41351.0, 9148.0, 2786.0, 1196.0, 613.0, 394.0, 245.0, 178.0, 86.0, 57.0, 47.0, 35.0, 19.0, 15.0, 7.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-14.0546875, -13.709716796875, -13.36474609375, -13.019775390625, -12.6748046875, -12.329833984375, -11.98486328125, -11.639892578125, -11.294921875, -10.949951171875, -10.60498046875, -10.260009765625, -9.9150390625, -9.570068359375, -9.22509765625, -8.880126953125, -8.53515625, -8.190185546875, -7.84521484375, -7.500244140625, -7.1552734375, -6.810302734375, -6.46533203125, -6.120361328125, -5.775390625, -5.430419921875, -5.08544921875, -4.740478515625, -4.3955078125, -4.050537109375, -3.70556640625, -3.360595703125, -3.015625, -2.670654296875, -2.32568359375, -1.980712890625, -1.6357421875, -1.290771484375, -0.94580078125, -0.600830078125, -0.255859375, 0.089111328125, 0.43408203125, 0.779052734375, 1.1240234375, 1.468994140625, 1.81396484375, 2.158935546875, 2.50390625, 2.848876953125, 3.19384765625, 3.538818359375, 3.8837890625, 4.228759765625, 4.57373046875, 4.918701171875, 5.263671875, 5.608642578125, 5.95361328125, 6.298583984375, 6.6435546875, 6.988525390625, 7.33349609375, 7.678466796875, 8.0234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 10.0, 8.0, 13.0, 21.0, 18.0, 23.0, 17.0, 15.0, 27.0, 26.0, 32.0, 26.0, 31.0, 46.0, 36.0, 38.0, 33.0, 47.0, 41.0, 35.0, 43.0, 38.0, 43.0, 31.0, 37.0, 36.0, 27.0, 28.0, 32.0, 31.0, 20.0, 15.0, 13.0, 12.0, 14.0, 5.0, 8.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.4375, -9.1502685546875, -8.863037109375, -8.5758056640625, -8.28857421875, -8.0013427734375, -7.714111328125, -7.4268798828125, -7.1396484375, -6.8524169921875, -6.565185546875, -6.2779541015625, -5.99072265625, -5.7034912109375, -5.416259765625, -5.1290283203125, -4.841796875, -4.5545654296875, -4.267333984375, -3.9801025390625, -3.69287109375, -3.4056396484375, -3.118408203125, -2.8311767578125, -2.5439453125, -2.2567138671875, -1.969482421875, -1.6822509765625, -1.39501953125, -1.1077880859375, -0.820556640625, -0.5333251953125, -0.24609375, 0.0411376953125, 0.328369140625, 0.6156005859375, 0.90283203125, 1.1900634765625, 1.477294921875, 1.7645263671875, 2.0517578125, 2.3389892578125, 2.626220703125, 2.9134521484375, 3.20068359375, 3.4879150390625, 3.775146484375, 4.0623779296875, 4.349609375, 4.6368408203125, 4.924072265625, 5.2113037109375, 5.49853515625, 5.7857666015625, 6.072998046875, 6.3602294921875, 6.6474609375, 6.9346923828125, 7.221923828125, 7.5091552734375, 7.79638671875, 8.0836181640625, 8.370849609375, 8.6580810546875, 8.9453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 5.0, 13.0, 19.0, 15.0, 25.0, 45.0, 64.0, 80.0, 127.0, 179.0, 300.0, 590.0, 1067.0, 2487.0, 6500.0, 22698.0, 104008.0, 459954.0, 351202.0, 73224.0, 16642.0, 5064.0, 2019.0, 913.0, 505.0, 280.0, 172.0, 110.0, 85.0, 52.0, 31.0, 18.0, 11.0, 13.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.0703125, -4.92498779296875, -4.7796630859375, -4.63433837890625, -4.489013671875, -4.34368896484375, -4.1983642578125, -4.05303955078125, -3.90771484375, -3.76239013671875, -3.6170654296875, -3.47174072265625, -3.326416015625, -3.18109130859375, -3.0357666015625, -2.89044189453125, -2.7451171875, -2.59979248046875, -2.4544677734375, -2.30914306640625, -2.163818359375, -2.01849365234375, -1.8731689453125, -1.72784423828125, -1.58251953125, -1.43719482421875, -1.2918701171875, -1.14654541015625, -1.001220703125, -0.85589599609375, -0.7105712890625, -0.56524658203125, -0.419921875, -0.27459716796875, -0.1292724609375, 0.01605224609375, 0.161376953125, 0.30670166015625, 0.4520263671875, 0.59735107421875, 0.74267578125, 0.88800048828125, 1.0333251953125, 1.17864990234375, 1.323974609375, 1.46929931640625, 1.6146240234375, 1.75994873046875, 1.9052734375, 2.05059814453125, 2.1959228515625, 2.34124755859375, 2.486572265625, 2.63189697265625, 2.7772216796875, 2.92254638671875, 3.06787109375, 3.21319580078125, 3.3585205078125, 3.50384521484375, 3.649169921875, 3.79449462890625, 3.9398193359375, 4.08514404296875, 4.23046875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 7.0, 8.0, 14.0, 25.0, 29.0, 39.0, 55.0, 67.0, 87.0, 87.0, 91.0, 100.0, 90.0, 69.0, 47.0, 41.0, 29.0, 24.0, 20.0, 16.0, 11.0, 5.0, 7.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012235641479492188, -0.001190081238746643, -0.0011565983295440674, -0.0011231154203414917, -0.001089632511138916, -0.0010561496019363403, -0.0010226666927337646, -0.000989183783531189, -0.0009557008743286133, -0.0009222179651260376, -0.0008887350559234619, -0.0008552521467208862, -0.0008217692375183105, -0.0007882863283157349, -0.0007548034191131592, -0.0007213205099105835, -0.0006878376007080078, -0.0006543546915054321, -0.0006208717823028564, -0.0005873888731002808, -0.0005539059638977051, -0.0005204230546951294, -0.0004869401454925537, -0.00045345723628997803, -0.00041997432708740234, -0.00038649141788482666, -0.000353008508682251, -0.0003195255994796753, -0.0002860426902770996, -0.0002525597810745239, -0.00021907687187194824, -0.00018559396266937256, -0.00015211105346679688, -0.00011862814426422119, -8.514523506164551e-05, -5.1662325859069824e-05, -1.817941665649414e-05, 1.5303492546081543e-05, 4.8786401748657227e-05, 8.226931095123291e-05, 0.0001157522201538086, 0.00014923512935638428, 0.00018271803855895996, 0.00021620094776153564, 0.00024968385696411133, 0.000283166766166687, 0.0003166496753692627, 0.0003501325845718384, 0.00038361549377441406, 0.00041709840297698975, 0.00045058131217956543, 0.0004840642213821411, 0.0005175471305847168, 0.0005510300397872925, 0.0005845129489898682, 0.0006179958581924438, 0.0006514787673950195, 0.0006849616765975952, 0.0007184445858001709, 0.0007519274950027466, 0.0007854104042053223, 0.000818893313407898, 0.0008523762226104736, 0.0008858591318130493, 0.000919342041015625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 11.0, 16.0, 10.0, 32.0, 30.0, 64.0, 116.0, 252.0, 501.0, 1130.0, 3080.0, 11891.0, 84559.0, 564384.0, 331752.0, 39942.0, 7086.0, 2025.0, 835.0, 388.0, 196.0, 98.0, 52.0, 35.0, 21.0, 16.0, 13.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2890625, -4.092529296875, -3.89599609375, -3.699462890625, -3.5029296875, -3.306396484375, -3.10986328125, -2.913330078125, -2.716796875, -2.520263671875, -2.32373046875, -2.127197265625, -1.9306640625, -1.734130859375, -1.53759765625, -1.341064453125, -1.14453125, -0.947998046875, -0.75146484375, -0.554931640625, -0.3583984375, -0.161865234375, 0.03466796875, 0.231201171875, 0.427734375, 0.624267578125, 0.82080078125, 1.017333984375, 1.2138671875, 1.410400390625, 1.60693359375, 1.803466796875, 2.0, 2.196533203125, 2.39306640625, 2.589599609375, 2.7861328125, 2.982666015625, 3.17919921875, 3.375732421875, 3.572265625, 3.768798828125, 3.96533203125, 4.161865234375, 4.3583984375, 4.554931640625, 4.75146484375, 4.947998046875, 5.14453125, 5.341064453125, 5.53759765625, 5.734130859375, 5.9306640625, 6.127197265625, 6.32373046875, 6.520263671875, 6.716796875, 6.913330078125, 7.10986328125, 7.306396484375, 7.5029296875, 7.699462890625, 7.89599609375, 8.092529296875, 8.2890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 15.0, 12.0, 17.0, 28.0, 48.0, 51.0, 50.0, 73.0, 67.0, 73.0, 87.0, 70.0, 71.0, 58.0, 52.0, 36.0, 41.0, 31.0, 26.0, 14.0, 19.0, 13.0, 10.0, 7.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.17578125, -5.02740478515625, -4.8790283203125, -4.73065185546875, -4.582275390625, -4.43389892578125, -4.2855224609375, -4.13714599609375, -3.98876953125, -3.84039306640625, -3.6920166015625, -3.54364013671875, -3.395263671875, -3.24688720703125, -3.0985107421875, -2.95013427734375, -2.8017578125, -2.65338134765625, -2.5050048828125, -2.35662841796875, -2.208251953125, -2.05987548828125, -1.9114990234375, -1.76312255859375, -1.61474609375, -1.46636962890625, -1.3179931640625, -1.16961669921875, -1.021240234375, -0.87286376953125, -0.7244873046875, -0.57611083984375, -0.427734375, -0.27935791015625, -0.1309814453125, 0.01739501953125, 0.165771484375, 0.31414794921875, 0.4625244140625, 0.61090087890625, 0.75927734375, 0.90765380859375, 1.0560302734375, 1.20440673828125, 1.352783203125, 1.50115966796875, 1.6495361328125, 1.79791259765625, 1.9462890625, 2.09466552734375, 2.2430419921875, 2.39141845703125, 2.539794921875, 2.68817138671875, 2.8365478515625, 2.98492431640625, 3.13330078125, 3.28167724609375, 3.4300537109375, 3.57843017578125, 3.726806640625, 3.87518310546875, 4.0235595703125, 4.17193603515625, 4.3203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 8.0, 42.0, 155.0, 315.0, 311.0, 129.0, 36.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.0882263183594, -282.3692321777344, -275.6502380371094, -268.9312744140625, -262.2122802734375, -255.4932861328125, -248.7742919921875, -242.05531311035156, -235.33633422851562, -228.61734008789062, -221.8983612060547, -215.1793670654297, -208.46038818359375, -201.74139404296875, -195.02239990234375, -188.3034210205078, -181.5844268798828, -174.8654327392578, -168.14645385742188, -161.42745971679688, -154.70848083496094, -147.98948669433594, -141.2705078125, -134.551513671875, -127.83252716064453, -121.11354064941406, -114.3945541381836, -107.67556762695312, -100.95657348632812, -94.23759460449219, -87.51860046386719, -80.79961395263672, -74.08064270019531, -67.36165618896484, -60.642669677734375, -53.92367935180664, -47.20469284057617, -40.4857063293457, -33.76671600341797, -27.0477294921875, -20.32874298095703, -13.609755516052246, -6.890768051147461, -0.17177963256835938, 6.547206878662109, 13.266193389892578, 19.985183715820312, 26.70417022705078, 33.42315673828125, 40.14214324951172, 46.86112976074219, 53.58012008666992, 60.29910659790039, 67.01809692382812, 73.7370834350586, 80.45606994628906, 87.17505645751953, 93.89404296875, 100.61302947998047, 107.33201599121094, 114.05101013183594, 120.76998901367188, 127.48898315429688, 134.20797729492188, 140.9269561767578]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 6.0, 9.0, 8.0, 15.0, 20.0, 19.0, 30.0, 31.0, 32.0, 29.0, 38.0, 36.0, 48.0, 45.0, 62.0, 38.0, 64.0, 52.0, 57.0, 30.0, 45.0, 33.0, 30.0, 42.0, 23.0, 19.0, 30.0, 16.0, 13.0, 11.0, 13.0, 10.0, 9.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-52.65270233154297, -51.0115966796875, -49.37049102783203, -47.7293815612793, -46.08827590942383, -44.44717025756836, -42.80606460571289, -41.164955139160156, -39.52384948730469, -37.88274383544922, -36.24163818359375, -34.600528717041016, -32.95942306518555, -31.318317413330078, -29.67721176147461, -28.036104202270508, -26.39499855041504, -24.75389289855957, -23.11278533935547, -21.4716796875, -19.8305721282959, -18.18946647644043, -16.548358917236328, -14.90725326538086, -13.266146659851074, -11.625040054321289, -9.983933448791504, -8.342826843261719, -6.701720714569092, -5.060614585876465, -3.4195079803466797, -1.7784013748168945, -0.13729476928710938, 1.5038117170333862, 3.144918203353882, 4.786024570465088, 6.427131175994873, 8.0682373046875, 9.709343910217285, 11.35045051574707, 12.991557121276855, 14.63266372680664, 16.27376937866211, 17.91487693786621, 19.55598258972168, 21.19709014892578, 22.83819580078125, 24.47930145263672, 26.12040901184082, 27.76151466369629, 29.40262222290039, 31.04372787475586, 32.68483352661133, 34.32594299316406, 35.96704864501953, 37.608154296875, 39.24925994873047, 40.89036560058594, 42.531471252441406, 44.17258071899414, 45.81368637084961, 47.45479202270508, 49.09589767456055, 50.73700714111328, 52.37811279296875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 12.0, 18.0, 35.0, 60.0, 89.0, 169.0, 282.0, 554.0, 1160.0, 2954.0, 9071.0, 44706.0, 4046348.0, 71240.0, 11271.0, 3506.0, 1382.0, 623.0, 343.0, 191.0, 95.0, 54.0, 36.0, 23.0, 12.0, 11.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.3203125, -14.8502197265625, -14.380126953125, -13.9100341796875, -13.43994140625, -12.9698486328125, -12.499755859375, -12.0296630859375, -11.5595703125, -11.0894775390625, -10.619384765625, -10.1492919921875, -9.67919921875, -9.2091064453125, -8.739013671875, -8.2689208984375, -7.798828125, -7.3287353515625, -6.858642578125, -6.3885498046875, -5.91845703125, -5.4483642578125, -4.978271484375, -4.5081787109375, -4.0380859375, -3.5679931640625, -3.097900390625, -2.6278076171875, -2.15771484375, -1.6876220703125, -1.217529296875, -0.7474365234375, -0.27734375, 0.1927490234375, 0.662841796875, 1.1329345703125, 1.60302734375, 2.0731201171875, 2.543212890625, 3.0133056640625, 3.4833984375, 3.9534912109375, 4.423583984375, 4.8936767578125, 5.36376953125, 5.8338623046875, 6.303955078125, 6.7740478515625, 7.244140625, 7.7142333984375, 8.184326171875, 8.6544189453125, 9.12451171875, 9.5946044921875, 10.064697265625, 10.5347900390625, 11.0048828125, 11.4749755859375, 11.945068359375, 12.4151611328125, 12.88525390625, 13.3553466796875, 13.825439453125, 14.2955322265625, 14.765625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 4.0, 1.0, 6.0, 5.0, 5.0, 4.0, 5.0, 11.0, 10.0, 13.0, 21.0, 16.0, 14.0, 23.0, 19.0, 36.0, 45.0, 36.0, 42.0, 44.0, 49.0, 45.0, 43.0, 51.0, 39.0, 54.0, 45.0, 38.0, 24.0, 33.0, 30.0, 13.0, 35.0, 18.0, 25.0, 19.0, 16.0, 11.0, 14.0, 5.0, 10.0, 10.0, 4.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7685546875, -1.7097625732421875, -1.650970458984375, -1.5921783447265625, -1.53338623046875, -1.4745941162109375, -1.415802001953125, -1.3570098876953125, -1.2982177734375, -1.2394256591796875, -1.180633544921875, -1.1218414306640625, -1.06304931640625, -1.0042572021484375, -0.945465087890625, -0.8866729736328125, -0.827880859375, -0.7690887451171875, -0.710296630859375, -0.6515045166015625, -0.59271240234375, -0.5339202880859375, -0.475128173828125, -0.4163360595703125, -0.3575439453125, -0.2987518310546875, -0.239959716796875, -0.1811676025390625, -0.12237548828125, -0.0635833740234375, -0.004791259765625, 0.0540008544921875, 0.11279296875, 0.1715850830078125, 0.230377197265625, 0.2891693115234375, 0.34796142578125, 0.4067535400390625, 0.465545654296875, 0.5243377685546875, 0.5831298828125, 0.6419219970703125, 0.700714111328125, 0.7595062255859375, 0.81829833984375, 0.8770904541015625, 0.935882568359375, 0.9946746826171875, 1.053466796875, 1.1122589111328125, 1.171051025390625, 1.2298431396484375, 1.28863525390625, 1.3474273681640625, 1.406219482421875, 1.4650115966796875, 1.5238037109375, 1.5825958251953125, 1.641387939453125, 1.7001800537109375, 1.75897216796875, 1.8177642822265625, 1.876556396484375, 1.9353485107421875, 1.994140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 9.0, 12.0, 36.0, 34.0, 54.0, 72.0, 105.0, 141.0, 188.0, 270.0, 394.0, 586.0, 850.0, 1294.0, 1990.0, 2973.0, 5091.0, 8822.0, 16501.0, 35646.0, 105552.0, 3574037.0, 322511.0, 61334.0, 24773.0, 12426.0, 6755.0, 4228.0, 2555.0, 1590.0, 1058.0, 752.0, 482.0, 337.0, 217.0, 154.0, 123.0, 86.0, 90.0, 34.0, 27.0, 22.0, 20.0, 15.0, 7.0, 5.0, 9.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.22100830078125, -5.0513916015625, -4.88177490234375, -4.712158203125, -4.54254150390625, -4.3729248046875, -4.20330810546875, -4.03369140625, -3.86407470703125, -3.6944580078125, -3.52484130859375, -3.355224609375, -3.18560791015625, -3.0159912109375, -2.84637451171875, -2.6767578125, -2.50714111328125, -2.3375244140625, -2.16790771484375, -1.998291015625, -1.82867431640625, -1.6590576171875, -1.48944091796875, -1.31982421875, -1.15020751953125, -0.9805908203125, -0.81097412109375, -0.641357421875, -0.47174072265625, -0.3021240234375, -0.13250732421875, 0.037109375, 0.20672607421875, 0.3763427734375, 0.54595947265625, 0.715576171875, 0.88519287109375, 1.0548095703125, 1.22442626953125, 1.39404296875, 1.56365966796875, 1.7332763671875, 1.90289306640625, 2.072509765625, 2.24212646484375, 2.4117431640625, 2.58135986328125, 2.7509765625, 2.92059326171875, 3.0902099609375, 3.25982666015625, 3.429443359375, 3.59906005859375, 3.7686767578125, 3.93829345703125, 4.10791015625, 4.27752685546875, 4.4471435546875, 4.61676025390625, 4.786376953125, 4.95599365234375, 5.1256103515625, 5.29522705078125, 5.46484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 1.0, 7.0, 2.0, 9.0, 14.0, 8.0, 16.0, 14.0, 26.0, 53.0, 74.0, 173.0, 2807.0, 534.0, 128.0, 53.0, 44.0, 20.0, 24.0, 13.0, 13.0, 7.0, 10.0, 5.0, 1.0, 3.0, 4.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9833984375, -1.9169464111328125, -1.850494384765625, -1.7840423583984375, -1.71759033203125, -1.6511383056640625, -1.584686279296875, -1.5182342529296875, -1.4517822265625, -1.3853302001953125, -1.318878173828125, -1.2524261474609375, -1.18597412109375, -1.1195220947265625, -1.053070068359375, -0.9866180419921875, -0.920166015625, -0.8537139892578125, -0.787261962890625, -0.7208099365234375, -0.65435791015625, -0.5879058837890625, -0.521453857421875, -0.4550018310546875, -0.3885498046875, -0.3220977783203125, -0.255645751953125, -0.1891937255859375, -0.12274169921875, -0.0562896728515625, 0.010162353515625, 0.0766143798828125, 0.14306640625, 0.2095184326171875, 0.275970458984375, 0.3424224853515625, 0.40887451171875, 0.4753265380859375, 0.541778564453125, 0.6082305908203125, 0.6746826171875, 0.7411346435546875, 0.807586669921875, 0.8740386962890625, 0.94049072265625, 1.0069427490234375, 1.073394775390625, 1.1398468017578125, 1.206298828125, 1.2727508544921875, 1.339202880859375, 1.4056549072265625, 1.47210693359375, 1.5385589599609375, 1.605010986328125, 1.6714630126953125, 1.7379150390625, 1.8043670654296875, 1.870819091796875, 1.9372711181640625, 2.00372314453125, 2.0701751708984375, 2.136627197265625, 2.2030792236328125, 2.26953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 4.0, 18.0, 40.0, 73.0, 108.0, 171.0, 177.0, 146.0, 116.0, 77.0, 36.0, 12.0, 12.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.834344863891602, -15.363054275512695, -14.891762733459473, -14.42047119140625, -13.949180603027344, -13.477890014648438, -13.006598472595215, -12.535306930541992, -12.064016342163086, -11.59272575378418, -11.121434211730957, -10.650142669677734, -10.178852081298828, -9.707561492919922, -9.2362699508667, -8.764978408813477, -8.29368782043457, -7.822396755218506, -7.351105690002441, -6.879814624786377, -6.4085235595703125, -5.937232494354248, -5.465941429138184, -4.994650363922119, -4.523359298706055, -4.05206823348999, -3.580777168273926, -3.1094861030578613, -2.638195037841797, -2.1669039726257324, -1.695612907409668, -1.2243218421936035, -0.7530307769775391, -0.2817397117614746, 0.18955135345458984, 0.6608424186706543, 1.1321334838867188, 1.6034245491027832, 2.0747156143188477, 2.546006679534912, 3.0172977447509766, 3.488588809967041, 3.9598798751831055, 4.43117094039917, 4.902462005615234, 5.373753070831299, 5.845044136047363, 6.316335201263428, 6.787626266479492, 7.258917331695557, 7.730208396911621, 8.201499938964844, 8.67279052734375, 9.144081115722656, 9.615372657775879, 10.086664199829102, 10.557954788208008, 11.029245376586914, 11.500536918640137, 11.97182846069336, 12.443119049072266, 12.914409637451172, 13.385701179504395, 13.856992721557617, 14.328283309936523]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 12.0, 14.0, 27.0, 22.0, 31.0, 30.0, 40.0, 37.0, 45.0, 38.0, 62.0, 68.0, 64.0, 66.0, 44.0, 53.0, 46.0, 42.0, 38.0, 31.0, 38.0, 29.0, 29.0, 17.0, 19.0, 9.0, 13.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.51754093170166, -7.320598602294922, -7.123655796051025, -6.926713466644287, -6.729771137237549, -6.532828330993652, -6.335886001586914, -6.138943672180176, -5.942000865936279, -5.745058536529541, -5.5481157302856445, -5.351173400878906, -5.154231071472168, -4.9572882652282715, -4.760345935821533, -4.563403129577637, -4.366460800170898, -4.16951847076416, -3.9725759029388428, -3.7756333351135254, -3.578690767288208, -3.3817481994628906, -3.1848058700561523, -2.987863302230835, -2.790921211242676, -2.5939786434173584, -2.39703631401062, -2.2000937461853027, -2.0031511783599854, -1.8062087297439575, -1.6092662811279297, -1.4123237133026123, -1.215381145477295, -1.018438696861267, -0.8214961290359497, -0.6245536804199219, -0.42761117219924927, -0.23066866397857666, -0.03372621536254883, 0.16321635246276855, 0.3601588010787964, 0.557101309299469, 0.7540438175201416, 0.9509862661361694, 1.1479287147521973, 1.3448712825775146, 1.5418137311935425, 1.7387562990188599, 1.9356987476348877, 2.132641315460205, 2.3295836448669434, 2.5265262126922607, 2.723468780517578, 2.9204111099243164, 3.117353677749634, 3.314296245574951, 3.5112385749816895, 3.708181142807007, 3.905123472213745, 4.1020660400390625, 4.299008369445801, 4.495951175689697, 4.6928935050964355, 4.889836311340332, 5.08677864074707]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 7.0, 6.0, 10.0, 21.0, 30.0, 44.0, 60.0, 91.0, 136.0, 216.0, 314.0, 553.0, 890.0, 1540.0, 2766.0, 4839.0, 9077.0, 17209.0, 33008.0, 63086.0, 116269.0, 192256.0, 230163.0, 168768.0, 97321.0, 51374.0, 27133.0, 14041.0, 7304.0, 4129.0, 2327.0, 1414.0, 766.0, 465.0, 280.0, 210.0, 146.0, 76.0, 68.0, 49.0, 32.0, 17.0, 11.0, 17.0, 6.0, 7.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.3828125, -3.2813720703125, -3.179931640625, -3.0784912109375, -2.97705078125, -2.8756103515625, -2.774169921875, -2.6727294921875, -2.5712890625, -2.4698486328125, -2.368408203125, -2.2669677734375, -2.16552734375, -2.0640869140625, -1.962646484375, -1.8612060546875, -1.759765625, -1.6583251953125, -1.556884765625, -1.4554443359375, -1.35400390625, -1.2525634765625, -1.151123046875, -1.0496826171875, -0.9482421875, -0.8468017578125, -0.745361328125, -0.6439208984375, -0.54248046875, -0.4410400390625, -0.339599609375, -0.2381591796875, -0.13671875, -0.0352783203125, 0.066162109375, 0.1676025390625, 0.26904296875, 0.3704833984375, 0.471923828125, 0.5733642578125, 0.6748046875, 0.7762451171875, 0.877685546875, 0.9791259765625, 1.08056640625, 1.1820068359375, 1.283447265625, 1.3848876953125, 1.486328125, 1.5877685546875, 1.689208984375, 1.7906494140625, 1.89208984375, 1.9935302734375, 2.094970703125, 2.1964111328125, 2.2978515625, 2.3992919921875, 2.500732421875, 2.6021728515625, 2.70361328125, 2.8050537109375, 2.906494140625, 3.0079345703125, 3.109375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 6.0, 4.0, 9.0, 6.0, 10.0, 15.0, 11.0, 11.0, 21.0, 25.0, 31.0, 24.0, 28.0, 47.0, 46.0, 40.0, 41.0, 49.0, 53.0, 45.0, 40.0, 40.0, 51.0, 41.0, 43.0, 34.0, 27.0, 34.0, 27.0, 16.0, 29.0, 23.0, 16.0, 4.0, 9.0, 10.0, 8.0, 3.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.140625, -2.075103759765625, -2.00958251953125, -1.944061279296875, -1.8785400390625, -1.813018798828125, -1.74749755859375, -1.681976318359375, -1.616455078125, -1.550933837890625, -1.48541259765625, -1.419891357421875, -1.3543701171875, -1.288848876953125, -1.22332763671875, -1.157806396484375, -1.09228515625, -1.026763916015625, -0.96124267578125, -0.895721435546875, -0.8302001953125, -0.764678955078125, -0.69915771484375, -0.633636474609375, -0.568115234375, -0.502593994140625, -0.43707275390625, -0.371551513671875, -0.3060302734375, -0.240509033203125, -0.17498779296875, -0.109466552734375, -0.0439453125, 0.021575927734375, 0.08709716796875, 0.152618408203125, 0.2181396484375, 0.283660888671875, 0.34918212890625, 0.414703369140625, 0.480224609375, 0.545745849609375, 0.61126708984375, 0.676788330078125, 0.7423095703125, 0.807830810546875, 0.87335205078125, 0.938873291015625, 1.00439453125, 1.069915771484375, 1.13543701171875, 1.200958251953125, 1.2664794921875, 1.332000732421875, 1.39752197265625, 1.463043212890625, 1.528564453125, 1.594085693359375, 1.65960693359375, 1.725128173828125, 1.7906494140625, 1.856170654296875, 1.92169189453125, 1.987213134765625, 2.052734375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 8.0, 10.0, 16.0, 27.0, 26.0, 49.0, 62.0, 79.0, 127.0, 212.0, 360.0, 564.0, 1021.0, 2253.0, 7102.0, 38934.0, 381259.0, 542659.0, 58789.0, 9230.0, 2714.0, 1174.0, 669.0, 406.0, 257.0, 179.0, 111.0, 68.0, 49.0, 36.0, 30.0, 15.0, 12.0, 8.0, 10.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5390625, -9.2322998046875, -8.925537109375, -8.6187744140625, -8.31201171875, -8.0052490234375, -7.698486328125, -7.3917236328125, -7.0849609375, -6.7781982421875, -6.471435546875, -6.1646728515625, -5.85791015625, -5.5511474609375, -5.244384765625, -4.9376220703125, -4.630859375, -4.3240966796875, -4.017333984375, -3.7105712890625, -3.40380859375, -3.0970458984375, -2.790283203125, -2.4835205078125, -2.1767578125, -1.8699951171875, -1.563232421875, -1.2564697265625, -0.94970703125, -0.6429443359375, -0.336181640625, -0.0294189453125, 0.27734375, 0.5841064453125, 0.890869140625, 1.1976318359375, 1.50439453125, 1.8111572265625, 2.117919921875, 2.4246826171875, 2.7314453125, 3.0382080078125, 3.344970703125, 3.6517333984375, 3.95849609375, 4.2652587890625, 4.572021484375, 4.8787841796875, 5.185546875, 5.4923095703125, 5.799072265625, 6.1058349609375, 6.41259765625, 6.7193603515625, 7.026123046875, 7.3328857421875, 7.6396484375, 7.9464111328125, 8.253173828125, 8.5599365234375, 8.86669921875, 9.1734619140625, 9.480224609375, 9.7869873046875, 10.09375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 7.0, 2.0, 5.0, 9.0, 7.0, 10.0, 5.0, 17.0, 14.0, 20.0, 17.0, 23.0, 26.0, 25.0, 25.0, 34.0, 35.0, 34.0, 47.0, 36.0, 44.0, 48.0, 42.0, 38.0, 45.0, 31.0, 41.0, 37.0, 41.0, 27.0, 31.0, 26.0, 23.0, 20.0, 16.0, 17.0, 14.0, 8.0, 17.0, 11.0, 10.0, 5.0, 3.0, 4.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.0662841796875, -7.796630859375, -7.5269775390625, -7.25732421875, -6.9876708984375, -6.718017578125, -6.4483642578125, -6.1787109375, -5.9090576171875, -5.639404296875, -5.3697509765625, -5.10009765625, -4.8304443359375, -4.560791015625, -4.2911376953125, -4.021484375, -3.7518310546875, -3.482177734375, -3.2125244140625, -2.94287109375, -2.6732177734375, -2.403564453125, -2.1339111328125, -1.8642578125, -1.5946044921875, -1.324951171875, -1.0552978515625, -0.78564453125, -0.5159912109375, -0.246337890625, 0.0233154296875, 0.29296875, 0.5626220703125, 0.832275390625, 1.1019287109375, 1.37158203125, 1.6412353515625, 1.910888671875, 2.1805419921875, 2.4501953125, 2.7198486328125, 2.989501953125, 3.2591552734375, 3.52880859375, 3.7984619140625, 4.068115234375, 4.3377685546875, 4.607421875, 4.8770751953125, 5.146728515625, 5.4163818359375, 5.68603515625, 5.9556884765625, 6.225341796875, 6.4949951171875, 6.7646484375, 7.0343017578125, 7.303955078125, 7.5736083984375, 7.84326171875, 8.1129150390625, 8.382568359375, 8.6522216796875, 8.921875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 11.0, 13.0, 20.0, 29.0, 32.0, 56.0, 87.0, 152.0, 303.0, 621.0, 1642.0, 6363.0, 49278.0, 605343.0, 351279.0, 26645.0, 4263.0, 1214.0, 520.0, 259.0, 145.0, 87.0, 52.0, 29.0, 24.0, 24.0, 6.0, 9.0, 4.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-6.75, -6.56182861328125, -6.3736572265625, -6.18548583984375, -5.997314453125, -5.80914306640625, -5.6209716796875, -5.43280029296875, -5.24462890625, -5.05645751953125, -4.8682861328125, -4.68011474609375, -4.491943359375, -4.30377197265625, -4.1156005859375, -3.92742919921875, -3.7392578125, -3.55108642578125, -3.3629150390625, -3.17474365234375, -2.986572265625, -2.79840087890625, -2.6102294921875, -2.42205810546875, -2.23388671875, -2.04571533203125, -1.8575439453125, -1.66937255859375, -1.481201171875, -1.29302978515625, -1.1048583984375, -0.91668701171875, -0.728515625, -0.54034423828125, -0.3521728515625, -0.16400146484375, 0.024169921875, 0.21234130859375, 0.4005126953125, 0.58868408203125, 0.77685546875, 0.96502685546875, 1.1531982421875, 1.34136962890625, 1.529541015625, 1.71771240234375, 1.9058837890625, 2.09405517578125, 2.2822265625, 2.47039794921875, 2.6585693359375, 2.84674072265625, 3.034912109375, 3.22308349609375, 3.4112548828125, 3.59942626953125, 3.78759765625, 3.97576904296875, 4.1639404296875, 4.35211181640625, 4.540283203125, 4.72845458984375, 4.9166259765625, 5.10479736328125, 5.29296875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 6.0, 16.0, 15.0, 21.0, 24.0, 25.0, 39.0, 38.0, 62.0, 80.0, 75.0, 102.0, 102.0, 84.0, 70.0, 40.0, 46.0, 35.0, 26.0, 19.0, 21.0, 8.0, 8.0, 7.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006594657897949219, -0.0006328299641609192, -0.0006061941385269165, -0.0005795583128929138, -0.0005529224872589111, -0.0005262866616249084, -0.0004996508359909058, -0.0004730150103569031, -0.0004463791847229004, -0.0004197433590888977, -0.000393107533454895, -0.00036647170782089233, -0.00033983588218688965, -0.00031320005655288696, -0.0002865642309188843, -0.0002599284052848816, -0.0002332925796508789, -0.00020665675401687622, -0.00018002092838287354, -0.00015338510274887085, -0.00012674927711486816, -0.00010011345148086548, -7.347762584686279e-05, -4.684180021286011e-05, -2.0205974578857422e-05, 6.429851055145264e-06, 3.306567668914795e-05, 5.9701502323150635e-05, 8.633732795715332e-05, 0.000112973153591156, 0.0001396089792251587, 0.00016624480485916138, 0.00019288063049316406, 0.00021951645612716675, 0.00024615228176116943, 0.0002727881073951721, 0.0002994239330291748, 0.0003260597586631775, 0.0003526955842971802, 0.00037933140993118286, 0.00040596723556518555, 0.00043260306119918823, 0.0004592388868331909, 0.0004858747124671936, 0.0005125105381011963, 0.000539146363735199, 0.0005657821893692017, 0.0005924180150032043, 0.000619053840637207, 0.0006456896662712097, 0.0006723254919052124, 0.0006989613175392151, 0.0007255971431732178, 0.0007522329688072205, 0.0007788687944412231, 0.0008055046200752258, 0.0008321404457092285, 0.0008587762713432312, 0.0008854120969772339, 0.0009120479226112366, 0.0009386837482452393, 0.0009653195738792419, 0.0009919553995132446, 0.0010185912251472473, 0.00104522705078125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 15.0, 12.0, 16.0, 32.0, 36.0, 81.0, 174.0, 397.0, 1446.0, 8628.0, 355362.0, 665902.0, 13737.0, 1815.0, 490.0, 206.0, 77.0, 40.0, 28.0, 26.0, 12.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.609375, -11.24755859375, -10.8857421875, -10.52392578125, -10.162109375, -9.80029296875, -9.4384765625, -9.07666015625, -8.71484375, -8.35302734375, -7.9912109375, -7.62939453125, -7.267578125, -6.90576171875, -6.5439453125, -6.18212890625, -5.8203125, -5.45849609375, -5.0966796875, -4.73486328125, -4.373046875, -4.01123046875, -3.6494140625, -3.28759765625, -2.92578125, -2.56396484375, -2.2021484375, -1.84033203125, -1.478515625, -1.11669921875, -0.7548828125, -0.39306640625, -0.03125, 0.33056640625, 0.6923828125, 1.05419921875, 1.416015625, 1.77783203125, 2.1396484375, 2.50146484375, 2.86328125, 3.22509765625, 3.5869140625, 3.94873046875, 4.310546875, 4.67236328125, 5.0341796875, 5.39599609375, 5.7578125, 6.11962890625, 6.4814453125, 6.84326171875, 7.205078125, 7.56689453125, 7.9287109375, 8.29052734375, 8.65234375, 9.01416015625, 9.3759765625, 9.73779296875, 10.099609375, 10.46142578125, 10.8232421875, 11.18505859375, 11.546875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 0.0, 7.0, 16.0, 20.0, 13.0, 23.0, 28.0, 43.0, 40.0, 68.0, 77.0, 68.0, 80.0, 98.0, 90.0, 72.0, 66.0, 52.0, 34.0, 31.0, 18.0, 18.0, 14.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.99609375, -3.874481201171875, -3.75286865234375, -3.631256103515625, -3.5096435546875, -3.388031005859375, -3.26641845703125, -3.144805908203125, -3.023193359375, -2.901580810546875, -2.77996826171875, -2.658355712890625, -2.5367431640625, -2.415130615234375, -2.29351806640625, -2.171905517578125, -2.05029296875, -1.928680419921875, -1.80706787109375, -1.685455322265625, -1.5638427734375, -1.442230224609375, -1.32061767578125, -1.199005126953125, -1.077392578125, -0.955780029296875, -0.83416748046875, -0.712554931640625, -0.5909423828125, -0.469329833984375, -0.34771728515625, -0.226104736328125, -0.1044921875, 0.017120361328125, 0.13873291015625, 0.260345458984375, 0.3819580078125, 0.503570556640625, 0.62518310546875, 0.746795654296875, 0.868408203125, 0.990020751953125, 1.11163330078125, 1.233245849609375, 1.3548583984375, 1.476470947265625, 1.59808349609375, 1.719696044921875, 1.84130859375, 1.962921142578125, 2.08453369140625, 2.206146240234375, 2.3277587890625, 2.449371337890625, 2.57098388671875, 2.692596435546875, 2.814208984375, 2.935821533203125, 3.05743408203125, 3.179046630859375, 3.3006591796875, 3.422271728515625, 3.54388427734375, 3.665496826171875, 3.787109375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 12.0, 28.0, 69.0, 145.0, 214.0, 222.0, 169.0, 77.0, 35.0, 15.0, 8.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.45478820800781, -62.9491081237793, -59.44342803955078, -55.937744140625, -52.432064056396484, -48.92638397216797, -45.42070007324219, -41.91501998901367, -38.409339904785156, -34.90365982055664, -31.397977828979492, -27.892295837402344, -24.386615753173828, -20.880935668945312, -17.375253677368164, -13.869571685791016, -10.3638916015625, -6.858210563659668, -3.352529525756836, 0.1531515121459961, 3.658832550048828, 7.164512634277344, 10.670194625854492, 14.17587661743164, 17.681556701660156, 21.187236785888672, 24.69291877746582, 28.19860076904297, 31.704280853271484, 35.2099609375, 38.71564483642578, 42.2213249206543, 45.72700500488281, 49.23268508911133, 52.738365173339844, 56.244049072265625, 59.74972915649414, 63.255409240722656, 66.76109313964844, 70.26676940917969, 73.77245330810547, 77.27813720703125, 80.7838134765625, 84.28949737548828, 87.79518127441406, 91.30085754394531, 94.8065414428711, 98.31222534179688, 101.81790161132812, 105.3235855102539, 108.82926177978516, 112.33494567871094, 115.84062194824219, 119.34630584716797, 122.85198974609375, 126.357666015625, 129.86334228515625, 133.3690185546875, 136.8747100830078, 140.38038635253906, 143.8860626220703, 147.39175415039062, 150.89743041992188, 154.40310668945312, 157.90879821777344]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 10.0, 5.0, 11.0, 15.0, 12.0, 15.0, 25.0, 21.0, 20.0, 40.0, 28.0, 34.0, 41.0, 46.0, 38.0, 48.0, 50.0, 63.0, 62.0, 44.0, 47.0, 35.0, 44.0, 35.0, 28.0, 24.0, 24.0, 18.0, 22.0, 20.0, 8.0, 14.0, 12.0, 7.0, 5.0, 7.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.3899040222168, -45.90799331665039, -44.426082611083984, -42.94417190551758, -41.46226119995117, -39.980350494384766, -38.498435974121094, -37.01652526855469, -35.53461456298828, -34.052703857421875, -32.57079315185547, -31.088882446289062, -29.606971740722656, -28.12506103515625, -26.64314842224121, -25.161237716674805, -23.67932891845703, -22.197418212890625, -20.71550750732422, -19.233596801757812, -17.751686096191406, -16.269775390625, -14.787862777709961, -13.305952072143555, -11.824041366577148, -10.342130661010742, -8.860219955444336, -7.378308296203613, -5.896397590637207, -4.414486885070801, -2.932575225830078, -1.4506645202636719, 0.03124237060546875, 1.513153314590454, 2.9950642585754395, 4.476975440979004, 5.95888614654541, 7.440796852111816, 8.922708511352539, 10.404619216918945, 11.886529922485352, 13.368440628051758, 14.850351333618164, 16.332263946533203, 17.81417465209961, 19.296085357666016, 20.777996063232422, 22.259906768798828, 23.741817474365234, 25.22372817993164, 26.705638885498047, 28.187549591064453, 29.66946029663086, 31.151371002197266, 32.63328552246094, 34.115196228027344, 35.59710693359375, 37.079017639160156, 38.56092834472656, 40.04283905029297, 41.524749755859375, 43.00666046142578, 44.48857116699219, 45.970481872558594, 47.452392578125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 7.0, 12.0, 21.0, 39.0, 45.0, 84.0, 177.0, 287.0, 695.0, 1509.0, 4447.0, 19739.0, 4104429.0, 51553.0, 7146.0, 2301.0, 912.0, 425.0, 183.0, 113.0, 53.0, 39.0, 21.0, 20.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.984375, -16.412353515625, -15.84033203125, -15.268310546875, -14.6962890625, -14.124267578125, -13.55224609375, -12.980224609375, -12.408203125, -11.836181640625, -11.26416015625, -10.692138671875, -10.1201171875, -9.548095703125, -8.97607421875, -8.404052734375, -7.83203125, -7.260009765625, -6.68798828125, -6.115966796875, -5.5439453125, -4.971923828125, -4.39990234375, -3.827880859375, -3.255859375, -2.683837890625, -2.11181640625, -1.539794921875, -0.9677734375, -0.395751953125, 0.17626953125, 0.748291015625, 1.3203125, 1.892333984375, 2.46435546875, 3.036376953125, 3.6083984375, 4.180419921875, 4.75244140625, 5.324462890625, 5.896484375, 6.468505859375, 7.04052734375, 7.612548828125, 8.1845703125, 8.756591796875, 9.32861328125, 9.900634765625, 10.47265625, 11.044677734375, 11.61669921875, 12.188720703125, 12.7607421875, 13.332763671875, 13.90478515625, 14.476806640625, 15.048828125, 15.620849609375, 16.19287109375, 16.764892578125, 17.3369140625, 17.908935546875, 18.48095703125, 19.052978515625, 19.625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 8.0, 10.0, 10.0, 13.0, 14.0, 8.0, 7.0, 17.0, 22.0, 19.0, 39.0, 29.0, 38.0, 33.0, 34.0, 44.0, 32.0, 41.0, 44.0, 52.0, 42.0, 42.0, 44.0, 40.0, 35.0, 31.0, 29.0, 29.0, 26.0, 22.0, 29.0, 25.0, 19.0, 17.0, 16.0, 7.0, 11.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.091796875, -2.0294952392578125, -1.967193603515625, -1.9048919677734375, -1.84259033203125, -1.7802886962890625, -1.717987060546875, -1.6556854248046875, -1.5933837890625, -1.5310821533203125, -1.468780517578125, -1.4064788818359375, -1.34417724609375, -1.2818756103515625, -1.219573974609375, -1.1572723388671875, -1.094970703125, -1.0326690673828125, -0.970367431640625, -0.9080657958984375, -0.84576416015625, -0.7834625244140625, -0.721160888671875, -0.6588592529296875, -0.5965576171875, -0.5342559814453125, -0.471954345703125, -0.4096527099609375, -0.34735107421875, -0.2850494384765625, -0.222747802734375, -0.1604461669921875, -0.09814453125, -0.0358428955078125, 0.026458740234375, 0.0887603759765625, 0.15106201171875, 0.2133636474609375, 0.275665283203125, 0.3379669189453125, 0.4002685546875, 0.4625701904296875, 0.524871826171875, 0.5871734619140625, 0.64947509765625, 0.7117767333984375, 0.774078369140625, 0.8363800048828125, 0.898681640625, 0.9609832763671875, 1.023284912109375, 1.0855865478515625, 1.14788818359375, 1.2101898193359375, 1.272491455078125, 1.3347930908203125, 1.3970947265625, 1.4593963623046875, 1.521697998046875, 1.5839996337890625, 1.64630126953125, 1.7086029052734375, 1.770904541015625, 1.8332061767578125, 1.8955078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 9.0, 16.0, 26.0, 27.0, 36.0, 58.0, 81.0, 129.0, 180.0, 279.0, 463.0, 625.0, 1060.0, 1774.0, 3136.0, 5825.0, 12409.0, 34589.0, 283871.0, 3771137.0, 47456.0, 15339.0, 6917.0, 3581.0, 2086.0, 1168.0, 703.0, 438.0, 281.0, 186.0, 122.0, 83.0, 60.0, 42.0, 18.0, 16.0, 18.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.33984375, -7.111328125, -6.8828125, -6.654296875, -6.42578125, -6.197265625, -5.96875, -5.740234375, -5.51171875, -5.283203125, -5.0546875, -4.826171875, -4.59765625, -4.369140625, -4.140625, -3.912109375, -3.68359375, -3.455078125, -3.2265625, -2.998046875, -2.76953125, -2.541015625, -2.3125, -2.083984375, -1.85546875, -1.626953125, -1.3984375, -1.169921875, -0.94140625, -0.712890625, -0.484375, -0.255859375, -0.02734375, 0.201171875, 0.4296875, 0.658203125, 0.88671875, 1.115234375, 1.34375, 1.572265625, 1.80078125, 2.029296875, 2.2578125, 2.486328125, 2.71484375, 2.943359375, 3.171875, 3.400390625, 3.62890625, 3.857421875, 4.0859375, 4.314453125, 4.54296875, 4.771484375, 5.0, 5.228515625, 5.45703125, 5.685546875, 5.9140625, 6.142578125, 6.37109375, 6.599609375, 6.828125, 7.056640625, 7.28515625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 8.0, 8.0, 10.0, 10.0, 23.0, 29.0, 56.0, 108.0, 785.0, 2770.0, 99.0, 41.0, 35.0, 24.0, 8.0, 6.0, 12.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.265625, -2.206024169921875, -2.14642333984375, -2.086822509765625, -2.0272216796875, -1.967620849609375, -1.90802001953125, -1.848419189453125, -1.788818359375, -1.729217529296875, -1.66961669921875, -1.610015869140625, -1.5504150390625, -1.490814208984375, -1.43121337890625, -1.371612548828125, -1.31201171875, -1.252410888671875, -1.19281005859375, -1.133209228515625, -1.0736083984375, -1.014007568359375, -0.95440673828125, -0.894805908203125, -0.835205078125, -0.775604248046875, -0.71600341796875, -0.656402587890625, -0.5968017578125, -0.537200927734375, -0.47760009765625, -0.417999267578125, -0.3583984375, -0.298797607421875, -0.23919677734375, -0.179595947265625, -0.1199951171875, -0.060394287109375, -0.00079345703125, 0.058807373046875, 0.118408203125, 0.178009033203125, 0.23760986328125, 0.297210693359375, 0.3568115234375, 0.416412353515625, 0.47601318359375, 0.535614013671875, 0.59521484375, 0.654815673828125, 0.71441650390625, 0.774017333984375, 0.8336181640625, 0.893218994140625, 0.95281982421875, 1.012420654296875, 1.072021484375, 1.131622314453125, 1.19122314453125, 1.250823974609375, 1.3104248046875, 1.370025634765625, 1.42962646484375, 1.489227294921875, 1.548828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 8.0, 17.0, 41.0, 120.0, 261.0, 267.0, 154.0, 81.0, 38.0, 10.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.034439086914062, -17.463809967041016, -16.89318084716797, -16.322551727294922, -15.751923561096191, -15.181294441223145, -14.610665321350098, -14.04003620147705, -13.46940803527832, -12.898778915405273, -12.328149795532227, -11.75752067565918, -11.18689250946045, -10.616263389587402, -10.045634269714355, -9.475005149841309, -8.904376029968262, -8.333746910095215, -7.763118267059326, -7.192489147186279, -6.621860504150391, -6.051231384277344, -5.480602264404297, -4.90997314453125, -4.339344501495361, -3.7687156200408936, -3.198086738586426, -2.627457618713379, -2.056828737258911, -1.4861998558044434, -0.9155707359313965, -0.3449418544769287, 0.22568702697753906, 0.7963159680366516, 1.3669449090957642, 1.9375739097595215, 2.5082027912139893, 3.078831672668457, 3.649460792541504, 4.220089912414551, 4.7907185554504395, 5.361347675323486, 5.931976318359375, 6.502605438232422, 7.073234558105469, 7.643863201141357, 8.214492797851562, 8.785120964050293, 9.35575008392334, 9.926379203796387, 10.497008323669434, 11.067636489868164, 11.638265609741211, 12.208894729614258, 12.779523849487305, 13.350152969360352, 13.920782089233398, 14.491411209106445, 15.062040328979492, 15.632669448852539, 16.203298568725586, 16.77392578125, 17.344554901123047, 17.915184020996094, 18.48581314086914]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 11.0, 11.0, 10.0, 16.0, 20.0, 24.0, 21.0, 31.0, 40.0, 40.0, 44.0, 49.0, 47.0, 48.0, 49.0, 49.0, 47.0, 38.0, 34.0, 42.0, 52.0, 36.0, 39.0, 31.0, 33.0, 26.0, 21.0, 19.0, 20.0, 11.0, 7.0, 7.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.4828200340271, -4.332315921783447, -4.181811332702637, -4.031307220458984, -3.880803108215332, -3.7302987575531006, -3.579794406890869, -3.429290294647217, -3.2787859439849854, -3.128281593322754, -2.9777774810791016, -2.82727313041687, -2.6767687797546387, -2.5262646675109863, -2.375760316848755, -2.2252559661865234, -2.074751853942871, -1.9242476224899292, -1.7737433910369873, -1.6232390403747559, -1.472734808921814, -1.322230577468872, -1.1717262268066406, -1.0212219953536987, -0.8707177639007568, -0.7202135324478149, -0.5697092413902283, -0.419204980134964, -0.2687007188796997, -0.11819648742675781, 0.03230780363082886, 0.18281209468841553, 0.3333158493041992, 0.4838201105594635, 0.6343243718147278, 0.7848286628723145, 0.9353328943252563, 1.0858371257781982, 1.2363414764404297, 1.3868457078933716, 1.5373499393463135, 1.6878541707992554, 1.8383584022521973, 1.9888627529144287, 2.13936710357666, 2.2898712158203125, 2.440375566482544, 2.5908799171447754, 2.7413840293884277, 2.891888380050659, 3.0423924922943115, 3.192896842956543, 3.3434009552001953, 3.4939053058624268, 3.644409656524658, 3.7949137687683105, 3.945418119430542, 4.095922470092773, 4.246426582336426, 4.396930694580078, 4.547435283660889, 4.697939395904541, 4.848443508148193, 4.998948097229004, 5.149452209472656]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 14.0, 10.0, 22.0, 32.0, 48.0, 54.0, 82.0, 136.0, 235.0, 341.0, 481.0, 799.0, 1443.0, 2283.0, 3754.0, 6639.0, 11318.0, 19793.0, 34439.0, 59907.0, 103277.0, 164543.0, 210849.0, 171416.0, 107518.0, 63079.0, 36014.0, 20898.0, 11905.0, 6929.0, 4056.0, 2354.0, 1415.0, 922.0, 546.0, 370.0, 213.0, 147.0, 100.0, 58.0, 43.0, 27.0, 14.0, 16.0, 9.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.810546875, -2.72918701171875, -2.6478271484375, -2.56646728515625, -2.485107421875, -2.40374755859375, -2.3223876953125, -2.24102783203125, -2.15966796875, -2.07830810546875, -1.9969482421875, -1.91558837890625, -1.834228515625, -1.75286865234375, -1.6715087890625, -1.59014892578125, -1.5087890625, -1.42742919921875, -1.3460693359375, -1.26470947265625, -1.183349609375, -1.10198974609375, -1.0206298828125, -0.93927001953125, -0.85791015625, -0.77655029296875, -0.6951904296875, -0.61383056640625, -0.532470703125, -0.45111083984375, -0.3697509765625, -0.28839111328125, -0.20703125, -0.12567138671875, -0.0443115234375, 0.03704833984375, 0.118408203125, 0.19976806640625, 0.2811279296875, 0.36248779296875, 0.44384765625, 0.52520751953125, 0.6065673828125, 0.68792724609375, 0.769287109375, 0.85064697265625, 0.9320068359375, 1.01336669921875, 1.0947265625, 1.17608642578125, 1.2574462890625, 1.33880615234375, 1.420166015625, 1.50152587890625, 1.5828857421875, 1.66424560546875, 1.74560546875, 1.82696533203125, 1.9083251953125, 1.98968505859375, 2.071044921875, 2.15240478515625, 2.2337646484375, 2.31512451171875, 2.396484375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 1.0, 7.0, 5.0, 9.0, 7.0, 11.0, 10.0, 9.0, 10.0, 15.0, 11.0, 27.0, 22.0, 38.0, 34.0, 34.0, 38.0, 33.0, 51.0, 45.0, 50.0, 48.0, 42.0, 49.0, 31.0, 38.0, 33.0, 40.0, 34.0, 30.0, 33.0, 36.0, 19.0, 18.0, 16.0, 11.0, 15.0, 9.0, 7.0, 4.0, 11.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9921875, -1.925537109375, -1.85888671875, -1.792236328125, -1.7255859375, -1.658935546875, -1.59228515625, -1.525634765625, -1.458984375, -1.392333984375, -1.32568359375, -1.259033203125, -1.1923828125, -1.125732421875, -1.05908203125, -0.992431640625, -0.92578125, -0.859130859375, -0.79248046875, -0.725830078125, -0.6591796875, -0.592529296875, -0.52587890625, -0.459228515625, -0.392578125, -0.325927734375, -0.25927734375, -0.192626953125, -0.1259765625, -0.059326171875, 0.00732421875, 0.073974609375, 0.140625, 0.207275390625, 0.27392578125, 0.340576171875, 0.4072265625, 0.473876953125, 0.54052734375, 0.607177734375, 0.673828125, 0.740478515625, 0.80712890625, 0.873779296875, 0.9404296875, 1.007080078125, 1.07373046875, 1.140380859375, 1.20703125, 1.273681640625, 1.34033203125, 1.406982421875, 1.4736328125, 1.540283203125, 1.60693359375, 1.673583984375, 1.740234375, 1.806884765625, 1.87353515625, 1.940185546875, 2.0068359375, 2.073486328125, 2.14013671875, 2.206787109375, 2.2734375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 6.0, 13.0, 26.0, 22.0, 27.0, 58.0, 54.0, 95.0, 142.0, 184.0, 277.0, 429.0, 645.0, 977.0, 1825.0, 4945.0, 21309.0, 152244.0, 680948.0, 153082.0, 21357.0, 4986.0, 1980.0, 918.0, 584.0, 389.0, 285.0, 190.0, 145.0, 112.0, 72.0, 64.0, 35.0, 34.0, 17.0, 16.0, 16.0, 11.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.15234375, -6.9178466796875, -6.683349609375, -6.4488525390625, -6.21435546875, -5.9798583984375, -5.745361328125, -5.5108642578125, -5.2763671875, -5.0418701171875, -4.807373046875, -4.5728759765625, -4.33837890625, -4.1038818359375, -3.869384765625, -3.6348876953125, -3.400390625, -3.1658935546875, -2.931396484375, -2.6968994140625, -2.46240234375, -2.2279052734375, -1.993408203125, -1.7589111328125, -1.5244140625, -1.2899169921875, -1.055419921875, -0.8209228515625, -0.58642578125, -0.3519287109375, -0.117431640625, 0.1170654296875, 0.3515625, 0.5860595703125, 0.820556640625, 1.0550537109375, 1.28955078125, 1.5240478515625, 1.758544921875, 1.9930419921875, 2.2275390625, 2.4620361328125, 2.696533203125, 2.9310302734375, 3.16552734375, 3.4000244140625, 3.634521484375, 3.8690185546875, 4.103515625, 4.3380126953125, 4.572509765625, 4.8070068359375, 5.04150390625, 5.2760009765625, 5.510498046875, 5.7449951171875, 5.9794921875, 6.2139892578125, 6.448486328125, 6.6829833984375, 6.91748046875, 7.1519775390625, 7.386474609375, 7.6209716796875, 7.85546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 9.0, 5.0, 11.0, 5.0, 10.0, 17.0, 11.0, 14.0, 17.0, 26.0, 25.0, 28.0, 18.0, 46.0, 31.0, 29.0, 36.0, 41.0, 42.0, 49.0, 35.0, 43.0, 47.0, 44.0, 37.0, 35.0, 42.0, 34.0, 23.0, 25.0, 23.0, 21.0, 26.0, 14.0, 19.0, 13.0, 15.0, 13.0, 3.0, 6.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-10.015625, -9.7249755859375, -9.434326171875, -9.1436767578125, -8.85302734375, -8.5623779296875, -8.271728515625, -7.9810791015625, -7.6904296875, -7.3997802734375, -7.109130859375, -6.8184814453125, -6.52783203125, -6.2371826171875, -5.946533203125, -5.6558837890625, -5.365234375, -5.0745849609375, -4.783935546875, -4.4932861328125, -4.20263671875, -3.9119873046875, -3.621337890625, -3.3306884765625, -3.0400390625, -2.7493896484375, -2.458740234375, -2.1680908203125, -1.87744140625, -1.5867919921875, -1.296142578125, -1.0054931640625, -0.71484375, -0.4241943359375, -0.133544921875, 0.1571044921875, 0.44775390625, 0.7384033203125, 1.029052734375, 1.3197021484375, 1.6103515625, 1.9010009765625, 2.191650390625, 2.4822998046875, 2.77294921875, 3.0635986328125, 3.354248046875, 3.6448974609375, 3.935546875, 4.2261962890625, 4.516845703125, 4.8074951171875, 5.09814453125, 5.3887939453125, 5.679443359375, 5.9700927734375, 6.2607421875, 6.5513916015625, 6.842041015625, 7.1326904296875, 7.42333984375, 7.7139892578125, 8.004638671875, 8.2952880859375, 8.5859375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 12.0, 15.0, 15.0, 16.0, 30.0, 46.0, 66.0, 126.0, 216.0, 474.0, 1161.0, 4366.0, 29602.0, 551650.0, 430566.0, 24307.0, 3847.0, 1075.0, 422.0, 219.0, 107.0, 77.0, 50.0, 30.0, 21.0, 13.0, 11.0, 6.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.5, -6.30859375, -6.1171875, -5.92578125, -5.734375, -5.54296875, -5.3515625, -5.16015625, -4.96875, -4.77734375, -4.5859375, -4.39453125, -4.203125, -4.01171875, -3.8203125, -3.62890625, -3.4375, -3.24609375, -3.0546875, -2.86328125, -2.671875, -2.48046875, -2.2890625, -2.09765625, -1.90625, -1.71484375, -1.5234375, -1.33203125, -1.140625, -0.94921875, -0.7578125, -0.56640625, -0.375, -0.18359375, 0.0078125, 0.19921875, 0.390625, 0.58203125, 0.7734375, 0.96484375, 1.15625, 1.34765625, 1.5390625, 1.73046875, 1.921875, 2.11328125, 2.3046875, 2.49609375, 2.6875, 2.87890625, 3.0703125, 3.26171875, 3.453125, 3.64453125, 3.8359375, 4.02734375, 4.21875, 4.41015625, 4.6015625, 4.79296875, 4.984375, 5.17578125, 5.3671875, 5.55859375, 5.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 12.0, 15.0, 12.0, 25.0, 31.0, 51.0, 75.0, 106.0, 152.0, 163.0, 110.0, 87.0, 52.0, 54.0, 19.0, 14.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009241104125976562, -0.0008888691663742065, -0.0008536279201507568, -0.0008183866739273071, -0.0007831454277038574, -0.0007479041814804077, -0.000712662935256958, -0.0006774216890335083, -0.0006421804428100586, -0.0006069391965866089, -0.0005716979503631592, -0.0005364567041397095, -0.0005012154579162598, -0.00046597421169281006, -0.00043073296546936035, -0.00039549171924591064, -0.00036025047302246094, -0.00032500922679901123, -0.0002897679805755615, -0.0002545267343521118, -0.0002192854881286621, -0.0001840442419052124, -0.0001488029956817627, -0.00011356174945831299, -7.832050323486328e-05, -4.3079257011413574e-05, -7.838010787963867e-06, 2.740323543548584e-05, 6.264448165893555e-05, 9.788572788238525e-05, 0.00013312697410583496, 0.00016836822032928467, 0.00020360946655273438, 0.00023885071277618408, 0.0002740919589996338, 0.0003093332052230835, 0.0003445744514465332, 0.0003798156976699829, 0.0004150569438934326, 0.0004502981901168823, 0.00048553943634033203, 0.0005207806825637817, 0.0005560219287872314, 0.0005912631750106812, 0.0006265044212341309, 0.0006617456674575806, 0.0006969869136810303, 0.00073222815990448, 0.0007674694061279297, 0.0008027106523513794, 0.0008379518985748291, 0.0008731931447982788, 0.0009084343910217285, 0.0009436756372451782, 0.000978916883468628, 0.0010141581296920776, 0.0010493993759155273, 0.001084640622138977, 0.0011198818683624268, 0.0011551231145858765, 0.0011903643608093262, 0.0012256056070327759, 0.0012608468532562256, 0.0012960880994796753, 0.001331329345703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 7.0, 5.0, 11.0, 6.0, 13.0, 23.0, 27.0, 37.0, 40.0, 76.0, 98.0, 125.0, 203.0, 382.0, 694.0, 1335.0, 3072.0, 8247.0, 32935.0, 220502.0, 626631.0, 122624.0, 20552.0, 5850.0, 2394.0, 1143.0, 555.0, 341.0, 167.0, 139.0, 89.0, 73.0, 41.0, 28.0, 16.0, 16.0, 12.0, 5.0, 8.0, 6.0, 2.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.2890625, -4.156494140625, -4.02392578125, -3.891357421875, -3.7587890625, -3.626220703125, -3.49365234375, -3.361083984375, -3.228515625, -3.095947265625, -2.96337890625, -2.830810546875, -2.6982421875, -2.565673828125, -2.43310546875, -2.300537109375, -2.16796875, -2.035400390625, -1.90283203125, -1.770263671875, -1.6376953125, -1.505126953125, -1.37255859375, -1.239990234375, -1.107421875, -0.974853515625, -0.84228515625, -0.709716796875, -0.5771484375, -0.444580078125, -0.31201171875, -0.179443359375, -0.046875, 0.085693359375, 0.21826171875, 0.350830078125, 0.4833984375, 0.615966796875, 0.74853515625, 0.881103515625, 1.013671875, 1.146240234375, 1.27880859375, 1.411376953125, 1.5439453125, 1.676513671875, 1.80908203125, 1.941650390625, 2.07421875, 2.206787109375, 2.33935546875, 2.471923828125, 2.6044921875, 2.737060546875, 2.86962890625, 3.002197265625, 3.134765625, 3.267333984375, 3.39990234375, 3.532470703125, 3.6650390625, 3.797607421875, 3.93017578125, 4.062744140625, 4.1953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 5.0, 5.0, 9.0, 11.0, 11.0, 15.0, 19.0, 24.0, 46.0, 53.0, 46.0, 65.0, 75.0, 91.0, 95.0, 91.0, 70.0, 61.0, 40.0, 43.0, 28.0, 22.0, 19.0, 19.0, 10.0, 9.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.93359375, -5.8026123046875, -5.671630859375, -5.5406494140625, -5.40966796875, -5.2786865234375, -5.147705078125, -5.0167236328125, -4.8857421875, -4.7547607421875, -4.623779296875, -4.4927978515625, -4.36181640625, -4.2308349609375, -4.099853515625, -3.9688720703125, -3.837890625, -3.7069091796875, -3.575927734375, -3.4449462890625, -3.31396484375, -3.1829833984375, -3.052001953125, -2.9210205078125, -2.7900390625, -2.6590576171875, -2.528076171875, -2.3970947265625, -2.26611328125, -2.1351318359375, -2.004150390625, -1.8731689453125, -1.7421875, -1.6112060546875, -1.480224609375, -1.3492431640625, -1.21826171875, -1.0872802734375, -0.956298828125, -0.8253173828125, -0.6943359375, -0.5633544921875, -0.432373046875, -0.3013916015625, -0.17041015625, -0.0394287109375, 0.091552734375, 0.2225341796875, 0.353515625, 0.4844970703125, 0.615478515625, 0.7464599609375, 0.87744140625, 1.0084228515625, 1.139404296875, 1.2703857421875, 1.4013671875, 1.5323486328125, 1.663330078125, 1.7943115234375, 1.92529296875, 2.0562744140625, 2.187255859375, 2.3182373046875, 2.44921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 27.0, 93.0, 229.0, 300.0, 209.0, 87.0, 25.0, 9.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.5, -108.67144775390625, -104.84290313720703, -101.01435089111328, -97.18580627441406, -93.35725402832031, -89.52870178222656, -85.70014953613281, -81.8716049194336, -78.04305267333984, -74.21450805664062, -70.38595581054688, -66.55740356445312, -62.728858947753906, -58.900306701660156, -55.07175827026367, -51.24320983886719, -47.4146614074707, -43.58611297607422, -39.75756072998047, -35.929012298583984, -32.1004638671875, -28.271913528442383, -24.443363189697266, -20.61481475830078, -16.786266326904297, -12.95771598815918, -9.129166603088379, -5.300617218017578, -1.4720687866210938, 2.3564815521240234, 6.185031890869141, 10.013580322265625, 13.842129707336426, 17.670679092407227, 21.499229431152344, 25.327777862548828, 29.156326293945312, 32.98487854003906, 36.81342697143555, 40.64197540283203, 44.470523834228516, 48.299072265625, 52.12762451171875, 55.956172943115234, 59.78472137451172, 63.61327362060547, 67.44181823730469, 71.27037048339844, 75.09892272949219, 78.9274673461914, 82.75601959228516, 86.58456420898438, 90.41311645507812, 94.24166870117188, 98.07022094726562, 101.89876556396484, 105.7273178100586, 109.55586242675781, 113.38441467285156, 117.21296691894531, 121.04151153564453, 124.87006378173828, 128.6986083984375, 132.52716064453125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 9.0, 6.0, 7.0, 17.0, 10.0, 20.0, 24.0, 38.0, 40.0, 43.0, 50.0, 48.0, 50.0, 56.0, 55.0, 66.0, 59.0, 54.0, 68.0, 34.0, 38.0, 41.0, 30.0, 28.0, 21.0, 22.0, 21.0, 12.0, 9.0, 10.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-68.15034484863281, -66.32388305664062, -64.49742889404297, -62.67096710205078, -60.84450912475586, -59.01805114746094, -57.191593170166016, -55.365135192871094, -53.538673400878906, -51.712215423583984, -49.88575744628906, -48.059295654296875, -46.23283767700195, -44.40637969970703, -42.57992172241211, -40.75346374511719, -38.927001953125, -37.10054397583008, -35.274085998535156, -33.44762420654297, -31.621166229248047, -29.794708251953125, -27.968250274658203, -26.14179039001465, -24.31533432006836, -22.488876342773438, -20.662416458129883, -18.83595848083496, -17.009498596191406, -15.183040618896484, -13.356581687927246, -11.530122756958008, -9.703662872314453, -7.877203941345215, -6.050745010375977, -4.2242865562438965, -2.397827625274658, -0.5713691711425781, 1.2550897598266602, 3.0815486907958984, 4.908007621765137, 6.734466552734375, 8.560925483703613, 10.387384414672852, 12.213842391967773, 14.040301322937012, 15.86676025390625, 17.693218231201172, 19.519678115844727, 21.34613609313965, 23.172595977783203, 24.999053955078125, 26.82551383972168, 28.6519718170166, 30.478431701660156, 32.30488967895508, 34.13134765625, 35.95780563354492, 37.784263610839844, 39.61072540283203, 41.43718338012695, 43.263641357421875, 45.0900993347168, 46.91655731201172, 48.743019104003906]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 9.0, 4.0, 6.0, 10.0, 13.0, 18.0, 24.0, 47.0, 87.0, 147.0, 244.0, 557.0, 1598.0, 5048.0, 23582.0, 3737365.0, 399834.0, 18880.0, 4195.0, 1437.0, 606.0, 241.0, 145.0, 57.0, 36.0, 31.0, 19.0, 10.0, 8.0, 6.0, 7.0, 5.0, 4.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.9453125, -14.517578125, -14.08984375, -13.662109375, -13.234375, -12.806640625, -12.37890625, -11.951171875, -11.5234375, -11.095703125, -10.66796875, -10.240234375, -9.8125, -9.384765625, -8.95703125, -8.529296875, -8.1015625, -7.673828125, -7.24609375, -6.818359375, -6.390625, -5.962890625, -5.53515625, -5.107421875, -4.6796875, -4.251953125, -3.82421875, -3.396484375, -2.96875, -2.541015625, -2.11328125, -1.685546875, -1.2578125, -0.830078125, -0.40234375, 0.025390625, 0.453125, 0.880859375, 1.30859375, 1.736328125, 2.1640625, 2.591796875, 3.01953125, 3.447265625, 3.875, 4.302734375, 4.73046875, 5.158203125, 5.5859375, 6.013671875, 6.44140625, 6.869140625, 7.296875, 7.724609375, 8.15234375, 8.580078125, 9.0078125, 9.435546875, 9.86328125, 10.291015625, 10.71875, 11.146484375, 11.57421875, 12.001953125, 12.4296875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 12.0, 18.0, 23.0, 37.0, 45.0, 54.0, 62.0, 56.0, 66.0, 77.0, 57.0, 68.0, 64.0, 53.0, 52.0, 57.0, 43.0, 45.0, 19.0, 20.0, 13.0, 10.0, 13.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.353515625, -2.254791259765625, -2.15606689453125, -2.057342529296875, -1.9586181640625, -1.859893798828125, -1.76116943359375, -1.662445068359375, -1.563720703125, -1.464996337890625, -1.36627197265625, -1.267547607421875, -1.1688232421875, -1.070098876953125, -0.97137451171875, -0.872650146484375, -0.77392578125, -0.675201416015625, -0.57647705078125, -0.477752685546875, -0.3790283203125, -0.280303955078125, -0.18157958984375, -0.082855224609375, 0.015869140625, 0.114593505859375, 0.21331787109375, 0.312042236328125, 0.4107666015625, 0.509490966796875, 0.60821533203125, 0.706939697265625, 0.8056640625, 0.904388427734375, 1.00311279296875, 1.101837158203125, 1.2005615234375, 1.299285888671875, 1.39801025390625, 1.496734619140625, 1.595458984375, 1.694183349609375, 1.79290771484375, 1.891632080078125, 1.9903564453125, 2.089080810546875, 2.18780517578125, 2.286529541015625, 2.38525390625, 2.483978271484375, 2.58270263671875, 2.681427001953125, 2.7801513671875, 2.878875732421875, 2.97760009765625, 3.076324462890625, 3.175048828125, 3.273773193359375, 3.37249755859375, 3.471221923828125, 3.5699462890625, 3.668670654296875, 3.76739501953125, 3.866119384765625, 3.96484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 5.0, 9.0, 6.0, 17.0, 9.0, 14.0, 30.0, 22.0, 42.0, 53.0, 73.0, 102.0, 118.0, 200.0, 302.0, 549.0, 1059.0, 2217.0, 5388.0, 15796.0, 69654.0, 3818294.0, 235731.0, 29034.0, 8705.0, 3348.0, 1515.0, 742.0, 398.0, 238.0, 173.0, 102.0, 86.0, 70.0, 36.0, 34.0, 26.0, 7.0, 12.0, 17.0, 7.0, 9.0, 10.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.96875, -8.6861572265625, -8.403564453125, -8.1209716796875, -7.83837890625, -7.5557861328125, -7.273193359375, -6.9906005859375, -6.7080078125, -6.4254150390625, -6.142822265625, -5.8602294921875, -5.57763671875, -5.2950439453125, -5.012451171875, -4.7298583984375, -4.447265625, -4.1646728515625, -3.882080078125, -3.5994873046875, -3.31689453125, -3.0343017578125, -2.751708984375, -2.4691162109375, -2.1865234375, -1.9039306640625, -1.621337890625, -1.3387451171875, -1.05615234375, -0.7735595703125, -0.490966796875, -0.2083740234375, 0.07421875, 0.3568115234375, 0.639404296875, 0.9219970703125, 1.20458984375, 1.4871826171875, 1.769775390625, 2.0523681640625, 2.3349609375, 2.6175537109375, 2.900146484375, 3.1827392578125, 3.46533203125, 3.7479248046875, 4.030517578125, 4.3131103515625, 4.595703125, 4.8782958984375, 5.160888671875, 5.4434814453125, 5.72607421875, 6.0086669921875, 6.291259765625, 6.5738525390625, 6.8564453125, 7.1390380859375, 7.421630859375, 7.7042236328125, 7.98681640625, 8.2694091796875, 8.552001953125, 8.8345947265625, 9.1171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 13.0, 10.0, 17.0, 43.0, 109.0, 311.0, 3125.0, 266.0, 77.0, 32.0, 28.0, 15.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.84765625, -5.66741943359375, -5.4871826171875, -5.30694580078125, -5.126708984375, -4.94647216796875, -4.7662353515625, -4.58599853515625, -4.40576171875, -4.22552490234375, -4.0452880859375, -3.86505126953125, -3.684814453125, -3.50457763671875, -3.3243408203125, -3.14410400390625, -2.9638671875, -2.78363037109375, -2.6033935546875, -2.42315673828125, -2.242919921875, -2.06268310546875, -1.8824462890625, -1.70220947265625, -1.52197265625, -1.34173583984375, -1.1614990234375, -0.98126220703125, -0.801025390625, -0.62078857421875, -0.4405517578125, -0.26031494140625, -0.080078125, 0.10015869140625, 0.2803955078125, 0.46063232421875, 0.640869140625, 0.82110595703125, 1.0013427734375, 1.18157958984375, 1.36181640625, 1.54205322265625, 1.7222900390625, 1.90252685546875, 2.082763671875, 2.26300048828125, 2.4432373046875, 2.62347412109375, 2.8037109375, 2.98394775390625, 3.1641845703125, 3.34442138671875, 3.524658203125, 3.70489501953125, 3.8851318359375, 4.06536865234375, 4.24560546875, 4.42584228515625, 4.6060791015625, 4.78631591796875, 4.966552734375, 5.14678955078125, 5.3270263671875, 5.50726318359375, 5.6875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 9.0, 5.0, 5.0, 11.0, 11.0, 30.0, 46.0, 70.0, 94.0, 118.0, 127.0, 121.0, 115.0, 87.0, 53.0, 42.0, 19.0, 8.0, 11.0, 8.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.948150634765625, -14.397525787353516, -13.84689998626709, -13.29627513885498, -12.745649337768555, -12.195024490356445, -11.644399642944336, -11.093774795532227, -10.5431489944458, -9.992524147033691, -9.441898345947266, -8.891273498535156, -8.340648651123047, -7.790022850036621, -7.239398002624512, -6.688772678375244, -6.138147354125977, -5.587522029876709, -5.036896705627441, -4.486271858215332, -3.9356465339660645, -3.385021209716797, -2.8343961238861084, -2.28377103805542, -1.7331457138061523, -1.1825205087661743, -0.6318953037261963, -0.08127009868621826, 0.46935510635375977, 1.0199804306030273, 1.5706055164337158, 2.1212306022644043, 2.671855926513672, 3.2224812507629395, 3.773106336593628, 4.323731422424316, 4.874356746673584, 5.424982070922852, 5.975606918334961, 6.5262322425842285, 7.076857566833496, 7.627482891082764, 8.178108215332031, 8.72873306274414, 9.27935791015625, 9.829983711242676, 10.380608558654785, 10.931234359741211, 11.48185920715332, 12.03248405456543, 12.583109855651855, 13.133734703063965, 13.68436050415039, 14.2349853515625, 14.78561019897461, 15.336235046386719, 15.886860847473145, 16.43748664855957, 16.98811149597168, 17.53873634338379, 18.0893611907959, 18.63998794555664, 19.19061279296875, 19.74123764038086, 20.29186248779297]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 10.0, 7.0, 12.0, 17.0, 12.0, 20.0, 20.0, 27.0, 34.0, 26.0, 40.0, 40.0, 28.0, 33.0, 50.0, 50.0, 41.0, 52.0, 38.0, 31.0, 35.0, 36.0, 37.0, 50.0, 27.0, 44.0, 19.0, 20.0, 26.0, 21.0, 14.0, 11.0, 21.0, 10.0, 5.0, 11.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.943729400634766, -9.657906532287598, -9.372084617614746, -9.086261749267578, -8.800439834594727, -8.514616966247559, -8.22879409790039, -7.942971706390381, -7.657149314880371, -7.371326923370361, -7.085504531860352, -6.799681663513184, -6.513859272003174, -6.228036880493164, -5.942214012145996, -5.656391620635986, -5.370569229125977, -5.084746837615967, -4.798924446105957, -4.513101577758789, -4.227279186248779, -3.9414567947387695, -3.6556341648101807, -3.369811534881592, -3.083989143371582, -2.7981667518615723, -2.5123441219329834, -2.2265214920043945, -1.9406991004943848, -1.6548765897750854, -1.3690540790557861, -1.0832314491271973, -0.7974090576171875, -0.5115865468978882, -0.22576403617858887, 0.06005847454071045, 0.34588098526000977, 0.6317034959793091, 0.9175260066986084, 1.2033486366271973, 1.489171028137207, 1.7749935388565063, 2.0608160495758057, 2.3466386795043945, 2.6324610710144043, 2.918283462524414, 3.204106092453003, 3.489928722381592, 3.7757511138916016, 4.061573505401611, 4.347395896911621, 4.633218765258789, 4.919041156768799, 5.204863548278809, 5.490686416625977, 5.776508808135986, 6.062331199645996, 6.348153591156006, 6.633975982666016, 6.919798851013184, 7.205621242523193, 7.491443634033203, 7.777266502380371, 8.063089370727539, 8.34891128540039]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 10.0, 15.0, 20.0, 17.0, 28.0, 34.0, 71.0, 83.0, 162.0, 232.0, 366.0, 581.0, 949.0, 1442.0, 2582.0, 4443.0, 7606.0, 13596.0, 25079.0, 45688.0, 83461.0, 159211.0, 268559.0, 201114.0, 105440.0, 57242.0, 31109.0, 16886.0, 9362.0, 5428.0, 2986.0, 1800.0, 1063.0, 654.0, 400.0, 274.0, 185.0, 119.0, 77.0, 50.0, 34.0, 29.0, 18.0, 15.0, 11.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.7890625, -3.669464111328125, -3.54986572265625, -3.430267333984375, -3.3106689453125, -3.191070556640625, -3.07147216796875, -2.951873779296875, -2.832275390625, -2.712677001953125, -2.59307861328125, -2.473480224609375, -2.3538818359375, -2.234283447265625, -2.11468505859375, -1.995086669921875, -1.87548828125, -1.755889892578125, -1.63629150390625, -1.516693115234375, -1.3970947265625, -1.277496337890625, -1.15789794921875, -1.038299560546875, -0.918701171875, -0.799102783203125, -0.67950439453125, -0.559906005859375, -0.4403076171875, -0.320709228515625, -0.20111083984375, -0.081512451171875, 0.0380859375, 0.157684326171875, 0.27728271484375, 0.396881103515625, 0.5164794921875, 0.636077880859375, 0.75567626953125, 0.875274658203125, 0.994873046875, 1.114471435546875, 1.23406982421875, 1.353668212890625, 1.4732666015625, 1.592864990234375, 1.71246337890625, 1.832061767578125, 1.95166015625, 2.071258544921875, 2.19085693359375, 2.310455322265625, 2.4300537109375, 2.549652099609375, 2.66925048828125, 2.788848876953125, 2.908447265625, 3.028045654296875, 3.14764404296875, 3.267242431640625, 3.3868408203125, 3.506439208984375, 3.62603759765625, 3.745635986328125, 3.865234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 4.0, 8.0, 21.0, 15.0, 24.0, 16.0, 34.0, 35.0, 48.0, 39.0, 55.0, 53.0, 59.0, 48.0, 51.0, 56.0, 66.0, 53.0, 48.0, 37.0, 37.0, 35.0, 29.0, 35.0, 16.0, 16.0, 14.0, 13.0, 6.0, 3.0, 5.0, 3.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6328125, -2.54388427734375, -2.4549560546875, -2.36602783203125, -2.277099609375, -2.18817138671875, -2.0992431640625, -2.01031494140625, -1.92138671875, -1.83245849609375, -1.7435302734375, -1.65460205078125, -1.565673828125, -1.47674560546875, -1.3878173828125, -1.29888916015625, -1.2099609375, -1.12103271484375, -1.0321044921875, -0.94317626953125, -0.854248046875, -0.76531982421875, -0.6763916015625, -0.58746337890625, -0.49853515625, -0.40960693359375, -0.3206787109375, -0.23175048828125, -0.142822265625, -0.05389404296875, 0.0350341796875, 0.12396240234375, 0.212890625, 0.30181884765625, 0.3907470703125, 0.47967529296875, 0.568603515625, 0.65753173828125, 0.7464599609375, 0.83538818359375, 0.92431640625, 1.01324462890625, 1.1021728515625, 1.19110107421875, 1.280029296875, 1.36895751953125, 1.4578857421875, 1.54681396484375, 1.6357421875, 1.72467041015625, 1.8135986328125, 1.90252685546875, 1.991455078125, 2.08038330078125, 2.1693115234375, 2.25823974609375, 2.34716796875, 2.43609619140625, 2.5250244140625, 2.61395263671875, 2.702880859375, 2.79180908203125, 2.8807373046875, 2.96966552734375, 3.05859375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 10.0, 18.0, 29.0, 36.0, 72.0, 108.0, 131.0, 214.0, 394.0, 609.0, 1067.0, 2207.0, 6321.0, 34097.0, 378211.0, 562849.0, 48605.0, 7992.0, 2497.0, 1281.0, 643.0, 410.0, 276.0, 139.0, 102.0, 76.0, 38.0, 28.0, 24.0, 13.0, 10.0, 9.0, 9.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -8.9912109375, -8.646484375, -8.3017578125, -7.95703125, -7.6123046875, -7.267578125, -6.9228515625, -6.578125, -6.2333984375, -5.888671875, -5.5439453125, -5.19921875, -4.8544921875, -4.509765625, -4.1650390625, -3.8203125, -3.4755859375, -3.130859375, -2.7861328125, -2.44140625, -2.0966796875, -1.751953125, -1.4072265625, -1.0625, -0.7177734375, -0.373046875, -0.0283203125, 0.31640625, 0.6611328125, 1.005859375, 1.3505859375, 1.6953125, 2.0400390625, 2.384765625, 2.7294921875, 3.07421875, 3.4189453125, 3.763671875, 4.1083984375, 4.453125, 4.7978515625, 5.142578125, 5.4873046875, 5.83203125, 6.1767578125, 6.521484375, 6.8662109375, 7.2109375, 7.5556640625, 7.900390625, 8.2451171875, 8.58984375, 8.9345703125, 9.279296875, 9.6240234375, 9.96875, 10.3134765625, 10.658203125, 11.0029296875, 11.34765625, 11.6923828125, 12.037109375, 12.3818359375, 12.7265625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 4.0, 6.0, 12.0, 5.0, 12.0, 9.0, 10.0, 19.0, 23.0, 25.0, 26.0, 20.0, 28.0, 41.0, 31.0, 36.0, 48.0, 40.0, 47.0, 41.0, 33.0, 44.0, 48.0, 31.0, 31.0, 42.0, 34.0, 38.0, 19.0, 33.0, 26.0, 19.0, 18.0, 19.0, 13.0, 16.0, 6.0, 5.0, 8.0, 9.0, 4.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.09375, -8.8101806640625, -8.526611328125, -8.2430419921875, -7.95947265625, -7.6759033203125, -7.392333984375, -7.1087646484375, -6.8251953125, -6.5416259765625, -6.258056640625, -5.9744873046875, -5.69091796875, -5.4073486328125, -5.123779296875, -4.8402099609375, -4.556640625, -4.2730712890625, -3.989501953125, -3.7059326171875, -3.42236328125, -3.1387939453125, -2.855224609375, -2.5716552734375, -2.2880859375, -2.0045166015625, -1.720947265625, -1.4373779296875, -1.15380859375, -0.8702392578125, -0.586669921875, -0.3031005859375, -0.01953125, 0.2640380859375, 0.547607421875, 0.8311767578125, 1.11474609375, 1.3983154296875, 1.681884765625, 1.9654541015625, 2.2490234375, 2.5325927734375, 2.816162109375, 3.0997314453125, 3.38330078125, 3.6668701171875, 3.950439453125, 4.2340087890625, 4.517578125, 4.8011474609375, 5.084716796875, 5.3682861328125, 5.65185546875, 5.9354248046875, 6.218994140625, 6.5025634765625, 6.7861328125, 7.0697021484375, 7.353271484375, 7.6368408203125, 7.92041015625, 8.2039794921875, 8.487548828125, 8.7711181640625, 9.0546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 8.0, 14.0, 19.0, 34.0, 50.0, 83.0, 156.0, 226.0, 539.0, 1271.0, 3407.0, 12920.0, 74172.0, 553132.0, 342709.0, 46251.0, 8939.0, 2600.0, 967.0, 461.0, 255.0, 124.0, 80.0, 49.0, 29.0, 12.0, 13.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.40625, -4.295745849609375, -4.18524169921875, -4.074737548828125, -3.9642333984375, -3.853729248046875, -3.74322509765625, -3.632720947265625, -3.522216796875, -3.411712646484375, -3.30120849609375, -3.190704345703125, -3.0802001953125, -2.969696044921875, -2.85919189453125, -2.748687744140625, -2.63818359375, -2.527679443359375, -2.41717529296875, -2.306671142578125, -2.1961669921875, -2.085662841796875, -1.97515869140625, -1.864654541015625, -1.754150390625, -1.643646240234375, -1.53314208984375, -1.422637939453125, -1.3121337890625, -1.201629638671875, -1.09112548828125, -0.980621337890625, -0.8701171875, -0.759613037109375, -0.64910888671875, -0.538604736328125, -0.4281005859375, -0.317596435546875, -0.20709228515625, -0.096588134765625, 0.013916015625, 0.124420166015625, 0.23492431640625, 0.345428466796875, 0.4559326171875, 0.566436767578125, 0.67694091796875, 0.787445068359375, 0.89794921875, 1.008453369140625, 1.11895751953125, 1.229461669921875, 1.3399658203125, 1.450469970703125, 1.56097412109375, 1.671478271484375, 1.781982421875, 1.892486572265625, 2.00299072265625, 2.113494873046875, 2.2239990234375, 2.334503173828125, 2.44500732421875, 2.555511474609375, 2.666015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 9.0, 7.0, 9.0, 9.0, 13.0, 14.0, 17.0, 32.0, 37.0, 45.0, 54.0, 59.0, 80.0, 114.0, 105.0, 94.0, 53.0, 42.0, 37.0, 31.0, 27.0, 25.0, 13.0, 10.0, 14.0, 11.0, 8.0, 5.0, 8.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000888824462890625, -0.0008640140295028687, -0.0008392035961151123, -0.000814393162727356, -0.0007895827293395996, -0.0007647722959518433, -0.0007399618625640869, -0.0007151514291763306, -0.0006903409957885742, -0.0006655305624008179, -0.0006407201290130615, -0.0006159096956253052, -0.0005910992622375488, -0.0005662888288497925, -0.0005414783954620361, -0.0005166679620742798, -0.0004918575286865234, -0.0004670470952987671, -0.00044223666191101074, -0.0004174262285232544, -0.00039261579513549805, -0.0003678053617477417, -0.00034299492835998535, -0.000318184494972229, -0.00029337406158447266, -0.0002685636281967163, -0.00024375319480895996, -0.0002189427614212036, -0.00019413232803344727, -0.00016932189464569092, -0.00014451146125793457, -0.00011970102787017822, -9.489059448242188e-05, -7.008016109466553e-05, -4.526972770690918e-05, -2.0459294319152832e-05, 4.351139068603516e-06, 2.9161572456359863e-05, 5.397200584411621e-05, 7.878243923187256e-05, 0.0001035928726196289, 0.00012840330600738525, 0.0001532137393951416, 0.00017802417278289795, 0.0002028346061706543, 0.00022764503955841064, 0.000252455472946167, 0.00027726590633392334, 0.0003020763397216797, 0.00032688677310943604, 0.0003516972064971924, 0.00037650763988494873, 0.0004013180732727051, 0.0004261285066604614, 0.0004509389400482178, 0.0004757493734359741, 0.0005005598068237305, 0.0005253702402114868, 0.0005501806735992432, 0.0005749911069869995, 0.0005998015403747559, 0.0006246119737625122, 0.0006494224071502686, 0.0006742328405380249, 0.0006990432739257812]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 7.0, 16.0, 16.0, 37.0, 49.0, 128.0, 450.0, 2438.0, 52018.0, 965331.0, 25685.0, 1791.0, 358.0, 116.0, 60.0, 23.0, 19.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.0859375, -11.77935791015625, -11.4727783203125, -11.16619873046875, -10.859619140625, -10.55303955078125, -10.2464599609375, -9.93988037109375, -9.63330078125, -9.32672119140625, -9.0201416015625, -8.71356201171875, -8.406982421875, -8.10040283203125, -7.7938232421875, -7.48724365234375, -7.1806640625, -6.87408447265625, -6.5675048828125, -6.26092529296875, -5.954345703125, -5.64776611328125, -5.3411865234375, -5.03460693359375, -4.72802734375, -4.42144775390625, -4.1148681640625, -3.80828857421875, -3.501708984375, -3.19512939453125, -2.8885498046875, -2.58197021484375, -2.275390625, -1.96881103515625, -1.6622314453125, -1.35565185546875, -1.049072265625, -0.74249267578125, -0.4359130859375, -0.12933349609375, 0.17724609375, 0.48382568359375, 0.7904052734375, 1.09698486328125, 1.403564453125, 1.71014404296875, 2.0167236328125, 2.32330322265625, 2.6298828125, 2.93646240234375, 3.2430419921875, 3.54962158203125, 3.856201171875, 4.16278076171875, 4.4693603515625, 4.77593994140625, 5.08251953125, 5.38909912109375, 5.6956787109375, 6.00225830078125, 6.308837890625, 6.61541748046875, 6.9219970703125, 7.22857666015625, 7.53515625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 8.0, 16.0, 28.0, 37.0, 50.0, 61.0, 84.0, 137.0, 127.0, 124.0, 112.0, 59.0, 47.0, 41.0, 34.0, 14.0, 11.0, 7.0, 3.0, 0.0, 1.0, 2.0], "bins": [-7.93359375, -7.7767333984375, -7.619873046875, -7.4630126953125, -7.30615234375, -7.1492919921875, -6.992431640625, -6.8355712890625, -6.6787109375, -6.5218505859375, -6.364990234375, -6.2081298828125, -6.05126953125, -5.8944091796875, -5.737548828125, -5.5806884765625, -5.423828125, -5.2669677734375, -5.110107421875, -4.9532470703125, -4.79638671875, -4.6395263671875, -4.482666015625, -4.3258056640625, -4.1689453125, -4.0120849609375, -3.855224609375, -3.6983642578125, -3.54150390625, -3.3846435546875, -3.227783203125, -3.0709228515625, -2.9140625, -2.7572021484375, -2.600341796875, -2.4434814453125, -2.28662109375, -2.1297607421875, -1.972900390625, -1.8160400390625, -1.6591796875, -1.5023193359375, -1.345458984375, -1.1885986328125, -1.03173828125, -0.8748779296875, -0.718017578125, -0.5611572265625, -0.404296875, -0.2474365234375, -0.090576171875, 0.0662841796875, 0.22314453125, 0.3800048828125, 0.536865234375, 0.6937255859375, 0.8505859375, 1.0074462890625, 1.164306640625, 1.3211669921875, 1.47802734375, 1.6348876953125, 1.791748046875, 1.9486083984375, 2.10546875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 10.0, 15.0, 47.0, 160.0, 313.0, 274.0, 140.0, 28.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.69741821289062, -79.9940414428711, -75.29066467285156, -70.5872802734375, -65.88390350341797, -61.18052673339844, -56.47714614868164, -51.773765563964844, -47.07038879394531, -42.36701202392578, -37.663631439208984, -32.96025085449219, -28.256874084472656, -23.553495407104492, -18.850116729736328, -14.146736145019531, -9.443359375, -4.739980697631836, -0.036602020263671875, 4.666776657104492, 9.370155334472656, 14.07353401184082, 18.776912689208984, 23.48029327392578, 28.183670043945312, 32.887046813964844, 37.59042739868164, 42.29380798339844, 46.99718475341797, 51.7005615234375, 56.4039421081543, 61.107322692871094, 65.81071472167969, 70.51409149169922, 75.21746826171875, 79.92085266113281, 84.62422943115234, 89.32760620117188, 94.03099060058594, 98.73436737060547, 103.437744140625, 108.14112091064453, 112.84449768066406, 117.54788208007812, 122.25125885009766, 126.95463562011719, 131.65802001953125, 136.36138916015625, 141.0647735595703, 145.76815795898438, 150.47152709960938, 155.17491149902344, 159.8782958984375, 164.5816650390625, 169.28504943847656, 173.98843383789062, 178.69180297851562, 183.3951873779297, 188.0985565185547, 192.80194091796875, 197.50531005859375, 202.2086944580078, 206.91207885742188, 211.61544799804688, 216.31883239746094]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 6.0, 10.0, 10.0, 15.0, 19.0, 22.0, 32.0, 27.0, 40.0, 33.0, 42.0, 49.0, 51.0, 51.0, 48.0, 55.0, 58.0, 47.0, 47.0, 53.0, 31.0, 38.0, 34.0, 27.0, 31.0, 16.0, 19.0, 20.0, 18.0, 11.0, 6.0, 7.0, 8.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.310977935791016, -43.69022750854492, -42.069480895996094, -40.44873046875, -38.82798385620117, -37.20723342895508, -35.58648681640625, -33.965736389160156, -32.34498596191406, -30.7242374420166, -29.10348892211914, -27.482738494873047, -25.86199188232422, -24.241241455078125, -22.620492935180664, -20.999744415283203, -19.378997802734375, -17.758249282836914, -16.137500762939453, -14.516751289367676, -12.896002769470215, -11.275254249572754, -9.654504776000977, -8.033756256103516, -6.413007736206055, -4.792259216308594, -3.1715102195739746, -1.5507612228393555, 0.06998729705810547, 1.6907358169555664, 3.3114852905273438, 4.932233810424805, 6.552986145019531, 8.173734664916992, 9.794483184814453, 11.41523265838623, 13.035981178283691, 14.656729698181152, 16.27747917175293, 17.89822769165039, 19.51897621154785, 21.139724731445312, 22.760473251342773, 24.381221771240234, 26.001972198486328, 27.622718811035156, 29.24346923828125, 30.86421775817871, 32.48496627807617, 34.105716705322266, 35.726463317871094, 37.34721374511719, 38.967960357666016, 40.58871078491211, 42.20945739746094, 43.83020782470703, 45.450958251953125, 47.07170867919922, 48.69245529174805, 50.31320571899414, 51.93395233154297, 53.55470275878906, 55.175453186035156, 56.796199798583984, 58.41694641113281]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 10.0, 19.0, 25.0, 63.0, 172.0, 437.0, 1285.0, 5014.0, 26614.0, 262454.0, 3596930.0, 266251.0, 26985.0, 5578.0, 1572.0, 499.0, 198.0, 92.0, 42.0, 15.0, 11.0, 4.0, 5.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.14892578125, -8.8837890625, -8.61865234375, -8.353515625, -8.08837890625, -7.8232421875, -7.55810546875, -7.29296875, -7.02783203125, -6.7626953125, -6.49755859375, -6.232421875, -5.96728515625, -5.7021484375, -5.43701171875, -5.171875, -4.90673828125, -4.6416015625, -4.37646484375, -4.111328125, -3.84619140625, -3.5810546875, -3.31591796875, -3.05078125, -2.78564453125, -2.5205078125, -2.25537109375, -1.990234375, -1.72509765625, -1.4599609375, -1.19482421875, -0.9296875, -0.66455078125, -0.3994140625, -0.13427734375, 0.130859375, 0.39599609375, 0.6611328125, 0.92626953125, 1.19140625, 1.45654296875, 1.7216796875, 1.98681640625, 2.251953125, 2.51708984375, 2.7822265625, 3.04736328125, 3.3125, 3.57763671875, 3.8427734375, 4.10791015625, 4.373046875, 4.63818359375, 4.9033203125, 5.16845703125, 5.43359375, 5.69873046875, 5.9638671875, 6.22900390625, 6.494140625, 6.75927734375, 7.0244140625, 7.28955078125, 7.5546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 4.0, 6.0, 7.0, 11.0, 18.0, 16.0, 26.0, 38.0, 40.0, 53.0, 38.0, 54.0, 70.0, 91.0, 75.0, 67.0, 47.0, 63.0, 47.0, 45.0, 33.0, 43.0, 32.0, 15.0, 15.0, 11.0, 12.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.734375, -1.63677978515625, -1.5391845703125, -1.44158935546875, -1.343994140625, -1.24639892578125, -1.1488037109375, -1.05120849609375, -0.95361328125, -0.85601806640625, -0.7584228515625, -0.66082763671875, -0.563232421875, -0.46563720703125, -0.3680419921875, -0.27044677734375, -0.1728515625, -0.07525634765625, 0.0223388671875, 0.11993408203125, 0.217529296875, 0.31512451171875, 0.4127197265625, 0.51031494140625, 0.60791015625, 0.70550537109375, 0.8031005859375, 0.90069580078125, 0.998291015625, 1.09588623046875, 1.1934814453125, 1.29107666015625, 1.388671875, 1.48626708984375, 1.5838623046875, 1.68145751953125, 1.779052734375, 1.87664794921875, 1.9742431640625, 2.07183837890625, 2.16943359375, 2.26702880859375, 2.3646240234375, 2.46221923828125, 2.559814453125, 2.65740966796875, 2.7550048828125, 2.85260009765625, 2.9501953125, 3.04779052734375, 3.1453857421875, 3.24298095703125, 3.340576171875, 3.43817138671875, 3.5357666015625, 3.63336181640625, 3.73095703125, 3.82855224609375, 3.9261474609375, 4.02374267578125, 4.121337890625, 4.21893310546875, 4.3165283203125, 4.41412353515625, 4.51171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 7.0, 5.0, 8.0, 12.0, 12.0, 15.0, 21.0, 36.0, 69.0, 76.0, 158.0, 240.0, 465.0, 1025.0, 2445.0, 6665.0, 23645.0, 122955.0, 2602926.0, 1319837.0, 85908.0, 18444.0, 5461.0, 1979.0, 851.0, 414.0, 223.0, 150.0, 74.0, 55.0, 34.0, 19.0, 9.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.3125, -8.05987548828125, -7.8072509765625, -7.55462646484375, -7.302001953125, -7.04937744140625, -6.7967529296875, -6.54412841796875, -6.29150390625, -6.03887939453125, -5.7862548828125, -5.53363037109375, -5.281005859375, -5.02838134765625, -4.7757568359375, -4.52313232421875, -4.2705078125, -4.01788330078125, -3.7652587890625, -3.51263427734375, -3.260009765625, -3.00738525390625, -2.7547607421875, -2.50213623046875, -2.24951171875, -1.99688720703125, -1.7442626953125, -1.49163818359375, -1.239013671875, -0.98638916015625, -0.7337646484375, -0.48114013671875, -0.228515625, 0.02410888671875, 0.2767333984375, 0.52935791015625, 0.781982421875, 1.03460693359375, 1.2872314453125, 1.53985595703125, 1.79248046875, 2.04510498046875, 2.2977294921875, 2.55035400390625, 2.802978515625, 3.05560302734375, 3.3082275390625, 3.56085205078125, 3.8134765625, 4.06610107421875, 4.3187255859375, 4.57135009765625, 4.823974609375, 5.07659912109375, 5.3292236328125, 5.58184814453125, 5.83447265625, 6.08709716796875, 6.3397216796875, 6.59234619140625, 6.844970703125, 7.09759521484375, 7.3502197265625, 7.60284423828125, 7.85546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 1.0, 8.0, 8.0, 13.0, 12.0, 29.0, 27.0, 51.0, 70.0, 100.0, 161.0, 325.0, 616.0, 972.0, 719.0, 386.0, 184.0, 121.0, 69.0, 51.0, 36.0, 32.0, 17.0, 11.0, 12.0, 10.0, 3.0, 4.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-9.0859375, -8.8310546875, -8.576171875, -8.3212890625, -8.06640625, -7.8115234375, -7.556640625, -7.3017578125, -7.046875, -6.7919921875, -6.537109375, -6.2822265625, -6.02734375, -5.7724609375, -5.517578125, -5.2626953125, -5.0078125, -4.7529296875, -4.498046875, -4.2431640625, -3.98828125, -3.7333984375, -3.478515625, -3.2236328125, -2.96875, -2.7138671875, -2.458984375, -2.2041015625, -1.94921875, -1.6943359375, -1.439453125, -1.1845703125, -0.9296875, -0.6748046875, -0.419921875, -0.1650390625, 0.08984375, 0.3447265625, 0.599609375, 0.8544921875, 1.109375, 1.3642578125, 1.619140625, 1.8740234375, 2.12890625, 2.3837890625, 2.638671875, 2.8935546875, 3.1484375, 3.4033203125, 3.658203125, 3.9130859375, 4.16796875, 4.4228515625, 4.677734375, 4.9326171875, 5.1875, 5.4423828125, 5.697265625, 5.9521484375, 6.20703125, 6.4619140625, 6.716796875, 6.9716796875, 7.2265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 14.0, 13.0, 44.0, 49.0, 105.0, 134.0, 162.0, 173.0, 103.0, 77.0, 43.0, 17.0, 21.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.58756637573242, -51.41310501098633, -49.23863983154297, -47.064178466796875, -44.88971710205078, -42.71525573730469, -40.54079055786133, -38.366329193115234, -36.191864013671875, -34.01740264892578, -31.842939376831055, -29.668476104736328, -27.494014739990234, -25.319551467895508, -23.14508819580078, -20.970626831054688, -18.796165466308594, -16.621702194213867, -14.447240829467773, -12.272777557373047, -10.098315238952637, -7.923852920532227, -5.7493896484375, -3.57492733001709, -1.4004650115966797, 0.7739975452423096, 2.948460102081299, 5.122922897338867, 7.297385215759277, 9.471847534179688, 11.646310806274414, 13.820773124694824, 15.9952392578125, 18.169702529907227, 20.34416389465332, 22.518627166748047, 24.69308853149414, 26.867551803588867, 29.042015075683594, 31.216476440429688, 33.39093780517578, 35.565399169921875, 37.739864349365234, 39.91432571411133, 42.08878707885742, 44.26325225830078, 46.437713623046875, 48.61217498779297, 50.78664016723633, 52.96110153198242, 55.13556671142578, 57.310028076171875, 59.48448944091797, 61.65895080566406, 63.83341598510742, 66.00788116455078, 68.18234252929688, 70.35680389404297, 72.53126525878906, 74.70573425292969, 76.88019561767578, 79.05465698242188, 81.22911834716797, 83.40357971191406, 85.57804107666016]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 5.0, 7.0, 9.0, 10.0, 19.0, 21.0, 14.0, 18.0, 26.0, 35.0, 27.0, 46.0, 37.0, 43.0, 39.0, 53.0, 51.0, 57.0, 31.0, 58.0, 58.0, 48.0, 32.0, 23.0, 35.0, 30.0, 33.0, 27.0, 20.0, 18.0, 15.0, 12.0, 9.0, 7.0, 8.0, 3.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-41.06435775756836, -39.911338806152344, -38.75831985473633, -37.60530090332031, -36.4522819519043, -35.29926300048828, -34.146244049072266, -32.99322509765625, -31.840206146240234, -30.68718719482422, -29.534168243408203, -28.381149291992188, -27.228130340576172, -26.075111389160156, -24.92209243774414, -23.769073486328125, -22.61605453491211, -21.463035583496094, -20.310016632080078, -19.156997680664062, -18.003978729248047, -16.85095977783203, -15.697940826416016, -14.544921875, -13.391902923583984, -12.238883972167969, -11.085865020751953, -9.932846069335938, -8.779827117919922, -7.626808166503906, -6.473789215087891, -5.320770263671875, -4.167747497558594, -3.014728546142578, -1.8617095947265625, -0.7086906433105469, 0.44432830810546875, 1.5973472595214844, 2.7503662109375, 3.9033851623535156, 5.056404113769531, 6.209423065185547, 7.3624420166015625, 8.515460968017578, 9.668479919433594, 10.82149887084961, 11.974517822265625, 13.12753677368164, 14.280555725097656, 15.433574676513672, 16.586593627929688, 17.739612579345703, 18.89263153076172, 20.045650482177734, 21.19866943359375, 22.351688385009766, 23.50470733642578, 24.657726287841797, 25.810745239257812, 26.963764190673828, 28.116783142089844, 29.26980209350586, 30.422821044921875, 31.57583999633789, 32.728858947753906]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 13.0, 12.0, 16.0, 20.0, 30.0, 41.0, 57.0, 102.0, 141.0, 223.0, 330.0, 531.0, 805.0, 1336.0, 2285.0, 3662.0, 6380.0, 11640.0, 20846.0, 40339.0, 82175.0, 191968.0, 333252.0, 186016.0, 79870.0, 38918.0, 20609.0, 11154.0, 6318.0, 3643.0, 2174.0, 1371.0, 808.0, 531.0, 334.0, 221.0, 114.0, 81.0, 59.0, 39.0, 25.0, 18.0, 17.0, 16.0, 5.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.861328125, -3.734649658203125, -3.60797119140625, -3.481292724609375, -3.3546142578125, -3.227935791015625, -3.10125732421875, -2.974578857421875, -2.847900390625, -2.721221923828125, -2.59454345703125, -2.467864990234375, -2.3411865234375, -2.214508056640625, -2.08782958984375, -1.961151123046875, -1.83447265625, -1.707794189453125, -1.58111572265625, -1.454437255859375, -1.3277587890625, -1.201080322265625, -1.07440185546875, -0.947723388671875, -0.821044921875, -0.694366455078125, -0.56768798828125, -0.441009521484375, -0.3143310546875, -0.187652587890625, -0.06097412109375, 0.065704345703125, 0.1923828125, 0.319061279296875, 0.44573974609375, 0.572418212890625, 0.6990966796875, 0.825775146484375, 0.95245361328125, 1.079132080078125, 1.205810546875, 1.332489013671875, 1.45916748046875, 1.585845947265625, 1.7125244140625, 1.839202880859375, 1.96588134765625, 2.092559814453125, 2.21923828125, 2.345916748046875, 2.47259521484375, 2.599273681640625, 2.7259521484375, 2.852630615234375, 2.97930908203125, 3.105987548828125, 3.232666015625, 3.359344482421875, 3.48602294921875, 3.612701416015625, 3.7393798828125, 3.866058349609375, 3.99273681640625, 4.119415283203125, 4.24609375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 12.0, 8.0, 15.0, 14.0, 16.0, 21.0, 17.0, 16.0, 13.0, 21.0, 28.0, 36.0, 47.0, 37.0, 46.0, 37.0, 33.0, 40.0, 54.0, 37.0, 53.0, 34.0, 33.0, 23.0, 42.0, 34.0, 25.0, 32.0, 22.0, 20.0, 16.0, 23.0, 15.0, 20.0, 8.0, 8.0, 10.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 1.0], "bins": [-2.333984375, -2.268157958984375, -2.20233154296875, -2.136505126953125, -2.0706787109375, -2.004852294921875, -1.93902587890625, -1.873199462890625, -1.807373046875, -1.741546630859375, -1.67572021484375, -1.609893798828125, -1.5440673828125, -1.478240966796875, -1.41241455078125, -1.346588134765625, -1.28076171875, -1.214935302734375, -1.14910888671875, -1.083282470703125, -1.0174560546875, -0.951629638671875, -0.88580322265625, -0.819976806640625, -0.754150390625, -0.688323974609375, -0.62249755859375, -0.556671142578125, -0.4908447265625, -0.425018310546875, -0.35919189453125, -0.293365478515625, -0.2275390625, -0.161712646484375, -0.09588623046875, -0.030059814453125, 0.0357666015625, 0.101593017578125, 0.16741943359375, 0.233245849609375, 0.299072265625, 0.364898681640625, 0.43072509765625, 0.496551513671875, 0.5623779296875, 0.628204345703125, 0.69403076171875, 0.759857177734375, 0.82568359375, 0.891510009765625, 0.95733642578125, 1.023162841796875, 1.0889892578125, 1.154815673828125, 1.22064208984375, 1.286468505859375, 1.352294921875, 1.418121337890625, 1.48394775390625, 1.549774169921875, 1.6156005859375, 1.681427001953125, 1.74725341796875, 1.813079833984375, 1.87890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 7.0, 15.0, 16.0, 15.0, 36.0, 43.0, 68.0, 116.0, 160.0, 232.0, 344.0, 591.0, 1079.0, 2145.0, 5490.0, 22242.0, 210694.0, 736013.0, 53120.0, 9556.0, 3235.0, 1343.0, 730.0, 408.0, 266.0, 168.0, 131.0, 85.0, 53.0, 42.0, 22.0, 20.0, 15.0, 16.0, 4.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.6422119140625, -11.229736328125, -10.8172607421875, -10.40478515625, -9.9923095703125, -9.579833984375, -9.1673583984375, -8.7548828125, -8.3424072265625, -7.929931640625, -7.5174560546875, -7.10498046875, -6.6925048828125, -6.280029296875, -5.8675537109375, -5.455078125, -5.0426025390625, -4.630126953125, -4.2176513671875, -3.80517578125, -3.3927001953125, -2.980224609375, -2.5677490234375, -2.1552734375, -1.7427978515625, -1.330322265625, -0.9178466796875, -0.50537109375, -0.0928955078125, 0.319580078125, 0.7320556640625, 1.14453125, 1.5570068359375, 1.969482421875, 2.3819580078125, 2.79443359375, 3.2069091796875, 3.619384765625, 4.0318603515625, 4.4443359375, 4.8568115234375, 5.269287109375, 5.6817626953125, 6.09423828125, 6.5067138671875, 6.919189453125, 7.3316650390625, 7.744140625, 8.1566162109375, 8.569091796875, 8.9815673828125, 9.39404296875, 9.8065185546875, 10.218994140625, 10.6314697265625, 11.0439453125, 11.4564208984375, 11.868896484375, 12.2813720703125, 12.69384765625, 13.1063232421875, 13.518798828125, 13.9312744140625, 14.34375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 8.0, 10.0, 12.0, 21.0, 26.0, 22.0, 42.0, 69.0, 80.0, 86.0, 84.0, 110.0, 94.0, 78.0, 71.0, 51.0, 40.0, 31.0, 24.0, 14.0, 14.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.981201171875, -21.27490234375, -20.568603515625, -19.8623046875, -19.156005859375, -18.44970703125, -17.743408203125, -17.037109375, -16.330810546875, -15.62451171875, -14.918212890625, -14.2119140625, -13.505615234375, -12.79931640625, -12.093017578125, -11.38671875, -10.680419921875, -9.97412109375, -9.267822265625, -8.5615234375, -7.855224609375, -7.14892578125, -6.442626953125, -5.736328125, -5.030029296875, -4.32373046875, -3.617431640625, -2.9111328125, -2.204833984375, -1.49853515625, -0.792236328125, -0.0859375, 0.620361328125, 1.32666015625, 2.032958984375, 2.7392578125, 3.445556640625, 4.15185546875, 4.858154296875, 5.564453125, 6.270751953125, 6.97705078125, 7.683349609375, 8.3896484375, 9.095947265625, 9.80224609375, 10.508544921875, 11.21484375, 11.921142578125, 12.62744140625, 13.333740234375, 14.0400390625, 14.746337890625, 15.45263671875, 16.158935546875, 16.865234375, 17.571533203125, 18.27783203125, 18.984130859375, 19.6904296875, 20.396728515625, 21.10302734375, 21.809326171875, 22.515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 10.0, 18.0, 39.0, 80.0, 229.0, 1288.0, 16345.0, 946136.0, 80821.0, 2937.0, 452.0, 114.0, 38.0, 29.0, 14.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.046875, -10.633056640625, -10.21923828125, -9.805419921875, -9.3916015625, -8.977783203125, -8.56396484375, -8.150146484375, -7.736328125, -7.322509765625, -6.90869140625, -6.494873046875, -6.0810546875, -5.667236328125, -5.25341796875, -4.839599609375, -4.42578125, -4.011962890625, -3.59814453125, -3.184326171875, -2.7705078125, -2.356689453125, -1.94287109375, -1.529052734375, -1.115234375, -0.701416015625, -0.28759765625, 0.126220703125, 0.5400390625, 0.953857421875, 1.36767578125, 1.781494140625, 2.1953125, 2.609130859375, 3.02294921875, 3.436767578125, 3.8505859375, 4.264404296875, 4.67822265625, 5.092041015625, 5.505859375, 5.919677734375, 6.33349609375, 6.747314453125, 7.1611328125, 7.574951171875, 7.98876953125, 8.402587890625, 8.81640625, 9.230224609375, 9.64404296875, 10.057861328125, 10.4716796875, 10.885498046875, 11.29931640625, 11.713134765625, 12.126953125, 12.540771484375, 12.95458984375, 13.368408203125, 13.7822265625, 14.196044921875, 14.60986328125, 15.023681640625, 15.4375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 6.0, 1.0, 5.0, 6.0, 12.0, 9.0, 16.0, 15.0, 25.0, 32.0, 51.0, 66.0, 91.0, 137.0, 136.0, 99.0, 64.0, 41.0, 39.0, 24.0, 23.0, 19.0, 10.0, 19.0, 7.0, 6.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0011339187622070312, -0.0010975450277328491, -0.001061171293258667, -0.0010247975587844849, -0.0009884238243103027, -0.0009520500898361206, -0.0009156763553619385, -0.0008793026208877563, -0.0008429288864135742, -0.0008065551519393921, -0.00077018141746521, -0.0007338076829910278, -0.0006974339485168457, -0.0006610602140426636, -0.0006246864795684814, -0.0005883127450942993, -0.0005519390106201172, -0.0005155652761459351, -0.00047919154167175293, -0.0004428178071975708, -0.00040644407272338867, -0.00037007033824920654, -0.0003336966037750244, -0.0002973228693008423, -0.00026094913482666016, -0.00022457540035247803, -0.0001882016658782959, -0.00015182793140411377, -0.00011545419692993164, -7.908046245574951e-05, -4.270672798156738e-05, -6.332993507385254e-06, 3.0040740966796875e-05, 6.6414475440979e-05, 0.00010278820991516113, 0.00013916194438934326, 0.0001755356788635254, 0.00021190941333770752, 0.00024828314781188965, 0.0002846568822860718, 0.0003210306167602539, 0.00035740435123443604, 0.00039377808570861816, 0.0004301518201828003, 0.0004665255546569824, 0.0005028992891311646, 0.0005392730236053467, 0.0005756467580795288, 0.0006120204925537109, 0.0006483942270278931, 0.0006847679615020752, 0.0007211416959762573, 0.0007575154304504395, 0.0007938891649246216, 0.0008302628993988037, 0.0008666366338729858, 0.000903010368347168, 0.0009393841028213501, 0.0009757578372955322, 0.0010121315717697144, 0.0010485053062438965, 0.0010848790407180786, 0.0011212527751922607, 0.0011576265096664429, 0.001194000244140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 4.0, 4.0, 7.0, 9.0, 7.0, 10.0, 21.0, 26.0, 33.0, 56.0, 75.0, 91.0, 149.0, 207.0, 391.0, 536.0, 1050.0, 2040.0, 4451.0, 11902.0, 45132.0, 254846.0, 592503.0, 99753.0, 21791.0, 7010.0, 2885.0, 1443.0, 766.0, 457.0, 287.0, 181.0, 117.0, 80.0, 54.0, 56.0, 29.0, 28.0, 12.0, 18.0, 9.0, 5.0, 6.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.712890625, -3.59405517578125, -3.4752197265625, -3.35638427734375, -3.237548828125, -3.11871337890625, -2.9998779296875, -2.88104248046875, -2.76220703125, -2.64337158203125, -2.5245361328125, -2.40570068359375, -2.286865234375, -2.16802978515625, -2.0491943359375, -1.93035888671875, -1.8115234375, -1.69268798828125, -1.5738525390625, -1.45501708984375, -1.336181640625, -1.21734619140625, -1.0985107421875, -0.97967529296875, -0.86083984375, -0.74200439453125, -0.6231689453125, -0.50433349609375, -0.385498046875, -0.26666259765625, -0.1478271484375, -0.02899169921875, 0.08984375, 0.20867919921875, 0.3275146484375, 0.44635009765625, 0.565185546875, 0.68402099609375, 0.8028564453125, 0.92169189453125, 1.04052734375, 1.15936279296875, 1.2781982421875, 1.39703369140625, 1.515869140625, 1.63470458984375, 1.7535400390625, 1.87237548828125, 1.9912109375, 2.11004638671875, 2.2288818359375, 2.34771728515625, 2.466552734375, 2.58538818359375, 2.7042236328125, 2.82305908203125, 2.94189453125, 3.06072998046875, 3.1795654296875, 3.29840087890625, 3.417236328125, 3.53607177734375, 3.6549072265625, 3.77374267578125, 3.892578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 14.0, 17.0, 15.0, 28.0, 23.0, 60.0, 56.0, 90.0, 70.0, 98.0, 91.0, 98.0, 72.0, 46.0, 54.0, 39.0, 32.0, 19.0, 19.0, 13.0, 13.0, 5.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.82421875, -5.67523193359375, -5.5262451171875, -5.37725830078125, -5.228271484375, -5.07928466796875, -4.9302978515625, -4.78131103515625, -4.63232421875, -4.48333740234375, -4.3343505859375, -4.18536376953125, -4.036376953125, -3.88739013671875, -3.7384033203125, -3.58941650390625, -3.4404296875, -3.29144287109375, -3.1424560546875, -2.99346923828125, -2.844482421875, -2.69549560546875, -2.5465087890625, -2.39752197265625, -2.24853515625, -2.09954833984375, -1.9505615234375, -1.80157470703125, -1.652587890625, -1.50360107421875, -1.3546142578125, -1.20562744140625, -1.056640625, -0.90765380859375, -0.7586669921875, -0.60968017578125, -0.460693359375, -0.31170654296875, -0.1627197265625, -0.01373291015625, 0.13525390625, 0.28424072265625, 0.4332275390625, 0.58221435546875, 0.731201171875, 0.88018798828125, 1.0291748046875, 1.17816162109375, 1.3271484375, 1.47613525390625, 1.6251220703125, 1.77410888671875, 1.923095703125, 2.07208251953125, 2.2210693359375, 2.37005615234375, 2.51904296875, 2.66802978515625, 2.8170166015625, 2.96600341796875, 3.114990234375, 3.26397705078125, 3.4129638671875, 3.56195068359375, 3.7109375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 12.0, 15.0, 39.0, 64.0, 114.0, 159.0, 223.0, 154.0, 93.0, 46.0, 34.0, 15.0, 7.0, 6.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.94975280761719, -98.00324249267578, -95.0567398071289, -92.1102294921875, -89.16372680664062, -86.21721649169922, -83.27070617675781, -80.32420349121094, -77.37769317626953, -74.43118286132812, -71.48468017578125, -68.53816986083984, -65.59165954589844, -62.64515686035156, -59.698646545410156, -56.752140045166016, -53.805633544921875, -50.859127044677734, -47.912620544433594, -44.96611022949219, -42.01960372924805, -39.073097229003906, -36.1265869140625, -33.18008041381836, -30.23357391357422, -27.287067413330078, -24.340559005737305, -21.39405059814453, -18.44754409790039, -15.501036643981934, -12.554529190063477, -9.608020782470703, -6.661521911621094, -3.7150144577026367, -0.7685070037841797, 2.1780004501342773, 5.124507904052734, 8.071015357971191, 11.017522811889648, 13.964031219482422, 16.910537719726562, 19.857044219970703, 22.803552627563477, 25.75006103515625, 28.69656753540039, 31.64307403564453, 34.58958435058594, 37.53609085083008, 40.48259735107422, 43.42910385131836, 46.3756103515625, 49.322120666503906, 52.26862716674805, 55.21513366699219, 58.161643981933594, 61.108150482177734, 64.05465698242188, 67.00116729736328, 69.94766998291016, 72.89418029785156, 75.84068298339844, 78.78719329833984, 81.73370361328125, 84.68020629882812, 87.62671661376953]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 10.0, 5.0, 7.0, 16.0, 13.0, 15.0, 16.0, 17.0, 28.0, 33.0, 37.0, 39.0, 34.0, 44.0, 50.0, 46.0, 50.0, 55.0, 46.0, 46.0, 56.0, 42.0, 49.0, 28.0, 24.0, 28.0, 24.0, 26.0, 18.0, 13.0, 18.0, 12.0, 10.0, 3.0, 8.0, 6.0, 7.0, 7.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.928470611572266, -41.582244873046875, -40.236019134521484, -38.889793395996094, -37.54357147216797, -36.19734573364258, -34.85111999511719, -33.5048942565918, -32.158668518066406, -30.812442779541016, -29.466217041015625, -28.119993209838867, -26.773767471313477, -25.427541732788086, -24.081317901611328, -22.735092163085938, -21.388866424560547, -20.042640686035156, -18.696414947509766, -17.350191116333008, -16.003965377807617, -14.657739639282227, -13.311514854431152, -11.965290069580078, -10.619064331054688, -9.272838592529297, -7.926613807678223, -6.58038854598999, -5.234163284301758, -3.8879380226135254, -2.541712760925293, -1.1954879760742188, 0.15073776245117188, 1.4969630241394043, 2.8431882858276367, 4.189413547515869, 5.535638809204102, 6.881864070892334, 8.228089332580566, 9.57431411743164, 10.920539855957031, 12.266765594482422, 13.612990379333496, 14.95921516418457, 16.30544090270996, 17.65166664123535, 18.99789047241211, 20.3441162109375, 21.69034194946289, 23.03656768798828, 24.382793426513672, 25.72901725769043, 27.07524299621582, 28.42146873474121, 29.76769256591797, 31.11391830444336, 32.46014404296875, 33.80636978149414, 35.15259552001953, 36.49882125854492, 37.84504699707031, 39.19126892089844, 40.53749465942383, 41.88372039794922, 43.22994613647461]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 12.0, 7.0, 10.0, 16.0, 27.0, 28.0, 43.0, 48.0, 77.0, 104.0, 191.0, 529.0, 5564.0, 1006855.0, 3170922.0, 8485.0, 718.0, 199.0, 129.0, 90.0, 50.0, 36.0, 32.0, 29.0, 14.0, 12.0, 10.0, 9.0, 5.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.265625, -20.641357421875, -20.01708984375, -19.392822265625, -18.7685546875, -18.144287109375, -17.52001953125, -16.895751953125, -16.271484375, -15.647216796875, -15.02294921875, -14.398681640625, -13.7744140625, -13.150146484375, -12.52587890625, -11.901611328125, -11.27734375, -10.653076171875, -10.02880859375, -9.404541015625, -8.7802734375, -8.156005859375, -7.53173828125, -6.907470703125, -6.283203125, -5.658935546875, -5.03466796875, -4.410400390625, -3.7861328125, -3.161865234375, -2.53759765625, -1.913330078125, -1.2890625, -0.664794921875, -0.04052734375, 0.583740234375, 1.2080078125, 1.832275390625, 2.45654296875, 3.080810546875, 3.705078125, 4.329345703125, 4.95361328125, 5.577880859375, 6.2021484375, 6.826416015625, 7.45068359375, 8.074951171875, 8.69921875, 9.323486328125, 9.94775390625, 10.572021484375, 11.1962890625, 11.820556640625, 12.44482421875, 13.069091796875, 13.693359375, 14.317626953125, 14.94189453125, 15.566162109375, 16.1904296875, 16.814697265625, 17.43896484375, 18.063232421875, 18.6875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 10.0, 12.0, 6.0, 10.0, 8.0, 15.0, 20.0, 24.0, 23.0, 28.0, 27.0, 29.0, 43.0, 41.0, 38.0, 39.0, 44.0, 52.0, 45.0, 42.0, 35.0, 50.0, 41.0, 32.0, 36.0, 38.0, 32.0, 26.0, 23.0, 21.0, 18.0, 22.0, 11.0, 18.0, 10.0, 9.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.123046875, -2.05401611328125, -1.9849853515625, -1.91595458984375, -1.846923828125, -1.77789306640625, -1.7088623046875, -1.63983154296875, -1.57080078125, -1.50177001953125, -1.4327392578125, -1.36370849609375, -1.294677734375, -1.22564697265625, -1.1566162109375, -1.08758544921875, -1.0185546875, -0.94952392578125, -0.8804931640625, -0.81146240234375, -0.742431640625, -0.67340087890625, -0.6043701171875, -0.53533935546875, -0.46630859375, -0.39727783203125, -0.3282470703125, -0.25921630859375, -0.190185546875, -0.12115478515625, -0.0521240234375, 0.01690673828125, 0.0859375, 0.15496826171875, 0.2239990234375, 0.29302978515625, 0.362060546875, 0.43109130859375, 0.5001220703125, 0.56915283203125, 0.63818359375, 0.70721435546875, 0.7762451171875, 0.84527587890625, 0.914306640625, 0.98333740234375, 1.0523681640625, 1.12139892578125, 1.1904296875, 1.25946044921875, 1.3284912109375, 1.39752197265625, 1.466552734375, 1.53558349609375, 1.6046142578125, 1.67364501953125, 1.74267578125, 1.81170654296875, 1.8807373046875, 1.94976806640625, 2.018798828125, 2.08782958984375, 2.1568603515625, 2.22589111328125, 2.294921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 12.0, 13.0, 13.0, 26.0, 46.0, 70.0, 83.0, 104.0, 210.0, 294.0, 558.0, 953.0, 1777.0, 3295.0, 6554.0, 14274.0, 35916.0, 119897.0, 762631.0, 2690593.0, 425003.0, 82931.0, 27046.0, 10947.0, 5080.0, 2597.0, 1427.0, 743.0, 432.0, 259.0, 183.0, 103.0, 63.0, 50.0, 19.0, 24.0, 11.0, 13.0, 9.0, 7.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.828125, -4.66912841796875, -4.5101318359375, -4.35113525390625, -4.192138671875, -4.03314208984375, -3.8741455078125, -3.71514892578125, -3.55615234375, -3.39715576171875, -3.2381591796875, -3.07916259765625, -2.920166015625, -2.76116943359375, -2.6021728515625, -2.44317626953125, -2.2841796875, -2.12518310546875, -1.9661865234375, -1.80718994140625, -1.648193359375, -1.48919677734375, -1.3302001953125, -1.17120361328125, -1.01220703125, -0.85321044921875, -0.6942138671875, -0.53521728515625, -0.376220703125, -0.21722412109375, -0.0582275390625, 0.10076904296875, 0.259765625, 0.41876220703125, 0.5777587890625, 0.73675537109375, 0.895751953125, 1.05474853515625, 1.2137451171875, 1.37274169921875, 1.53173828125, 1.69073486328125, 1.8497314453125, 2.00872802734375, 2.167724609375, 2.32672119140625, 2.4857177734375, 2.64471435546875, 2.8037109375, 2.96270751953125, 3.1217041015625, 3.28070068359375, 3.439697265625, 3.59869384765625, 3.7576904296875, 3.91668701171875, 4.07568359375, 4.23468017578125, 4.3936767578125, 4.55267333984375, 4.711669921875, 4.87066650390625, 5.0296630859375, 5.18865966796875, 5.34765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 4.0, 12.0, 8.0, 10.0, 12.0, 19.0, 24.0, 34.0, 49.0, 67.0, 105.0, 171.0, 323.0, 497.0, 787.0, 704.0, 450.0, 267.0, 172.0, 90.0, 69.0, 48.0, 42.0, 23.0, 21.0, 10.0, 4.0, 7.0, 12.0, 7.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-7.83984375, -7.63299560546875, -7.4261474609375, -7.21929931640625, -7.012451171875, -6.80560302734375, -6.5987548828125, -6.39190673828125, -6.18505859375, -5.97821044921875, -5.7713623046875, -5.56451416015625, -5.357666015625, -5.15081787109375, -4.9439697265625, -4.73712158203125, -4.5302734375, -4.32342529296875, -4.1165771484375, -3.90972900390625, -3.702880859375, -3.49603271484375, -3.2891845703125, -3.08233642578125, -2.87548828125, -2.66864013671875, -2.4617919921875, -2.25494384765625, -2.048095703125, -1.84124755859375, -1.6343994140625, -1.42755126953125, -1.220703125, -1.01385498046875, -0.8070068359375, -0.60015869140625, -0.393310546875, -0.18646240234375, 0.0203857421875, 0.22723388671875, 0.43408203125, 0.64093017578125, 0.8477783203125, 1.05462646484375, 1.261474609375, 1.46832275390625, 1.6751708984375, 1.88201904296875, 2.0888671875, 2.29571533203125, 2.5025634765625, 2.70941162109375, 2.916259765625, 3.12310791015625, 3.3299560546875, 3.53680419921875, 3.74365234375, 3.95050048828125, 4.1573486328125, 4.36419677734375, 4.571044921875, 4.77789306640625, 4.9847412109375, 5.19158935546875, 5.3984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 7.0, 9.0, 27.0, 66.0, 193.0, 279.0, 207.0, 95.0, 63.0, 26.0, 11.0, 5.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.36143493652344, -83.21256256103516, -80.0636978149414, -76.91482543945312, -73.76595306396484, -70.61708068847656, -67.46821594238281, -64.31934356689453, -61.17047119140625, -58.021602630615234, -54.87273025512695, -51.72386169433594, -48.574989318847656, -45.42612075805664, -42.277252197265625, -39.128379821777344, -35.97951126098633, -32.83064270019531, -29.68177032470703, -26.532901763916016, -23.384029388427734, -20.23516082763672, -17.08629035949707, -13.937419891357422, -10.788549423217773, -7.639678955078125, -4.490808963775635, -1.3419389724731445, 1.806931495666504, 4.955801963806152, 8.104671478271484, 11.253541946411133, 14.402412414550781, 17.55128288269043, 20.700153350830078, 23.849021911621094, 26.997894287109375, 30.14676284790039, 33.295631408691406, 36.44450378417969, 39.59337615966797, 42.742244720458984, 45.891117095947266, 49.03998565673828, 52.18885803222656, 55.33772659301758, 58.486595153808594, 61.635467529296875, 64.78433227539062, 67.9332046508789, 71.08206939697266, 74.23094177246094, 77.37981414794922, 80.5286865234375, 83.67755126953125, 86.82642364501953, 89.97529602050781, 93.1241683959961, 96.27303314208984, 99.42190551757812, 102.5707778930664, 105.71965026855469, 108.86851501464844, 112.01738739013672, 115.166259765625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 7.0, 2.0, 7.0, 7.0, 10.0, 8.0, 11.0, 16.0, 20.0, 22.0, 27.0, 26.0, 31.0, 32.0, 34.0, 35.0, 29.0, 40.0, 46.0, 41.0, 36.0, 45.0, 47.0, 55.0, 35.0, 35.0, 39.0, 38.0, 25.0, 33.0, 28.0, 26.0, 21.0, 19.0, 15.0, 10.0, 10.0, 10.0, 7.0, 2.0, 3.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.315643310546875, -23.442903518676758, -22.57016372680664, -21.69742202758789, -20.824682235717773, -19.951942443847656, -19.07920265197754, -18.206462860107422, -17.333723068237305, -16.460983276367188, -15.588242530822754, -14.715502738952637, -13.84276294708252, -12.970022201538086, -12.097282409667969, -11.224542617797852, -10.351801872253418, -9.4790620803833, -8.606321334838867, -7.73358154296875, -6.860841751098633, -5.988101482391357, -5.115361213684082, -4.242621421813965, -3.3698811531066895, -2.497141122817993, -1.6244009733200073, -0.7516608238220215, 0.1210792064666748, 0.9938192367553711, 1.8665595054626465, 2.7392992973327637, 3.612039566040039, 4.4847798347473145, 5.357519626617432, 6.230259895324707, 7.102999687194824, 7.9757399559021, 8.848480224609375, 9.721220016479492, 10.59395980834961, 11.466699600219727, 12.33944034576416, 13.212180137634277, 14.084919929504395, 14.957660675048828, 15.830400466918945, 16.703140258789062, 17.575881958007812, 18.44862174987793, 19.321361541748047, 20.194103240966797, 21.066843032836914, 21.93958282470703, 22.81232261657715, 23.685062408447266, 24.557802200317383, 25.4305419921875, 26.303281784057617, 27.176021575927734, 28.048763275146484, 28.9215030670166, 29.79424285888672, 30.666982650756836, 31.539722442626953]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 0.0, 6.0, 5.0, 9.0, 16.0, 21.0, 24.0, 33.0, 55.0, 93.0, 145.0, 236.0, 401.0, 640.0, 1192.0, 2092.0, 4031.0, 8418.0, 17868.0, 40560.0, 111077.0, 373420.0, 325732.0, 95014.0, 35656.0, 16025.0, 7457.0, 3700.0, 1949.0, 1077.0, 612.0, 350.0, 231.0, 145.0, 83.0, 62.0, 32.0, 27.0, 22.0, 12.0, 7.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.76824951171875, -4.5911865234375, -4.41412353515625, -4.237060546875, -4.05999755859375, -3.8829345703125, -3.70587158203125, -3.52880859375, -3.35174560546875, -3.1746826171875, -2.99761962890625, -2.820556640625, -2.64349365234375, -2.4664306640625, -2.28936767578125, -2.1123046875, -1.93524169921875, -1.7581787109375, -1.58111572265625, -1.404052734375, -1.22698974609375, -1.0499267578125, -0.87286376953125, -0.69580078125, -0.51873779296875, -0.3416748046875, -0.16461181640625, 0.012451171875, 0.18951416015625, 0.3665771484375, 0.54364013671875, 0.720703125, 0.89776611328125, 1.0748291015625, 1.25189208984375, 1.428955078125, 1.60601806640625, 1.7830810546875, 1.96014404296875, 2.13720703125, 2.31427001953125, 2.4913330078125, 2.66839599609375, 2.845458984375, 3.02252197265625, 3.1995849609375, 3.37664794921875, 3.5537109375, 3.73077392578125, 3.9078369140625, 4.08489990234375, 4.261962890625, 4.43902587890625, 4.6160888671875, 4.79315185546875, 4.97021484375, 5.14727783203125, 5.3243408203125, 5.50140380859375, 5.678466796875, 5.85552978515625, 6.0325927734375, 6.20965576171875, 6.38671875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 9.0, 12.0, 12.0, 22.0, 23.0, 23.0, 40.0, 41.0, 51.0, 51.0, 62.0, 57.0, 59.0, 80.0, 68.0, 70.0, 60.0, 64.0, 37.0, 33.0, 33.0, 27.0, 21.0, 16.0, 10.0, 7.0, 8.0, 4.0, 2.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.98828125, -1.8743896484375, -1.760498046875, -1.6466064453125, -1.53271484375, -1.4188232421875, -1.304931640625, -1.1910400390625, -1.0771484375, -0.9632568359375, -0.849365234375, -0.7354736328125, -0.62158203125, -0.5076904296875, -0.393798828125, -0.2799072265625, -0.166015625, -0.0521240234375, 0.061767578125, 0.1756591796875, 0.28955078125, 0.4034423828125, 0.517333984375, 0.6312255859375, 0.7451171875, 0.8590087890625, 0.972900390625, 1.0867919921875, 1.20068359375, 1.3145751953125, 1.428466796875, 1.5423583984375, 1.65625, 1.7701416015625, 1.884033203125, 1.9979248046875, 2.11181640625, 2.2257080078125, 2.339599609375, 2.4534912109375, 2.5673828125, 2.6812744140625, 2.795166015625, 2.9090576171875, 3.02294921875, 3.1368408203125, 3.250732421875, 3.3646240234375, 3.478515625, 3.5924072265625, 3.706298828125, 3.8201904296875, 3.93408203125, 4.0479736328125, 4.161865234375, 4.2757568359375, 4.3896484375, 4.5035400390625, 4.617431640625, 4.7313232421875, 4.84521484375, 4.9591064453125, 5.072998046875, 5.1868896484375, 5.30078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 5.0, 8.0, 3.0, 8.0, 19.0, 34.0, 27.0, 57.0, 79.0, 115.0, 181.0, 316.0, 453.0, 823.0, 1699.0, 3774.0, 10730.0, 40228.0, 281297.0, 617271.0, 65858.0, 15617.0, 5194.0, 2158.0, 1036.0, 563.0, 337.0, 219.0, 141.0, 78.0, 49.0, 46.0, 36.0, 18.0, 9.0, 14.0, 8.0, 14.0, 5.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.8612060546875, -8.534912109375, -8.2086181640625, -7.88232421875, -7.5560302734375, -7.229736328125, -6.9034423828125, -6.5771484375, -6.2508544921875, -5.924560546875, -5.5982666015625, -5.27197265625, -4.9456787109375, -4.619384765625, -4.2930908203125, -3.966796875, -3.6405029296875, -3.314208984375, -2.9879150390625, -2.66162109375, -2.3353271484375, -2.009033203125, -1.6827392578125, -1.3564453125, -1.0301513671875, -0.703857421875, -0.3775634765625, -0.05126953125, 0.2750244140625, 0.601318359375, 0.9276123046875, 1.25390625, 1.5802001953125, 1.906494140625, 2.2327880859375, 2.55908203125, 2.8853759765625, 3.211669921875, 3.5379638671875, 3.8642578125, 4.1905517578125, 4.516845703125, 4.8431396484375, 5.16943359375, 5.4957275390625, 5.822021484375, 6.1483154296875, 6.474609375, 6.8009033203125, 7.127197265625, 7.4534912109375, 7.77978515625, 8.1060791015625, 8.432373046875, 8.7586669921875, 9.0849609375, 9.4112548828125, 9.737548828125, 10.0638427734375, 10.39013671875, 10.7164306640625, 11.042724609375, 11.3690185546875, 11.6953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 7.0, 4.0, 11.0, 8.0, 9.0, 10.0, 11.0, 20.0, 11.0, 30.0, 29.0, 29.0, 45.0, 41.0, 47.0, 50.0, 51.0, 58.0, 53.0, 63.0, 51.0, 53.0, 59.0, 26.0, 38.0, 32.0, 23.0, 26.0, 19.0, 14.0, 13.0, 11.0, 8.0, 8.0, 4.0, 7.0, 3.0, 10.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.2353515625, -8.853515625, -8.4716796875, -8.08984375, -7.7080078125, -7.326171875, -6.9443359375, -6.5625, -6.1806640625, -5.798828125, -5.4169921875, -5.03515625, -4.6533203125, -4.271484375, -3.8896484375, -3.5078125, -3.1259765625, -2.744140625, -2.3623046875, -1.98046875, -1.5986328125, -1.216796875, -0.8349609375, -0.453125, -0.0712890625, 0.310546875, 0.6923828125, 1.07421875, 1.4560546875, 1.837890625, 2.2197265625, 2.6015625, 2.9833984375, 3.365234375, 3.7470703125, 4.12890625, 4.5107421875, 4.892578125, 5.2744140625, 5.65625, 6.0380859375, 6.419921875, 6.8017578125, 7.18359375, 7.5654296875, 7.947265625, 8.3291015625, 8.7109375, 9.0927734375, 9.474609375, 9.8564453125, 10.23828125, 10.6201171875, 11.001953125, 11.3837890625, 11.765625, 12.1474609375, 12.529296875, 12.9111328125, 13.29296875, 13.6748046875, 14.056640625, 14.4384765625, 14.8203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 11.0, 16.0, 26.0, 51.0, 59.0, 106.0, 200.0, 334.0, 625.0, 1263.0, 3213.0, 9787.0, 47022.0, 527224.0, 401495.0, 42187.0, 9267.0, 2971.0, 1272.0, 592.0, 330.0, 164.0, 115.0, 66.0, 44.0, 33.0, 17.0, 9.0, 9.0, 6.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.34478759765625, -5.1466064453125, -4.94842529296875, -4.750244140625, -4.55206298828125, -4.3538818359375, -4.15570068359375, -3.95751953125, -3.75933837890625, -3.5611572265625, -3.36297607421875, -3.164794921875, -2.96661376953125, -2.7684326171875, -2.57025146484375, -2.3720703125, -2.17388916015625, -1.9757080078125, -1.77752685546875, -1.579345703125, -1.38116455078125, -1.1829833984375, -0.98480224609375, -0.78662109375, -0.58843994140625, -0.3902587890625, -0.19207763671875, 0.006103515625, 0.20428466796875, 0.4024658203125, 0.60064697265625, 0.798828125, 0.99700927734375, 1.1951904296875, 1.39337158203125, 1.591552734375, 1.78973388671875, 1.9879150390625, 2.18609619140625, 2.38427734375, 2.58245849609375, 2.7806396484375, 2.97882080078125, 3.177001953125, 3.37518310546875, 3.5733642578125, 3.77154541015625, 3.9697265625, 4.16790771484375, 4.3660888671875, 4.56427001953125, 4.762451171875, 4.96063232421875, 5.1588134765625, 5.35699462890625, 5.55517578125, 5.75335693359375, 5.9515380859375, 6.14971923828125, 6.347900390625, 6.54608154296875, 6.7442626953125, 6.94244384765625, 7.140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 9.0, 15.0, 18.0, 51.0, 126.0, 264.0, 301.0, 93.0, 66.0, 20.0, 18.0, 7.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.004146575927734375, -0.004042834043502808, -0.00393909215927124, -0.003835350275039673, -0.0037316083908081055, -0.003627866506576538, -0.0035241246223449707, -0.0034203827381134033, -0.003316640853881836, -0.0032128989696502686, -0.003109157085418701, -0.003005415201187134, -0.0029016733169555664, -0.002797931432723999, -0.0026941895484924316, -0.0025904476642608643, -0.002486705780029297, -0.0023829638957977295, -0.002279222011566162, -0.0021754801273345947, -0.0020717382431030273, -0.00196799635887146, -0.0018642544746398926, -0.0017605125904083252, -0.0016567707061767578, -0.0015530288219451904, -0.001449286937713623, -0.0013455450534820557, -0.0012418031692504883, -0.001138061285018921, -0.0010343194007873535, -0.0009305775165557861, -0.0008268356323242188, -0.0007230937480926514, -0.000619351863861084, -0.0005156099796295166, -0.0004118680953979492, -0.00030812621116638184, -0.00020438432693481445, -0.00010064244270324707, 3.0994415283203125e-06, 0.0001068413257598877, 0.00021058320999145508, 0.00031432509422302246, 0.00041806697845458984, 0.0005218088626861572, 0.0006255507469177246, 0.000729292631149292, 0.0008330345153808594, 0.0009367763996124268, 0.0010405182838439941, 0.0011442601680755615, 0.001248002052307129, 0.0013517439365386963, 0.0014554858207702637, 0.001559227705001831, 0.0016629695892333984, 0.0017667114734649658, 0.0018704533576965332, 0.0019741952419281006, 0.002077937126159668, 0.0021816790103912354, 0.0022854208946228027, 0.00238916277885437, 0.0024929046630859375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 12.0, 20.0, 19.0, 39.0, 70.0, 97.0, 190.0, 363.0, 820.0, 2154.0, 7502.0, 51274.0, 717359.0, 241238.0, 20647.0, 4169.0, 1360.0, 542.0, 281.0, 114.0, 86.0, 55.0, 38.0, 30.0, 13.0, 11.0, 11.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.15625, -7.92181396484375, -7.6873779296875, -7.45294189453125, -7.218505859375, -6.98406982421875, -6.7496337890625, -6.51519775390625, -6.28076171875, -6.04632568359375, -5.8118896484375, -5.57745361328125, -5.343017578125, -5.10858154296875, -4.8741455078125, -4.63970947265625, -4.4052734375, -4.17083740234375, -3.9364013671875, -3.70196533203125, -3.467529296875, -3.23309326171875, -2.9986572265625, -2.76422119140625, -2.52978515625, -2.29534912109375, -2.0609130859375, -1.82647705078125, -1.592041015625, -1.35760498046875, -1.1231689453125, -0.88873291015625, -0.654296875, -0.41986083984375, -0.1854248046875, 0.04901123046875, 0.283447265625, 0.51788330078125, 0.7523193359375, 0.98675537109375, 1.22119140625, 1.45562744140625, 1.6900634765625, 1.92449951171875, 2.158935546875, 2.39337158203125, 2.6278076171875, 2.86224365234375, 3.0966796875, 3.33111572265625, 3.5655517578125, 3.79998779296875, 4.034423828125, 4.26885986328125, 4.5032958984375, 4.73773193359375, 4.97216796875, 5.20660400390625, 5.4410400390625, 5.67547607421875, 5.909912109375, 6.14434814453125, 6.3787841796875, 6.61322021484375, 6.84765625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 11.0, 12.0, 21.0, 11.0, 29.0, 45.0, 65.0, 78.0, 103.0, 105.0, 135.0, 111.0, 100.0, 61.0, 33.0, 30.0, 17.0, 14.0, 7.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.760498046875, -5.54833984375, -5.336181640625, -5.1240234375, -4.911865234375, -4.69970703125, -4.487548828125, -4.275390625, -4.063232421875, -3.85107421875, -3.638916015625, -3.4267578125, -3.214599609375, -3.00244140625, -2.790283203125, -2.578125, -2.365966796875, -2.15380859375, -1.941650390625, -1.7294921875, -1.517333984375, -1.30517578125, -1.093017578125, -0.880859375, -0.668701171875, -0.45654296875, -0.244384765625, -0.0322265625, 0.179931640625, 0.39208984375, 0.604248046875, 0.81640625, 1.028564453125, 1.24072265625, 1.452880859375, 1.6650390625, 1.877197265625, 2.08935546875, 2.301513671875, 2.513671875, 2.725830078125, 2.93798828125, 3.150146484375, 3.3623046875, 3.574462890625, 3.78662109375, 3.998779296875, 4.2109375, 4.423095703125, 4.63525390625, 4.847412109375, 5.0595703125, 5.271728515625, 5.48388671875, 5.696044921875, 5.908203125, 6.120361328125, 6.33251953125, 6.544677734375, 6.7568359375, 6.968994140625, 7.18115234375, 7.393310546875, 7.60546875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 10.0, 27.0, 79.0, 167.0, 282.0, 231.0, 125.0, 46.0, 14.0, 6.0, 5.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.58036804199219, -70.12629699707031, -65.6722183227539, -61.21814727783203, -56.76407241821289, -52.30999755859375, -47.855926513671875, -43.401851654052734, -38.947776794433594, -34.49370193481445, -30.039628982543945, -25.585556030273438, -21.131481170654297, -16.677406311035156, -12.223333358764648, -7.769260406494141, -3.315185546875, 1.1388883590698242, 5.592962265014648, 10.047036170959473, 14.501110076904297, 18.955184936523438, 23.409257888793945, 27.863330841064453, 32.317405700683594, 36.771480560302734, 41.225555419921875, 45.67962646484375, 50.13370132446289, 54.58777618408203, 59.041847229003906, 63.49592208862305, 67.95001220703125, 72.40408325195312, 76.85816192626953, 81.3122329711914, 85.76631164550781, 90.22038269042969, 94.67445373535156, 99.12852478027344, 103.58260345458984, 108.03667449951172, 112.49075317382812, 116.94482421875, 121.39889526367188, 125.85297393798828, 130.3070526123047, 134.76112365722656, 139.21519470214844, 143.6692657470703, 148.1233367919922, 152.57742309570312, 157.031494140625, 161.48556518554688, 165.93963623046875, 170.39370727539062, 174.8477783203125, 179.30184936523438, 183.75592041015625, 188.2100067138672, 192.66407775878906, 197.11814880371094, 201.5722198486328, 206.0262908935547, 210.48037719726562]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 4.0, 5.0, 2.0, 7.0, 5.0, 9.0, 9.0, 9.0, 14.0, 11.0, 14.0, 32.0, 25.0, 22.0, 48.0, 35.0, 25.0, 32.0, 30.0, 50.0, 59.0, 67.0, 63.0, 57.0, 37.0, 39.0, 38.0, 30.0, 34.0, 33.0, 32.0, 20.0, 18.0, 23.0, 17.0, 5.0, 5.0, 8.0, 10.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-53.84965515136719, -52.389434814453125, -50.92921829223633, -49.46900177001953, -48.00878143310547, -46.548561096191406, -45.08834457397461, -43.62812805175781, -42.16790771484375, -40.70768737792969, -39.24747085571289, -37.787254333496094, -36.32703399658203, -34.86681365966797, -33.40659713745117, -31.946378707885742, -30.486160278320312, -29.025941848754883, -27.565723419189453, -26.105504989624023, -24.645286560058594, -23.185068130493164, -21.724849700927734, -20.264631271362305, -18.804412841796875, -17.344194412231445, -15.883975982666016, -14.423757553100586, -12.963539123535156, -11.503320693969727, -10.043102264404297, -8.582883834838867, -7.1226654052734375, -5.662446975708008, -4.202228546142578, -2.7420101165771484, -1.2817916870117188, 0.17842674255371094, 1.6386451721191406, 3.0988636016845703, 4.55908203125, 6.01930046081543, 7.479518890380859, 8.939737319946289, 10.399955749511719, 11.860174179077148, 13.320392608642578, 14.780611038208008, 16.240829467773438, 17.701047897338867, 19.161266326904297, 20.621484756469727, 22.081703186035156, 23.541921615600586, 25.002140045166016, 26.462358474731445, 27.922576904296875, 29.382795333862305, 30.843013763427734, 32.30323028564453, 33.763450622558594, 35.223670959472656, 36.68388748168945, 38.14410400390625, 39.60432434082031]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 4.0, 9.0, 9.0, 13.0, 17.0, 25.0, 53.0, 69.0, 119.0, 212.0, 329.0, 648.0, 1322.0, 3019.0, 7752.0, 21847.0, 76217.0, 416800.0, 2443565.0, 1020807.0, 145569.0, 36092.0, 11643.0, 4455.0, 1799.0, 885.0, 418.0, 245.0, 125.0, 83.0, 52.0, 30.0, 13.0, 11.0, 4.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-6.26171875, -6.104034423828125, -5.94635009765625, -5.788665771484375, -5.6309814453125, -5.473297119140625, -5.31561279296875, -5.157928466796875, -5.000244140625, -4.842559814453125, -4.68487548828125, -4.527191162109375, -4.3695068359375, -4.211822509765625, -4.05413818359375, -3.896453857421875, -3.73876953125, -3.581085205078125, -3.42340087890625, -3.265716552734375, -3.1080322265625, -2.950347900390625, -2.79266357421875, -2.634979248046875, -2.477294921875, -2.319610595703125, -2.16192626953125, -2.004241943359375, -1.8465576171875, -1.688873291015625, -1.53118896484375, -1.373504638671875, -1.2158203125, -1.058135986328125, -0.90045166015625, -0.742767333984375, -0.5850830078125, -0.427398681640625, -0.26971435546875, -0.112030029296875, 0.045654296875, 0.203338623046875, 0.36102294921875, 0.518707275390625, 0.6763916015625, 0.834075927734375, 0.99176025390625, 1.149444580078125, 1.30712890625, 1.464813232421875, 1.62249755859375, 1.780181884765625, 1.9378662109375, 2.095550537109375, 2.25323486328125, 2.410919189453125, 2.568603515625, 2.726287841796875, 2.88397216796875, 3.041656494140625, 3.1993408203125, 3.357025146484375, 3.51470947265625, 3.672393798828125, 3.830078125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 9.0, 15.0, 18.0, 12.0, 17.0, 20.0, 24.0, 23.0, 34.0, 44.0, 38.0, 37.0, 53.0, 44.0, 39.0, 57.0, 53.0, 50.0, 49.0, 35.0, 46.0, 44.0, 27.0, 38.0, 28.0, 21.0, 26.0, 12.0, 18.0, 14.0, 12.0, 12.0, 7.0, 9.0, 7.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.767578125, -2.686767578125, -2.60595703125, -2.525146484375, -2.4443359375, -2.363525390625, -2.28271484375, -2.201904296875, -2.12109375, -2.040283203125, -1.95947265625, -1.878662109375, -1.7978515625, -1.717041015625, -1.63623046875, -1.555419921875, -1.474609375, -1.393798828125, -1.31298828125, -1.232177734375, -1.1513671875, -1.070556640625, -0.98974609375, -0.908935546875, -0.828125, -0.747314453125, -0.66650390625, -0.585693359375, -0.5048828125, -0.424072265625, -0.34326171875, -0.262451171875, -0.181640625, -0.100830078125, -0.02001953125, 0.060791015625, 0.1416015625, 0.222412109375, 0.30322265625, 0.384033203125, 0.46484375, 0.545654296875, 0.62646484375, 0.707275390625, 0.7880859375, 0.868896484375, 0.94970703125, 1.030517578125, 1.111328125, 1.192138671875, 1.27294921875, 1.353759765625, 1.4345703125, 1.515380859375, 1.59619140625, 1.677001953125, 1.7578125, 1.838623046875, 1.91943359375, 2.000244140625, 2.0810546875, 2.161865234375, 2.24267578125, 2.323486328125, 2.404296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 11.0, 29.0, 16.0, 41.0, 108.0, 241.0, 1024.0, 8606.0, 341974.0, 3796068.0, 43031.0, 2303.0, 430.0, 133.0, 80.0, 63.0, 40.0, 23.0, 21.0, 16.0, 10.0, 11.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -16.8974609375, -16.201171875, -15.5048828125, -14.80859375, -14.1123046875, -13.416015625, -12.7197265625, -12.0234375, -11.3271484375, -10.630859375, -9.9345703125, -9.23828125, -8.5419921875, -7.845703125, -7.1494140625, -6.453125, -5.7568359375, -5.060546875, -4.3642578125, -3.66796875, -2.9716796875, -2.275390625, -1.5791015625, -0.8828125, -0.1865234375, 0.509765625, 1.2060546875, 1.90234375, 2.5986328125, 3.294921875, 3.9912109375, 4.6875, 5.3837890625, 6.080078125, 6.7763671875, 7.47265625, 8.1689453125, 8.865234375, 9.5615234375, 10.2578125, 10.9541015625, 11.650390625, 12.3466796875, 13.04296875, 13.7392578125, 14.435546875, 15.1318359375, 15.828125, 16.5244140625, 17.220703125, 17.9169921875, 18.61328125, 19.3095703125, 20.005859375, 20.7021484375, 21.3984375, 22.0947265625, 22.791015625, 23.4873046875, 24.18359375, 24.8798828125, 25.576171875, 26.2724609375, 26.96875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 6.0, 11.0, 13.0, 28.0, 55.0, 83.0, 161.0, 367.0, 718.0, 1228.0, 728.0, 351.0, 154.0, 73.0, 44.0, 22.0, 21.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6484375, -12.1307373046875, -11.613037109375, -11.0953369140625, -10.57763671875, -10.0599365234375, -9.542236328125, -9.0245361328125, -8.5068359375, -7.9891357421875, -7.471435546875, -6.9537353515625, -6.43603515625, -5.9183349609375, -5.400634765625, -4.8829345703125, -4.365234375, -3.8475341796875, -3.329833984375, -2.8121337890625, -2.29443359375, -1.7767333984375, -1.259033203125, -0.7413330078125, -0.2236328125, 0.2940673828125, 0.811767578125, 1.3294677734375, 1.84716796875, 2.3648681640625, 2.882568359375, 3.4002685546875, 3.91796875, 4.4356689453125, 4.953369140625, 5.4710693359375, 5.98876953125, 6.5064697265625, 7.024169921875, 7.5418701171875, 8.0595703125, 8.5772705078125, 9.094970703125, 9.6126708984375, 10.13037109375, 10.6480712890625, 11.165771484375, 11.6834716796875, 12.201171875, 12.7188720703125, 13.236572265625, 13.7542724609375, 14.27197265625, 14.7896728515625, 15.307373046875, 15.8250732421875, 16.3427734375, 16.8604736328125, 17.378173828125, 17.8958740234375, 18.41357421875, 18.9312744140625, 19.448974609375, 19.9666748046875, 20.484375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 8.0, 5.0, 6.0, 11.0, 25.0, 30.0, 50.0, 98.0, 148.0, 177.0, 146.0, 109.0, 58.0, 34.0, 23.0, 22.0, 15.0, 5.0, 11.0, 8.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.62010192871094, -95.39066314697266, -92.1612319946289, -88.93179321289062, -85.70236206054688, -82.4729232788086, -79.24348449707031, -76.01405334472656, -72.78461456298828, -69.55517578125, -66.32574462890625, -63.09630584716797, -59.86687088012695, -56.63743591308594, -53.407997131347656, -50.17856216430664, -46.949127197265625, -43.71969223022461, -40.490257263183594, -37.26081848144531, -34.0313835144043, -30.80194854736328, -27.572511672973633, -24.343074798583984, -21.11363983154297, -17.884204864501953, -14.654767990112305, -11.425332069396973, -8.19589614868164, -4.966461181640625, -1.7370243072509766, 1.4924125671386719, 4.721839904785156, 7.951275825500488, 11.18071174621582, 14.410147666931152, 17.639583587646484, 20.8690185546875, 24.09845542907715, 27.327892303466797, 30.557327270507812, 33.78676223754883, 37.016197204589844, 40.245635986328125, 43.47507095336914, 46.704505920410156, 49.93394470214844, 53.16337966918945, 56.39281463623047, 59.622249603271484, 62.8516845703125, 66.08112335205078, 69.31056213378906, 72.53999328613281, 75.7694320678711, 78.99887084960938, 82.22830200195312, 85.4577407836914, 88.68717193603516, 91.91661071777344, 95.14604187011719, 98.37548065185547, 101.60491943359375, 104.8343505859375, 108.06378936767578]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 4.0, 5.0, 8.0, 7.0, 12.0, 10.0, 15.0, 20.0, 24.0, 24.0, 38.0, 26.0, 38.0, 43.0, 49.0, 48.0, 52.0, 54.0, 55.0, 41.0, 44.0, 42.0, 33.0, 50.0, 33.0, 29.0, 37.0, 27.0, 22.0, 20.0, 15.0, 17.0, 10.0, 13.0, 8.0, 4.0, 7.0, 5.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.59345245361328, -55.76282501220703, -53.93219757080078, -52.10157012939453, -50.27094268798828, -48.44031524658203, -46.60968780517578, -44.77906036376953, -42.94843292236328, -41.11780548095703, -39.28717803955078, -37.45655059814453, -35.62592315673828, -33.79529571533203, -31.96466827392578, -30.13404083251953, -28.303415298461914, -26.472787857055664, -24.642160415649414, -22.811532974243164, -20.980905532836914, -19.150279998779297, -17.319652557373047, -15.48902416229248, -13.65839672088623, -11.82776927947998, -9.99714183807373, -8.166515350341797, -6.335887432098389, -4.505260467529297, -2.674633026123047, -0.8440055847167969, 0.9866218566894531, 2.817249298095703, 4.647876739501953, 6.478503704071045, 8.309131622314453, 10.139758110046387, 11.970385551452637, 13.801012992858887, 15.631640434265137, 17.46226692199707, 19.29289436340332, 21.12352180480957, 22.95414924621582, 24.78477668762207, 26.61540412902832, 28.44603157043457, 30.27665901184082, 32.10728454589844, 33.93791198730469, 35.76853942871094, 37.59916687011719, 39.42979431152344, 41.26042175292969, 43.09104919433594, 44.92167663574219, 46.75230407714844, 48.58293151855469, 50.41355895996094, 52.24418640136719, 54.07481384277344, 55.90544128417969, 57.73606872558594, 59.56669616699219]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 9.0, 16.0, 19.0, 24.0, 36.0, 71.0, 106.0, 141.0, 217.0, 375.0, 569.0, 908.0, 1594.0, 2750.0, 4668.0, 8075.0, 14826.0, 26655.0, 50603.0, 100052.0, 210569.0, 295551.0, 161773.0, 78202.0, 40693.0, 21647.0, 11978.0, 6764.0, 3869.0, 2189.0, 1378.0, 782.0, 530.0, 321.0, 176.0, 129.0, 82.0, 65.0, 49.0, 24.0, 19.0, 12.0, 10.0, 14.0, 4.0, 6.0, 0.0, 3.0, 0.0, 1.0], "bins": [-5.515625, -5.3594970703125, -5.203369140625, -5.0472412109375, -4.89111328125, -4.7349853515625, -4.578857421875, -4.4227294921875, -4.2666015625, -4.1104736328125, -3.954345703125, -3.7982177734375, -3.64208984375, -3.4859619140625, -3.329833984375, -3.1737060546875, -3.017578125, -2.8614501953125, -2.705322265625, -2.5491943359375, -2.39306640625, -2.2369384765625, -2.080810546875, -1.9246826171875, -1.7685546875, -1.6124267578125, -1.456298828125, -1.3001708984375, -1.14404296875, -0.9879150390625, -0.831787109375, -0.6756591796875, -0.51953125, -0.3634033203125, -0.207275390625, -0.0511474609375, 0.10498046875, 0.2611083984375, 0.417236328125, 0.5733642578125, 0.7294921875, 0.8856201171875, 1.041748046875, 1.1978759765625, 1.35400390625, 1.5101318359375, 1.666259765625, 1.8223876953125, 1.978515625, 2.1346435546875, 2.290771484375, 2.4468994140625, 2.60302734375, 2.7591552734375, 2.915283203125, 3.0714111328125, 3.2275390625, 3.3836669921875, 3.539794921875, 3.6959228515625, 3.85205078125, 4.0081787109375, 4.164306640625, 4.3204345703125, 4.4765625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 4.0, 5.0, 9.0, 8.0, 12.0, 16.0, 8.0, 14.0, 25.0, 21.0, 19.0, 35.0, 32.0, 43.0, 34.0, 49.0, 41.0, 52.0, 50.0, 51.0, 51.0, 66.0, 36.0, 54.0, 44.0, 35.0, 32.0, 24.0, 26.0, 32.0, 18.0, 8.0, 13.0, 8.0, 11.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.47265625, -3.357757568359375, -3.24285888671875, -3.127960205078125, -3.0130615234375, -2.898162841796875, -2.78326416015625, -2.668365478515625, -2.553466796875, -2.438568115234375, -2.32366943359375, -2.208770751953125, -2.0938720703125, -1.978973388671875, -1.86407470703125, -1.749176025390625, -1.63427734375, -1.519378662109375, -1.40447998046875, -1.289581298828125, -1.1746826171875, -1.059783935546875, -0.94488525390625, -0.829986572265625, -0.715087890625, -0.600189208984375, -0.48529052734375, -0.370391845703125, -0.2554931640625, -0.140594482421875, -0.02569580078125, 0.089202880859375, 0.2041015625, 0.319000244140625, 0.43389892578125, 0.548797607421875, 0.6636962890625, 0.778594970703125, 0.89349365234375, 1.008392333984375, 1.123291015625, 1.238189697265625, 1.35308837890625, 1.467987060546875, 1.5828857421875, 1.697784423828125, 1.81268310546875, 1.927581787109375, 2.04248046875, 2.157379150390625, 2.27227783203125, 2.387176513671875, 2.5020751953125, 2.616973876953125, 2.73187255859375, 2.846771240234375, 2.961669921875, 3.076568603515625, 3.19146728515625, 3.306365966796875, 3.4212646484375, 3.536163330078125, 3.65106201171875, 3.765960693359375, 3.880859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 4.0, 13.0, 15.0, 24.0, 28.0, 43.0, 54.0, 106.0, 161.0, 284.0, 548.0, 1074.0, 2453.0, 7694.0, 47147.0, 824426.0, 143670.0, 13957.0, 3862.0, 1426.0, 651.0, 341.0, 202.0, 111.0, 85.0, 52.0, 37.0, 18.0, 16.0, 18.0, 8.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.109375, -22.331298828125, -21.55322265625, -20.775146484375, -19.9970703125, -19.218994140625, -18.44091796875, -17.662841796875, -16.884765625, -16.106689453125, -15.32861328125, -14.550537109375, -13.7724609375, -12.994384765625, -12.21630859375, -11.438232421875, -10.66015625, -9.882080078125, -9.10400390625, -8.325927734375, -7.5478515625, -6.769775390625, -5.99169921875, -5.213623046875, -4.435546875, -3.657470703125, -2.87939453125, -2.101318359375, -1.3232421875, -0.545166015625, 0.23291015625, 1.010986328125, 1.7890625, 2.567138671875, 3.34521484375, 4.123291015625, 4.9013671875, 5.679443359375, 6.45751953125, 7.235595703125, 8.013671875, 8.791748046875, 9.56982421875, 10.347900390625, 11.1259765625, 11.904052734375, 12.68212890625, 13.460205078125, 14.23828125, 15.016357421875, 15.79443359375, 16.572509765625, 17.3505859375, 18.128662109375, 18.90673828125, 19.684814453125, 20.462890625, 21.240966796875, 22.01904296875, 22.797119140625, 23.5751953125, 24.353271484375, 25.13134765625, 25.909423828125, 26.6875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 7.0, 8.0, 10.0, 12.0, 16.0, 17.0, 27.0, 40.0, 36.0, 49.0, 47.0, 73.0, 73.0, 68.0, 91.0, 65.0, 56.0, 51.0, 58.0, 42.0, 32.0, 26.0, 27.0, 15.0, 10.0, 9.0, 8.0, 6.0, 6.0, 7.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.65625, -28.80712890625, -27.9580078125, -27.10888671875, -26.259765625, -25.41064453125, -24.5615234375, -23.71240234375, -22.86328125, -22.01416015625, -21.1650390625, -20.31591796875, -19.466796875, -18.61767578125, -17.7685546875, -16.91943359375, -16.0703125, -15.22119140625, -14.3720703125, -13.52294921875, -12.673828125, -11.82470703125, -10.9755859375, -10.12646484375, -9.27734375, -8.42822265625, -7.5791015625, -6.72998046875, -5.880859375, -5.03173828125, -4.1826171875, -3.33349609375, -2.484375, -1.63525390625, -0.7861328125, 0.06298828125, 0.912109375, 1.76123046875, 2.6103515625, 3.45947265625, 4.30859375, 5.15771484375, 6.0068359375, 6.85595703125, 7.705078125, 8.55419921875, 9.4033203125, 10.25244140625, 11.1015625, 11.95068359375, 12.7998046875, 13.64892578125, 14.498046875, 15.34716796875, 16.1962890625, 17.04541015625, 17.89453125, 18.74365234375, 19.5927734375, 20.44189453125, 21.291015625, 22.14013671875, 22.9892578125, 23.83837890625, 24.6875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 10.0, 25.0, 27.0, 36.0, 66.0, 122.0, 216.0, 340.0, 642.0, 1255.0, 2876.0, 7462.0, 49005.0, 904673.0, 67307.0, 8476.0, 3018.0, 1401.0, 692.0, 358.0, 202.0, 129.0, 72.0, 43.0, 27.0, 13.0, 21.0, 9.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.2109375, -14.74365234375, -14.2763671875, -13.80908203125, -13.341796875, -12.87451171875, -12.4072265625, -11.93994140625, -11.47265625, -11.00537109375, -10.5380859375, -10.07080078125, -9.603515625, -9.13623046875, -8.6689453125, -8.20166015625, -7.734375, -7.26708984375, -6.7998046875, -6.33251953125, -5.865234375, -5.39794921875, -4.9306640625, -4.46337890625, -3.99609375, -3.52880859375, -3.0615234375, -2.59423828125, -2.126953125, -1.65966796875, -1.1923828125, -0.72509765625, -0.2578125, 0.20947265625, 0.6767578125, 1.14404296875, 1.611328125, 2.07861328125, 2.5458984375, 3.01318359375, 3.48046875, 3.94775390625, 4.4150390625, 4.88232421875, 5.349609375, 5.81689453125, 6.2841796875, 6.75146484375, 7.21875, 7.68603515625, 8.1533203125, 8.62060546875, 9.087890625, 9.55517578125, 10.0224609375, 10.48974609375, 10.95703125, 11.42431640625, 11.8916015625, 12.35888671875, 12.826171875, 13.29345703125, 13.7607421875, 14.22802734375, 14.6953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 10.0, 8.0, 22.0, 27.0, 59.0, 81.0, 147.0, 304.0, 161.0, 68.0, 35.0, 25.0, 13.0, 11.0, 5.0, 5.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003173828125, -0.0030492544174194336, -0.002924680709838867, -0.0028001070022583008, -0.0026755332946777344, -0.002550959587097168, -0.0024263858795166016, -0.002301812171936035, -0.0021772384643554688, -0.0020526647567749023, -0.001928091049194336, -0.0018035173416137695, -0.0016789436340332031, -0.0015543699264526367, -0.0014297962188720703, -0.001305222511291504, -0.0011806488037109375, -0.001056075096130371, -0.0009315013885498047, -0.0008069276809692383, -0.0006823539733886719, -0.0005577802658081055, -0.00043320655822753906, -0.00030863285064697266, -0.00018405914306640625, -5.9485435485839844e-05, 6.508827209472656e-05, 0.00018966197967529297, 0.0003142356872558594, 0.0004388093948364258, 0.0005633831024169922, 0.0006879568099975586, 0.000812530517578125, 0.0009371042251586914, 0.0010616779327392578, 0.0011862516403198242, 0.0013108253479003906, 0.001435399055480957, 0.0015599727630615234, 0.0016845464706420898, 0.0018091201782226562, 0.0019336938858032227, 0.002058267593383789, 0.0021828413009643555, 0.002307415008544922, 0.0024319887161254883, 0.0025565624237060547, 0.002681136131286621, 0.0028057098388671875, 0.002930283546447754, 0.0030548572540283203, 0.0031794309616088867, 0.003304004669189453, 0.0034285783767700195, 0.003553152084350586, 0.0036777257919311523, 0.0038022994995117188, 0.003926873207092285, 0.0040514469146728516, 0.004176020622253418, 0.004300594329833984, 0.004425168037414551, 0.004549741744995117, 0.004674315452575684, 0.00479888916015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 5.0, 7.0, 4.0, 9.0, 6.0, 10.0, 21.0, 20.0, 26.0, 46.0, 54.0, 80.0, 135.0, 182.0, 294.0, 436.0, 693.0, 1302.0, 2510.0, 4971.0, 13204.0, 145442.0, 840313.0, 24197.0, 7057.0, 3232.0, 1682.0, 1010.0, 546.0, 338.0, 212.0, 142.0, 91.0, 62.0, 51.0, 30.0, 38.0, 16.0, 16.0, 14.0, 6.0, 9.0, 4.0, 3.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-15.9140625, -15.419921875, -14.92578125, -14.431640625, -13.9375, -13.443359375, -12.94921875, -12.455078125, -11.9609375, -11.466796875, -10.97265625, -10.478515625, -9.984375, -9.490234375, -8.99609375, -8.501953125, -8.0078125, -7.513671875, -7.01953125, -6.525390625, -6.03125, -5.537109375, -5.04296875, -4.548828125, -4.0546875, -3.560546875, -3.06640625, -2.572265625, -2.078125, -1.583984375, -1.08984375, -0.595703125, -0.1015625, 0.392578125, 0.88671875, 1.380859375, 1.875, 2.369140625, 2.86328125, 3.357421875, 3.8515625, 4.345703125, 4.83984375, 5.333984375, 5.828125, 6.322265625, 6.81640625, 7.310546875, 7.8046875, 8.298828125, 8.79296875, 9.287109375, 9.78125, 10.275390625, 10.76953125, 11.263671875, 11.7578125, 12.251953125, 12.74609375, 13.240234375, 13.734375, 14.228515625, 14.72265625, 15.216796875, 15.7109375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 6.0, 11.0, 20.0, 37.0, 59.0, 134.0, 220.0, 220.0, 119.0, 55.0, 31.0, 19.0, 14.0, 5.0, 2.0, 1.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.34375, -17.805419921875, -17.26708984375, -16.728759765625, -16.1904296875, -15.652099609375, -15.11376953125, -14.575439453125, -14.037109375, -13.498779296875, -12.96044921875, -12.422119140625, -11.8837890625, -11.345458984375, -10.80712890625, -10.268798828125, -9.73046875, -9.192138671875, -8.65380859375, -8.115478515625, -7.5771484375, -7.038818359375, -6.50048828125, -5.962158203125, -5.423828125, -4.885498046875, -4.34716796875, -3.808837890625, -3.2705078125, -2.732177734375, -2.19384765625, -1.655517578125, -1.1171875, -0.578857421875, -0.04052734375, 0.497802734375, 1.0361328125, 1.574462890625, 2.11279296875, 2.651123046875, 3.189453125, 3.727783203125, 4.26611328125, 4.804443359375, 5.3427734375, 5.881103515625, 6.41943359375, 6.957763671875, 7.49609375, 8.034423828125, 8.57275390625, 9.111083984375, 9.6494140625, 10.187744140625, 10.72607421875, 11.264404296875, 11.802734375, 12.341064453125, 12.87939453125, 13.417724609375, 13.9560546875, 14.494384765625, 15.03271484375, 15.571044921875, 16.109375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 11.0, 24.0, 72.0, 222.0, 388.0, 188.0, 52.0, 20.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.55203247070312, -198.31365966796875, -188.07530212402344, -177.83692932128906, -167.59857177734375, -157.36019897460938, -147.121826171875, -136.8834686279297, -126.64510345458984, -116.40673828125, -106.16837310791016, -95.93000793457031, -85.69163513183594, -75.45327758789062, -65.21490478515625, -54.976539611816406, -44.73817443847656, -34.49980926513672, -24.261442184448242, -14.023075103759766, -3.784709930419922, 6.453655242919922, 16.69202423095703, 26.930389404296875, 37.16875457763672, 47.40711975097656, 57.645484924316406, 67.88385009765625, 78.12222290039062, 88.36058044433594, 98.59895324707031, 108.83731842041016, 119.07568359375, 129.31405639648438, 139.5524139404297, 149.79078674316406, 160.02914428710938, 170.26751708984375, 180.50588989257812, 190.74424743652344, 200.98260498046875, 211.22097778320312, 221.45933532714844, 231.6977081298828, 241.93606567382812, 252.1744384765625, 262.4128112792969, 272.65118408203125, 282.8895263671875, 293.1278991699219, 303.36627197265625, 313.6046142578125, 323.8429870605469, 334.08135986328125, 344.3197326660156, 354.55810546875, 364.7964782714844, 375.03485107421875, 385.2732238769531, 395.5115661621094, 405.74993896484375, 415.9883117675781, 426.2266845703125, 436.46502685546875, 446.7033996582031]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 11.0, 3.0, 8.0, 9.0, 10.0, 17.0, 11.0, 16.0, 12.0, 19.0, 23.0, 20.0, 28.0, 28.0, 27.0, 33.0, 34.0, 32.0, 39.0, 54.0, 62.0, 38.0, 54.0, 45.0, 34.0, 31.0, 25.0, 24.0, 26.0, 27.0, 26.0, 18.0, 20.0, 20.0, 13.0, 15.0, 13.0, 10.0, 14.0, 13.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 3.0], "bins": [-72.90275573730469, -70.6104507446289, -68.31814575195312, -66.02584838867188, -63.733543395996094, -61.44123840332031, -59.14893341064453, -56.85662841796875, -54.564327239990234, -52.27202224731445, -49.97972106933594, -47.687416076660156, -45.395111083984375, -43.10280990600586, -40.81050491333008, -38.51820373535156, -36.22589874267578, -33.93359375, -31.641292572021484, -29.348987579345703, -27.056684494018555, -24.764381408691406, -22.472076416015625, -20.179773330688477, -17.887470245361328, -15.59516716003418, -13.302863121032715, -11.01055908203125, -8.718255996704102, -6.425952911376953, -4.133648872375488, -1.8413448333740234, 0.45095062255859375, 2.7432541847229004, 5.035557746887207, 7.327861309051514, 9.62016487121582, 11.912467956542969, 14.204771995544434, 16.4970760345459, 18.789379119873047, 21.081682205200195, 23.373985290527344, 25.666290283203125, 27.958593368530273, 30.250896453857422, 32.5432014465332, 34.83550262451172, 37.1278076171875, 39.42011260986328, 41.7124137878418, 44.00471878051758, 46.297019958496094, 48.589324951171875, 50.881629943847656, 53.17393493652344, 55.46623611450195, 57.758541107177734, 60.05084228515625, 62.34314727783203, 64.63545227050781, 66.92774963378906, 69.22005462646484, 71.51235961914062, 73.8046646118164]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 12.0, 15.0, 25.0, 25.0, 37.0, 54.0, 88.0, 105.0, 196.0, 319.0, 742.0, 2135.0, 9261.0, 77412.0, 2579466.0, 1462922.0, 51115.0, 7116.0, 1778.0, 628.0, 305.0, 165.0, 98.0, 79.0, 40.0, 38.0, 26.0, 13.0, 15.0, 10.0, 9.0, 4.0, 2.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.65625, -12.2830810546875, -11.909912109375, -11.5367431640625, -11.16357421875, -10.7904052734375, -10.417236328125, -10.0440673828125, -9.6708984375, -9.2977294921875, -8.924560546875, -8.5513916015625, -8.17822265625, -7.8050537109375, -7.431884765625, -7.0587158203125, -6.685546875, -6.3123779296875, -5.939208984375, -5.5660400390625, -5.19287109375, -4.8197021484375, -4.446533203125, -4.0733642578125, -3.7001953125, -3.3270263671875, -2.953857421875, -2.5806884765625, -2.20751953125, -1.8343505859375, -1.461181640625, -1.0880126953125, -0.71484375, -0.3416748046875, 0.031494140625, 0.4046630859375, 0.77783203125, 1.1510009765625, 1.524169921875, 1.8973388671875, 2.2705078125, 2.6436767578125, 3.016845703125, 3.3900146484375, 3.76318359375, 4.1363525390625, 4.509521484375, 4.8826904296875, 5.255859375, 5.6290283203125, 6.002197265625, 6.3753662109375, 6.74853515625, 7.1217041015625, 7.494873046875, 7.8680419921875, 8.2412109375, 8.6143798828125, 8.987548828125, 9.3607177734375, 9.73388671875, 10.1070556640625, 10.480224609375, 10.8533935546875, 11.2265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 4.0, 8.0, 7.0, 16.0, 11.0, 21.0, 26.0, 27.0, 23.0, 29.0, 53.0, 54.0, 49.0, 47.0, 53.0, 54.0, 50.0, 58.0, 47.0, 47.0, 50.0, 43.0, 45.0, 25.0, 33.0, 24.0, 17.0, 20.0, 13.0, 10.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-5.35546875, -5.214996337890625, -5.07452392578125, -4.934051513671875, -4.7935791015625, -4.653106689453125, -4.51263427734375, -4.372161865234375, -4.231689453125, -4.091217041015625, -3.95074462890625, -3.810272216796875, -3.6697998046875, -3.529327392578125, -3.38885498046875, -3.248382568359375, -3.10791015625, -2.967437744140625, -2.82696533203125, -2.686492919921875, -2.5460205078125, -2.405548095703125, -2.26507568359375, -2.124603271484375, -1.984130859375, -1.843658447265625, -1.70318603515625, -1.562713623046875, -1.4222412109375, -1.281768798828125, -1.14129638671875, -1.000823974609375, -0.8603515625, -0.719879150390625, -0.57940673828125, -0.438934326171875, -0.2984619140625, -0.157989501953125, -0.01751708984375, 0.122955322265625, 0.263427734375, 0.403900146484375, 0.54437255859375, 0.684844970703125, 0.8253173828125, 0.965789794921875, 1.10626220703125, 1.246734619140625, 1.38720703125, 1.527679443359375, 1.66815185546875, 1.808624267578125, 1.9490966796875, 2.089569091796875, 2.23004150390625, 2.370513916015625, 2.510986328125, 2.651458740234375, 2.79193115234375, 2.932403564453125, 3.0728759765625, 3.213348388671875, 3.35382080078125, 3.494293212890625, 3.634765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 15.0, 12.0, 34.0, 49.0, 73.0, 130.0, 263.0, 658.0, 1804.0, 7608.0, 76182.0, 3797552.0, 291199.0, 14105.0, 2764.0, 850.0, 398.0, 187.0, 108.0, 80.0, 60.0, 48.0, 29.0, 22.0, 12.0, 14.0, 9.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.488525390625, -19.77392578125, -19.059326171875, -18.3447265625, -17.630126953125, -16.91552734375, -16.200927734375, -15.486328125, -14.771728515625, -14.05712890625, -13.342529296875, -12.6279296875, -11.913330078125, -11.19873046875, -10.484130859375, -9.76953125, -9.054931640625, -8.34033203125, -7.625732421875, -6.9111328125, -6.196533203125, -5.48193359375, -4.767333984375, -4.052734375, -3.338134765625, -2.62353515625, -1.908935546875, -1.1943359375, -0.479736328125, 0.23486328125, 0.949462890625, 1.6640625, 2.378662109375, 3.09326171875, 3.807861328125, 4.5224609375, 5.237060546875, 5.95166015625, 6.666259765625, 7.380859375, 8.095458984375, 8.81005859375, 9.524658203125, 10.2392578125, 10.953857421875, 11.66845703125, 12.383056640625, 13.09765625, 13.812255859375, 14.52685546875, 15.241455078125, 15.9560546875, 16.670654296875, 17.38525390625, 18.099853515625, 18.814453125, 19.529052734375, 20.24365234375, 20.958251953125, 21.6728515625, 22.387451171875, 23.10205078125, 23.816650390625, 24.53125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 16.0, 13.0, 11.0, 29.0, 35.0, 63.0, 95.0, 169.0, 328.0, 661.0, 905.0, 767.0, 428.0, 226.0, 129.0, 79.0, 43.0, 21.0, 12.0, 10.0, 6.0, 7.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5625, -9.0751953125, -8.587890625, -8.1005859375, -7.61328125, -7.1259765625, -6.638671875, -6.1513671875, -5.6640625, -5.1767578125, -4.689453125, -4.2021484375, -3.71484375, -3.2275390625, -2.740234375, -2.2529296875, -1.765625, -1.2783203125, -0.791015625, -0.3037109375, 0.18359375, 0.6708984375, 1.158203125, 1.6455078125, 2.1328125, 2.6201171875, 3.107421875, 3.5947265625, 4.08203125, 4.5693359375, 5.056640625, 5.5439453125, 6.03125, 6.5185546875, 7.005859375, 7.4931640625, 7.98046875, 8.4677734375, 8.955078125, 9.4423828125, 9.9296875, 10.4169921875, 10.904296875, 11.3916015625, 11.87890625, 12.3662109375, 12.853515625, 13.3408203125, 13.828125, 14.3154296875, 14.802734375, 15.2900390625, 15.77734375, 16.2646484375, 16.751953125, 17.2392578125, 17.7265625, 18.2138671875, 18.701171875, 19.1884765625, 19.67578125, 20.1630859375, 20.650390625, 21.1376953125, 21.625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 13.0, 17.0, 34.0, 59.0, 146.0, 209.0, 261.0, 138.0, 63.0, 32.0, 14.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-207.18370056152344, -201.86293029785156, -196.54214477539062, -191.22137451171875, -185.90060424804688, -180.579833984375, -175.25904846191406, -169.9382781982422, -164.61749267578125, -159.29672241210938, -153.97593688964844, -148.65516662597656, -143.3343963623047, -138.01361083984375, -132.69284057617188, -127.3720703125, -122.05130004882812, -116.73052215576172, -111.40975189208984, -106.08897399902344, -100.76820373535156, -95.44742584228516, -90.12664794921875, -84.80587768554688, -79.48509979248047, -74.16432189941406, -68.84355163574219, -63.52277374267578, -58.20199966430664, -52.8812255859375, -47.560447692871094, -42.23967361450195, -36.91888427734375, -31.59811019897461, -26.277334213256836, -20.956558227539062, -15.635784149169922, -10.315010070800781, -4.994234085083008, 0.3265419006347656, 5.647315979003906, 10.968091011047363, 16.28886604309082, 21.609642028808594, 26.930416107177734, 32.251190185546875, 37.57196807861328, 42.89274215698242, 48.21351623535156, 53.5342903137207, 58.855064392089844, 64.17584228515625, 69.49661254882812, 74.81739044189453, 80.13816833496094, 85.45893859863281, 90.77971649169922, 96.10049438476562, 101.4212646484375, 106.7420425415039, 112.06282043457031, 117.38359069824219, 122.7043685913086, 128.025146484375, 133.34591674804688]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 7.0, 15.0, 14.0, 17.0, 16.0, 27.0, 33.0, 26.0, 40.0, 41.0, 49.0, 50.0, 60.0, 69.0, 72.0, 56.0, 58.0, 45.0, 50.0, 33.0, 42.0, 43.0, 18.0, 24.0, 22.0, 24.0, 11.0, 11.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-79.3607177734375, -77.1825180053711, -75.00432586669922, -72.82612609863281, -70.64793395996094, -68.46973419189453, -66.29154205322266, -64.11334228515625, -61.935150146484375, -59.756954193115234, -57.578758239746094, -55.40056228637695, -53.22236633300781, -51.04417037963867, -48.86597442626953, -46.687774658203125, -44.509578704833984, -42.331382751464844, -40.1531867980957, -37.97499084472656, -35.79679489135742, -33.61859893798828, -31.440401077270508, -29.262205123901367, -27.084009170532227, -24.905813217163086, -22.727617263793945, -20.549419403076172, -18.37122344970703, -16.19302749633789, -14.01483154296875, -11.83663558959961, -9.658439636230469, -7.480243682861328, -5.302047252655029, -3.1238508224487305, -0.9456548690795898, 1.2325410842895508, 3.410737991333008, 5.588933944702148, 7.767129898071289, 9.94532585144043, 12.12352180480957, 14.301718711853027, 16.479915618896484, 18.658111572265625, 20.836307525634766, 23.014503479003906, 25.192699432373047, 27.370895385742188, 29.549091339111328, 31.72728729248047, 33.90548324584961, 36.08367919921875, 38.261878967285156, 40.44007110595703, 42.61827087402344, 44.79646682739258, 46.97466278076172, 49.15285873413086, 51.3310546875, 53.50925064086914, 55.68744659423828, 57.86564636230469, 60.04383850097656]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 7.0, 10.0, 19.0, 32.0, 38.0, 46.0, 60.0, 82.0, 125.0, 191.0, 258.0, 441.0, 699.0, 1138.0, 1907.0, 3389.0, 6429.0, 13261.0, 29659.0, 78403.0, 261303.0, 421593.0, 140944.0, 48044.0, 19901.0, 9405.0, 4682.0, 2525.0, 1435.0, 852.0, 547.0, 351.0, 220.0, 166.0, 111.0, 86.0, 53.0, 36.0, 25.0, 22.0, 9.0, 14.0, 9.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.9302978515625, -7.649658203125, -7.3690185546875, -7.08837890625, -6.8077392578125, -6.527099609375, -6.2464599609375, -5.9658203125, -5.6851806640625, -5.404541015625, -5.1239013671875, -4.84326171875, -4.5626220703125, -4.281982421875, -4.0013427734375, -3.720703125, -3.4400634765625, -3.159423828125, -2.8787841796875, -2.59814453125, -2.3175048828125, -2.036865234375, -1.7562255859375, -1.4755859375, -1.1949462890625, -0.914306640625, -0.6336669921875, -0.35302734375, -0.0723876953125, 0.208251953125, 0.4888916015625, 0.76953125, 1.0501708984375, 1.330810546875, 1.6114501953125, 1.89208984375, 2.1727294921875, 2.453369140625, 2.7340087890625, 3.0146484375, 3.2952880859375, 3.575927734375, 3.8565673828125, 4.13720703125, 4.4178466796875, 4.698486328125, 4.9791259765625, 5.259765625, 5.5404052734375, 5.821044921875, 6.1016845703125, 6.38232421875, 6.6629638671875, 6.943603515625, 7.2242431640625, 7.5048828125, 7.7855224609375, 8.066162109375, 8.3468017578125, 8.62744140625, 8.9080810546875, 9.188720703125, 9.4693603515625, 9.75]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 5.0, 10.0, 9.0, 17.0, 18.0, 16.0, 23.0, 21.0, 27.0, 33.0, 38.0, 41.0, 44.0, 47.0, 44.0, 46.0, 43.0, 51.0, 46.0, 45.0, 52.0, 41.0, 36.0, 39.0, 35.0, 30.0, 20.0, 26.0, 14.0, 19.0, 11.0, 11.0, 9.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.7890625, -4.64501953125, -4.5009765625, -4.35693359375, -4.212890625, -4.06884765625, -3.9248046875, -3.78076171875, -3.63671875, -3.49267578125, -3.3486328125, -3.20458984375, -3.060546875, -2.91650390625, -2.7724609375, -2.62841796875, -2.484375, -2.34033203125, -2.1962890625, -2.05224609375, -1.908203125, -1.76416015625, -1.6201171875, -1.47607421875, -1.33203125, -1.18798828125, -1.0439453125, -0.89990234375, -0.755859375, -0.61181640625, -0.4677734375, -0.32373046875, -0.1796875, -0.03564453125, 0.1083984375, 0.25244140625, 0.396484375, 0.54052734375, 0.6845703125, 0.82861328125, 0.97265625, 1.11669921875, 1.2607421875, 1.40478515625, 1.548828125, 1.69287109375, 1.8369140625, 1.98095703125, 2.125, 2.26904296875, 2.4130859375, 2.55712890625, 2.701171875, 2.84521484375, 2.9892578125, 3.13330078125, 3.27734375, 3.42138671875, 3.5654296875, 3.70947265625, 3.853515625, 3.99755859375, 4.1416015625, 4.28564453125, 4.4296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 11.0, 13.0, 22.0, 45.0, 49.0, 68.0, 112.0, 171.0, 250.0, 372.0, 693.0, 1064.0, 2210.0, 5194.0, 16082.0, 87723.0, 757880.0, 142455.0, 22103.0, 6388.0, 2512.0, 1247.0, 643.0, 412.0, 237.0, 145.0, 112.0, 83.0, 59.0, 41.0, 29.0, 37.0, 16.0, 8.0, 10.0, 11.0, 2.0, 6.0, 3.0, 2.0, 3.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.21875, -20.58740234375, -19.9560546875, -19.32470703125, -18.693359375, -18.06201171875, -17.4306640625, -16.79931640625, -16.16796875, -15.53662109375, -14.9052734375, -14.27392578125, -13.642578125, -13.01123046875, -12.3798828125, -11.74853515625, -11.1171875, -10.48583984375, -9.8544921875, -9.22314453125, -8.591796875, -7.96044921875, -7.3291015625, -6.69775390625, -6.06640625, -5.43505859375, -4.8037109375, -4.17236328125, -3.541015625, -2.90966796875, -2.2783203125, -1.64697265625, -1.015625, -0.38427734375, 0.2470703125, 0.87841796875, 1.509765625, 2.14111328125, 2.7724609375, 3.40380859375, 4.03515625, 4.66650390625, 5.2978515625, 5.92919921875, 6.560546875, 7.19189453125, 7.8232421875, 8.45458984375, 9.0859375, 9.71728515625, 10.3486328125, 10.97998046875, 11.611328125, 12.24267578125, 12.8740234375, 13.50537109375, 14.13671875, 14.76806640625, 15.3994140625, 16.03076171875, 16.662109375, 17.29345703125, 17.9248046875, 18.55615234375, 19.1875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 9.0, 7.0, 6.0, 9.0, 14.0, 12.0, 15.0, 23.0, 35.0, 27.0, 44.0, 36.0, 56.0, 42.0, 55.0, 66.0, 72.0, 55.0, 54.0, 59.0, 46.0, 44.0, 40.0, 33.0, 27.0, 21.0, 13.0, 22.0, 16.0, 11.0, 5.0, 9.0, 5.0, 2.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.75, -23.955078125, -23.16015625, -22.365234375, -21.5703125, -20.775390625, -19.98046875, -19.185546875, -18.390625, -17.595703125, -16.80078125, -16.005859375, -15.2109375, -14.416015625, -13.62109375, -12.826171875, -12.03125, -11.236328125, -10.44140625, -9.646484375, -8.8515625, -8.056640625, -7.26171875, -6.466796875, -5.671875, -4.876953125, -4.08203125, -3.287109375, -2.4921875, -1.697265625, -0.90234375, -0.107421875, 0.6875, 1.482421875, 2.27734375, 3.072265625, 3.8671875, 4.662109375, 5.45703125, 6.251953125, 7.046875, 7.841796875, 8.63671875, 9.431640625, 10.2265625, 11.021484375, 11.81640625, 12.611328125, 13.40625, 14.201171875, 14.99609375, 15.791015625, 16.5859375, 17.380859375, 18.17578125, 18.970703125, 19.765625, 20.560546875, 21.35546875, 22.150390625, 22.9453125, 23.740234375, 24.53515625, 25.330078125, 26.125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 12.0, 13.0, 28.0, 29.0, 49.0, 83.0, 99.0, 210.0, 351.0, 686.0, 1370.0, 3422.0, 11430.0, 69883.0, 814750.0, 122365.0, 15828.0, 4350.0, 1739.0, 798.0, 439.0, 236.0, 126.0, 83.0, 51.0, 41.0, 27.0, 10.0, 10.0, 9.0, 5.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.296875, -11.9197998046875, -11.542724609375, -11.1656494140625, -10.78857421875, -10.4114990234375, -10.034423828125, -9.6573486328125, -9.2802734375, -8.9031982421875, -8.526123046875, -8.1490478515625, -7.77197265625, -7.3948974609375, -7.017822265625, -6.6407470703125, -6.263671875, -5.8865966796875, -5.509521484375, -5.1324462890625, -4.75537109375, -4.3782958984375, -4.001220703125, -3.6241455078125, -3.2470703125, -2.8699951171875, -2.492919921875, -2.1158447265625, -1.73876953125, -1.3616943359375, -0.984619140625, -0.6075439453125, -0.23046875, 0.1466064453125, 0.523681640625, 0.9007568359375, 1.27783203125, 1.6549072265625, 2.031982421875, 2.4090576171875, 2.7861328125, 3.1632080078125, 3.540283203125, 3.9173583984375, 4.29443359375, 4.6715087890625, 5.048583984375, 5.4256591796875, 5.802734375, 6.1798095703125, 6.556884765625, 6.9339599609375, 7.31103515625, 7.6881103515625, 8.065185546875, 8.4422607421875, 8.8193359375, 9.1964111328125, 9.573486328125, 9.9505615234375, 10.32763671875, 10.7047119140625, 11.081787109375, 11.4588623046875, 11.8359375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 9.0, 13.0, 21.0, 48.0, 79.0, 148.0, 263.0, 161.0, 89.0, 58.0, 34.0, 19.0, 13.0, 4.0, 10.0, 4.0, 4.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032062530517578125, -0.0030764639377593994, -0.0029466748237609863, -0.0028168857097625732, -0.00268709659576416, -0.002557307481765747, -0.002427518367767334, -0.002297729253768921, -0.002167940139770508, -0.0020381510257720947, -0.0019083619117736816, -0.0017785727977752686, -0.0016487836837768555, -0.0015189945697784424, -0.0013892054557800293, -0.0012594163417816162, -0.0011296272277832031, -0.00099983811378479, -0.000870048999786377, -0.0007402598857879639, -0.0006104707717895508, -0.0004806816577911377, -0.0003508925437927246, -0.00022110342979431152, -9.131431579589844e-05, 3.847479820251465e-05, 0.00016826391220092773, 0.0002980530261993408, 0.0004278421401977539, 0.000557631254196167, 0.0006874203681945801, 0.0008172094821929932, 0.0009469985961914062, 0.0010767877101898193, 0.0012065768241882324, 0.0013363659381866455, 0.0014661550521850586, 0.0015959441661834717, 0.0017257332801818848, 0.0018555223941802979, 0.001985311508178711, 0.002115100622177124, 0.002244889736175537, 0.00237467885017395, 0.0025044679641723633, 0.0026342570781707764, 0.0027640461921691895, 0.0028938353061676025, 0.0030236244201660156, 0.0031534135341644287, 0.003283202648162842, 0.003412991762161255, 0.003542780876159668, 0.003672569990158081, 0.003802359104156494, 0.003932148218154907, 0.00406193733215332, 0.004191726446151733, 0.0043215155601501465, 0.00445130467414856, 0.004581093788146973, 0.004710882902145386, 0.004840672016143799, 0.004970461130142212, 0.005100250244140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 10.0, 10.0, 9.0, 8.0, 17.0, 17.0, 33.0, 38.0, 86.0, 99.0, 189.0, 296.0, 489.0, 836.0, 1553.0, 3288.0, 7792.0, 24055.0, 128526.0, 742666.0, 103669.0, 21189.0, 7059.0, 2999.0, 1540.0, 789.0, 412.0, 299.0, 189.0, 125.0, 83.0, 60.0, 28.0, 28.0, 20.0, 7.0, 12.0, 9.0, 4.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-10.7109375, -10.4249267578125, -10.138916015625, -9.8529052734375, -9.56689453125, -9.2808837890625, -8.994873046875, -8.7088623046875, -8.4228515625, -8.1368408203125, -7.850830078125, -7.5648193359375, -7.27880859375, -6.9927978515625, -6.706787109375, -6.4207763671875, -6.134765625, -5.8487548828125, -5.562744140625, -5.2767333984375, -4.99072265625, -4.7047119140625, -4.418701171875, -4.1326904296875, -3.8466796875, -3.5606689453125, -3.274658203125, -2.9886474609375, -2.70263671875, -2.4166259765625, -2.130615234375, -1.8446044921875, -1.55859375, -1.2725830078125, -0.986572265625, -0.7005615234375, -0.41455078125, -0.1285400390625, 0.157470703125, 0.4434814453125, 0.7294921875, 1.0155029296875, 1.301513671875, 1.5875244140625, 1.87353515625, 2.1595458984375, 2.445556640625, 2.7315673828125, 3.017578125, 3.3035888671875, 3.589599609375, 3.8756103515625, 4.16162109375, 4.4476318359375, 4.733642578125, 5.0196533203125, 5.3056640625, 5.5916748046875, 5.877685546875, 6.1636962890625, 6.44970703125, 6.7357177734375, 7.021728515625, 7.3077392578125, 7.59375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 9.0, 6.0, 10.0, 11.0, 13.0, 24.0, 20.0, 17.0, 26.0, 39.0, 36.0, 53.0, 66.0, 93.0, 92.0, 109.0, 85.0, 61.0, 48.0, 44.0, 27.0, 24.0, 23.0, 19.0, 7.0, 8.0, 5.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-9.453125, -9.19451904296875, -8.9359130859375, -8.67730712890625, -8.418701171875, -8.16009521484375, -7.9014892578125, -7.64288330078125, -7.38427734375, -7.12567138671875, -6.8670654296875, -6.60845947265625, -6.349853515625, -6.09124755859375, -5.8326416015625, -5.57403564453125, -5.3154296875, -5.05682373046875, -4.7982177734375, -4.53961181640625, -4.281005859375, -4.02239990234375, -3.7637939453125, -3.50518798828125, -3.24658203125, -2.98797607421875, -2.7293701171875, -2.47076416015625, -2.212158203125, -1.95355224609375, -1.6949462890625, -1.43634033203125, -1.177734375, -0.91912841796875, -0.6605224609375, -0.40191650390625, -0.143310546875, 0.11529541015625, 0.3739013671875, 0.63250732421875, 0.89111328125, 1.14971923828125, 1.4083251953125, 1.66693115234375, 1.925537109375, 2.18414306640625, 2.4427490234375, 2.70135498046875, 2.9599609375, 3.21856689453125, 3.4771728515625, 3.73577880859375, 3.994384765625, 4.25299072265625, 4.5115966796875, 4.77020263671875, 5.02880859375, 5.28741455078125, 5.5460205078125, 5.80462646484375, 6.063232421875, 6.32183837890625, 6.5804443359375, 6.83905029296875, 7.09765625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 3.0, 7.0, 17.0, 25.0, 57.0, 120.0, 235.0, 316.0, 138.0, 47.0, 20.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.24142456054688, -169.92918395996094, -162.616943359375, -155.30471801757812, -147.9924774169922, -140.68023681640625, -133.3679962158203, -126.05575561523438, -118.74352264404297, -111.43128204345703, -104.11904907226562, -96.80680847167969, -89.49456787109375, -82.18233489990234, -74.8700942993164, -67.557861328125, -60.24562072753906, -52.93338394165039, -45.62114715576172, -38.30890655517578, -30.99666976928711, -23.684432983398438, -16.3721923828125, -9.059955596923828, -1.7477188110351562, 5.564518928527832, 12.87675666809082, 20.188995361328125, 27.501232147216797, 34.81346893310547, 42.125709533691406, 49.43794631958008, 56.75018310546875, 64.06242370605469, 71.3746566772461, 78.68689727783203, 85.99913024902344, 93.31137084960938, 100.62361145019531, 107.93585205078125, 115.24808502197266, 122.5603256225586, 129.87255859375, 137.18479919433594, 144.49703979492188, 151.80926513671875, 159.12152099609375, 166.43374633789062, 173.74598693847656, 181.0582275390625, 188.37046813964844, 195.68270874023438, 202.99493408203125, 210.3071746826172, 217.61941528320312, 224.93165588378906, 232.243896484375, 239.55613708496094, 246.86837768554688, 254.18060302734375, 261.49285888671875, 268.8050842285156, 276.1173095703125, 283.4295654296875, 290.7417907714844]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 4.0, 11.0, 3.0, 11.0, 4.0, 9.0, 14.0, 12.0, 21.0, 18.0, 17.0, 26.0, 29.0, 23.0, 30.0, 40.0, 51.0, 49.0, 64.0, 67.0, 64.0, 56.0, 51.0, 36.0, 31.0, 35.0, 26.0, 31.0, 30.0, 24.0, 22.0, 21.0, 7.0, 12.0, 10.0, 8.0, 8.0, 4.0, 7.0, 10.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-96.14286804199219, -93.28614044189453, -90.4294204711914, -87.57269287109375, -84.71597290039062, -81.85924530029297, -79.00251770019531, -76.14579772949219, -73.28907775878906, -70.4323501586914, -67.57563018798828, -64.71890258789062, -61.8621826171875, -59.005455017089844, -56.14873123168945, -53.29200744628906, -50.435279846191406, -47.578556060791016, -44.721832275390625, -41.86510467529297, -39.008384704589844, -36.15165710449219, -33.2949333190918, -30.438209533691406, -27.581485748291016, -24.724761962890625, -21.868038177490234, -19.01131248474121, -16.15458869934082, -13.29786491394043, -10.441139221191406, -7.584415435791016, -4.727691650390625, -1.8709673881530762, 0.9857568740844727, 3.8424816131591797, 6.69920539855957, 9.555929183959961, 12.412654876708984, 15.269378662109375, 18.126102447509766, 20.982826232910156, 23.839550018310547, 26.69627571105957, 29.55299949645996, 32.40972137451172, 35.266448974609375, 38.123172760009766, 40.979896545410156, 43.83662033081055, 46.69334411621094, 49.550071716308594, 52.40679168701172, 55.263519287109375, 58.120243072509766, 60.976966857910156, 63.83369064331055, 66.69041442871094, 69.5471420288086, 72.40386199951172, 75.26058959960938, 78.1173095703125, 80.97403717041016, 83.83076477050781, 86.68748474121094]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 12.0, 30.0, 33.0, 31.0, 54.0, 70.0, 104.0, 196.0, 363.0, 709.0, 1593.0, 4890.0, 27291.0, 757160.0, 3293747.0, 92504.0, 10483.0, 2803.0, 1006.0, 544.0, 264.0, 152.0, 78.0, 46.0, 41.0, 20.0, 14.0, 9.0, 6.0, 2.0, 10.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.59375, -13.158447265625, -12.72314453125, -12.287841796875, -11.8525390625, -11.417236328125, -10.98193359375, -10.546630859375, -10.111328125, -9.676025390625, -9.24072265625, -8.805419921875, -8.3701171875, -7.934814453125, -7.49951171875, -7.064208984375, -6.62890625, -6.193603515625, -5.75830078125, -5.322998046875, -4.8876953125, -4.452392578125, -4.01708984375, -3.581787109375, -3.146484375, -2.711181640625, -2.27587890625, -1.840576171875, -1.4052734375, -0.969970703125, -0.53466796875, -0.099365234375, 0.3359375, 0.771240234375, 1.20654296875, 1.641845703125, 2.0771484375, 2.512451171875, 2.94775390625, 3.383056640625, 3.818359375, 4.253662109375, 4.68896484375, 5.124267578125, 5.5595703125, 5.994873046875, 6.43017578125, 6.865478515625, 7.30078125, 7.736083984375, 8.17138671875, 8.606689453125, 9.0419921875, 9.477294921875, 9.91259765625, 10.347900390625, 10.783203125, 11.218505859375, 11.65380859375, 12.089111328125, 12.5244140625, 12.959716796875, 13.39501953125, 13.830322265625, 14.265625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 4.0, 5.0, 9.0, 5.0, 9.0, 10.0, 8.0, 12.0, 17.0, 18.0, 31.0, 26.0, 27.0, 30.0, 37.0, 48.0, 52.0, 50.0, 72.0, 46.0, 47.0, 57.0, 40.0, 53.0, 49.0, 40.0, 31.0, 30.0, 30.0, 21.0, 11.0, 12.0, 16.0, 12.0, 7.0, 11.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30078125, -5.14208984375, -4.9833984375, -4.82470703125, -4.666015625, -4.50732421875, -4.3486328125, -4.18994140625, -4.03125, -3.87255859375, -3.7138671875, -3.55517578125, -3.396484375, -3.23779296875, -3.0791015625, -2.92041015625, -2.76171875, -2.60302734375, -2.4443359375, -2.28564453125, -2.126953125, -1.96826171875, -1.8095703125, -1.65087890625, -1.4921875, -1.33349609375, -1.1748046875, -1.01611328125, -0.857421875, -0.69873046875, -0.5400390625, -0.38134765625, -0.22265625, -0.06396484375, 0.0947265625, 0.25341796875, 0.412109375, 0.57080078125, 0.7294921875, 0.88818359375, 1.046875, 1.20556640625, 1.3642578125, 1.52294921875, 1.681640625, 1.84033203125, 1.9990234375, 2.15771484375, 2.31640625, 2.47509765625, 2.6337890625, 2.79248046875, 2.951171875, 3.10986328125, 3.2685546875, 3.42724609375, 3.5859375, 3.74462890625, 3.9033203125, 4.06201171875, 4.220703125, 4.37939453125, 4.5380859375, 4.69677734375, 4.85546875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 7.0, 14.0, 10.0, 9.0, 13.0, 35.0, 27.0, 41.0, 66.0, 108.0, 229.0, 860.0, 6476.0, 3889371.0, 292407.0, 3262.0, 670.0, 261.0, 121.0, 70.0, 51.0, 41.0, 26.0, 25.0, 25.0, 16.0, 13.0, 7.0, 9.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.75, -64.939453125, -63.12890625, -61.318359375, -59.5078125, -57.697265625, -55.88671875, -54.076171875, -52.265625, -50.455078125, -48.64453125, -46.833984375, -45.0234375, -43.212890625, -41.40234375, -39.591796875, -37.78125, -35.970703125, -34.16015625, -32.349609375, -30.5390625, -28.728515625, -26.91796875, -25.107421875, -23.296875, -21.486328125, -19.67578125, -17.865234375, -16.0546875, -14.244140625, -12.43359375, -10.623046875, -8.8125, -7.001953125, -5.19140625, -3.380859375, -1.5703125, 0.240234375, 2.05078125, 3.861328125, 5.671875, 7.482421875, 9.29296875, 11.103515625, 12.9140625, 14.724609375, 16.53515625, 18.345703125, 20.15625, 21.966796875, 23.77734375, 25.587890625, 27.3984375, 29.208984375, 31.01953125, 32.830078125, 34.640625, 36.451171875, 38.26171875, 40.072265625, 41.8828125, 43.693359375, 45.50390625, 47.314453125, 49.125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 10.0, 11.0, 26.0, 58.0, 104.0, 310.0, 900.0, 1540.0, 698.0, 225.0, 88.0, 54.0, 23.0, 7.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.03125, -15.2041015625, -14.376953125, -13.5498046875, -12.72265625, -11.8955078125, -11.068359375, -10.2412109375, -9.4140625, -8.5869140625, -7.759765625, -6.9326171875, -6.10546875, -5.2783203125, -4.451171875, -3.6240234375, -2.796875, -1.9697265625, -1.142578125, -0.3154296875, 0.51171875, 1.3388671875, 2.166015625, 2.9931640625, 3.8203125, 4.6474609375, 5.474609375, 6.3017578125, 7.12890625, 7.9560546875, 8.783203125, 9.6103515625, 10.4375, 11.2646484375, 12.091796875, 12.9189453125, 13.74609375, 14.5732421875, 15.400390625, 16.2275390625, 17.0546875, 17.8818359375, 18.708984375, 19.5361328125, 20.36328125, 21.1904296875, 22.017578125, 22.8447265625, 23.671875, 24.4990234375, 25.326171875, 26.1533203125, 26.98046875, 27.8076171875, 28.634765625, 29.4619140625, 30.2890625, 31.1162109375, 31.943359375, 32.7705078125, 33.59765625, 34.4248046875, 35.251953125, 36.0791015625, 36.90625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 13.0, 10.0, 23.0, 60.0, 178.0, 336.0, 227.0, 83.0, 37.0, 17.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-144.11822509765625, -134.9344940185547, -125.75074768066406, -116.5670166015625, -107.3832778930664, -98.19953918457031, -89.01580810546875, -79.83206939697266, -70.64833068847656, -61.46459197998047, -52.28085708618164, -43.09712219238281, -33.91338348388672, -24.729644775390625, -15.545909881591797, -6.362174987792969, 2.821563720703125, 12.005300521850586, 21.189037322998047, 30.372774124145508, 39.55651092529297, 48.74024963378906, 57.92398452758789, 67.10771942138672, 76.29145812988281, 85.4751968383789, 94.658935546875, 103.84266662597656, 113.02640533447266, 122.21014404296875, 131.3938751220703, 140.57760620117188, 149.76132202148438, 158.94505310058594, 168.12879943847656, 177.31253051757812, 186.49627685546875, 195.6800079345703, 204.86373901367188, 214.0474853515625, 223.23121643066406, 232.41494750976562, 241.59869384765625, 250.7824249267578, 259.9661560058594, 269.14990234375, 278.3336486816406, 287.5173645019531, 296.70111083984375, 305.8848571777344, 315.0685729980469, 324.2523193359375, 333.4360656738281, 342.61981201171875, 351.80352783203125, 360.9872741699219, 370.1710205078125, 379.3547668457031, 388.5384826660156, 397.72222900390625, 406.9059753417969, 416.0897216796875, 425.2734375, 434.4571838378906, 443.6408996582031]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 7.0, 6.0, 7.0, 18.0, 22.0, 15.0, 17.0, 33.0, 35.0, 29.0, 36.0, 42.0, 33.0, 50.0, 53.0, 55.0, 55.0, 46.0, 57.0, 43.0, 34.0, 45.0, 36.0, 31.0, 20.0, 20.0, 24.0, 19.0, 20.0, 16.0, 17.0, 12.0, 8.0, 6.0, 6.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.015933990478516, -55.159820556640625, -53.3037109375, -51.44759750366211, -49.59148406982422, -47.735374450683594, -45.8792610168457, -44.02314758300781, -42.16703796386719, -40.3109245300293, -38.45481491088867, -36.59870147705078, -34.742591857910156, -32.886478424072266, -31.030364990234375, -29.174253463745117, -27.31814193725586, -25.4620304107666, -23.605918884277344, -21.749805450439453, -19.893693923950195, -18.037582397460938, -16.181468963623047, -14.325357437133789, -12.469245910644531, -10.613134384155273, -8.7570219039917, -6.900909900665283, -5.044797897338867, -3.1886863708496094, -1.3325738906860352, 0.5235385894775391, 2.3796463012695312, 4.235758304595947, 6.091870307922363, 7.947982311248779, 9.804094314575195, 11.660205841064453, 13.516318321228027, 15.372430801391602, 17.22854232788086, 19.084653854370117, 20.940765380859375, 22.796878814697266, 24.652990341186523, 26.50910186767578, 28.365215301513672, 30.22132682800293, 32.07743835449219, 33.93355178833008, 35.7896614074707, 37.645774841308594, 39.50188446044922, 41.35799789428711, 43.214111328125, 45.070220947265625, 46.926334381103516, 48.782447814941406, 50.63855743408203, 52.49467086791992, 54.35078430175781, 56.20689392089844, 58.06300735473633, 59.91912078857422, 61.775230407714844]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 17.0, 14.0, 21.0, 28.0, 58.0, 77.0, 110.0, 214.0, 391.0, 653.0, 1390.0, 3684.0, 12839.0, 81156.0, 667060.0, 243552.0, 26865.0, 6186.0, 2138.0, 910.0, 462.0, 262.0, 150.0, 100.0, 62.0, 38.0, 31.0, 29.0, 13.0, 8.0, 8.0, 5.0, 5.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.484375, -16.9659423828125, -16.447509765625, -15.9290771484375, -15.41064453125, -14.8922119140625, -14.373779296875, -13.8553466796875, -13.3369140625, -12.8184814453125, -12.300048828125, -11.7816162109375, -11.26318359375, -10.7447509765625, -10.226318359375, -9.7078857421875, -9.189453125, -8.6710205078125, -8.152587890625, -7.6341552734375, -7.11572265625, -6.5972900390625, -6.078857421875, -5.5604248046875, -5.0419921875, -4.5235595703125, -4.005126953125, -3.4866943359375, -2.96826171875, -2.4498291015625, -1.931396484375, -1.4129638671875, -0.89453125, -0.3760986328125, 0.142333984375, 0.6607666015625, 1.17919921875, 1.6976318359375, 2.216064453125, 2.7344970703125, 3.2529296875, 3.7713623046875, 4.289794921875, 4.8082275390625, 5.32666015625, 5.8450927734375, 6.363525390625, 6.8819580078125, 7.400390625, 7.9188232421875, 8.437255859375, 8.9556884765625, 9.47412109375, 9.9925537109375, 10.510986328125, 11.0294189453125, 11.5478515625, 12.0662841796875, 12.584716796875, 13.1031494140625, 13.62158203125, 14.1400146484375, 14.658447265625, 15.1768798828125, 15.6953125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 4.0, 5.0, 11.0, 12.0, 8.0, 22.0, 27.0, 35.0, 46.0, 45.0, 62.0, 60.0, 58.0, 78.0, 62.0, 51.0, 63.0, 59.0, 79.0, 65.0, 38.0, 23.0, 24.0, 16.0, 10.0, 13.0, 10.0, 1.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.40625, -8.1597900390625, -7.913330078125, -7.6668701171875, -7.42041015625, -7.1739501953125, -6.927490234375, -6.6810302734375, -6.4345703125, -6.1881103515625, -5.941650390625, -5.6951904296875, -5.44873046875, -5.2022705078125, -4.955810546875, -4.7093505859375, -4.462890625, -4.2164306640625, -3.969970703125, -3.7235107421875, -3.47705078125, -3.2305908203125, -2.984130859375, -2.7376708984375, -2.4912109375, -2.2447509765625, -1.998291015625, -1.7518310546875, -1.50537109375, -1.2589111328125, -1.012451171875, -0.7659912109375, -0.51953125, -0.2730712890625, -0.026611328125, 0.2198486328125, 0.46630859375, 0.7127685546875, 0.959228515625, 1.2056884765625, 1.4521484375, 1.6986083984375, 1.945068359375, 2.1915283203125, 2.43798828125, 2.6844482421875, 2.930908203125, 3.1773681640625, 3.423828125, 3.6702880859375, 3.916748046875, 4.1632080078125, 4.40966796875, 4.6561279296875, 4.902587890625, 5.1490478515625, 5.3955078125, 5.6419677734375, 5.888427734375, 6.1348876953125, 6.38134765625, 6.6278076171875, 6.874267578125, 7.1207275390625, 7.3671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 7.0, 16.0, 15.0, 24.0, 24.0, 53.0, 81.0, 96.0, 184.0, 353.0, 594.0, 1267.0, 2680.0, 7218.0, 34328.0, 643569.0, 322452.0, 24875.0, 5924.0, 2356.0, 1133.0, 518.0, 296.0, 160.0, 112.0, 59.0, 48.0, 28.0, 16.0, 15.0, 13.0, 7.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.1875, -18.546142578125, -17.90478515625, -17.263427734375, -16.6220703125, -15.980712890625, -15.33935546875, -14.697998046875, -14.056640625, -13.415283203125, -12.77392578125, -12.132568359375, -11.4912109375, -10.849853515625, -10.20849609375, -9.567138671875, -8.92578125, -8.284423828125, -7.64306640625, -7.001708984375, -6.3603515625, -5.718994140625, -5.07763671875, -4.436279296875, -3.794921875, -3.153564453125, -2.51220703125, -1.870849609375, -1.2294921875, -0.588134765625, 0.05322265625, 0.694580078125, 1.3359375, 1.977294921875, 2.61865234375, 3.260009765625, 3.9013671875, 4.542724609375, 5.18408203125, 5.825439453125, 6.466796875, 7.108154296875, 7.74951171875, 8.390869140625, 9.0322265625, 9.673583984375, 10.31494140625, 10.956298828125, 11.59765625, 12.239013671875, 12.88037109375, 13.521728515625, 14.1630859375, 14.804443359375, 15.44580078125, 16.087158203125, 16.728515625, 17.369873046875, 18.01123046875, 18.652587890625, 19.2939453125, 19.935302734375, 20.57666015625, 21.218017578125, 21.859375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 5.0, 8.0, 5.0, 7.0, 12.0, 12.0, 17.0, 22.0, 22.0, 29.0, 30.0, 32.0, 39.0, 34.0, 42.0, 48.0, 40.0, 48.0, 40.0, 54.0, 51.0, 44.0, 45.0, 31.0, 47.0, 38.0, 24.0, 27.0, 24.0, 15.0, 10.0, 15.0, 13.0, 7.0, 10.0, 7.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.234375, -17.630615234375, -17.02685546875, -16.423095703125, -15.8193359375, -15.215576171875, -14.61181640625, -14.008056640625, -13.404296875, -12.800537109375, -12.19677734375, -11.593017578125, -10.9892578125, -10.385498046875, -9.78173828125, -9.177978515625, -8.57421875, -7.970458984375, -7.36669921875, -6.762939453125, -6.1591796875, -5.555419921875, -4.95166015625, -4.347900390625, -3.744140625, -3.140380859375, -2.53662109375, -1.932861328125, -1.3291015625, -0.725341796875, -0.12158203125, 0.482177734375, 1.0859375, 1.689697265625, 2.29345703125, 2.897216796875, 3.5009765625, 4.104736328125, 4.70849609375, 5.312255859375, 5.916015625, 6.519775390625, 7.12353515625, 7.727294921875, 8.3310546875, 8.934814453125, 9.53857421875, 10.142333984375, 10.74609375, 11.349853515625, 11.95361328125, 12.557373046875, 13.1611328125, 13.764892578125, 14.36865234375, 14.972412109375, 15.576171875, 16.179931640625, 16.78369140625, 17.387451171875, 17.9912109375, 18.594970703125, 19.19873046875, 19.802490234375, 20.40625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 12.0, 10.0, 8.0, 27.0, 27.0, 52.0, 95.0, 145.0, 244.0, 428.0, 767.0, 1639.0, 3537.0, 8945.0, 26922.0, 117976.0, 676831.0, 159335.0, 32877.0, 10532.0, 4207.0, 1886.0, 887.0, 468.0, 277.0, 160.0, 86.0, 65.0, 31.0, 27.0, 13.0, 16.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.546875, -6.3519287109375, -6.156982421875, -5.9620361328125, -5.76708984375, -5.5721435546875, -5.377197265625, -5.1822509765625, -4.9873046875, -4.7923583984375, -4.597412109375, -4.4024658203125, -4.20751953125, -4.0125732421875, -3.817626953125, -3.6226806640625, -3.427734375, -3.2327880859375, -3.037841796875, -2.8428955078125, -2.64794921875, -2.4530029296875, -2.258056640625, -2.0631103515625, -1.8681640625, -1.6732177734375, -1.478271484375, -1.2833251953125, -1.08837890625, -0.8934326171875, -0.698486328125, -0.5035400390625, -0.30859375, -0.1136474609375, 0.081298828125, 0.2762451171875, 0.47119140625, 0.6661376953125, 0.861083984375, 1.0560302734375, 1.2509765625, 1.4459228515625, 1.640869140625, 1.8358154296875, 2.03076171875, 2.2257080078125, 2.420654296875, 2.6156005859375, 2.810546875, 3.0054931640625, 3.200439453125, 3.3953857421875, 3.59033203125, 3.7852783203125, 3.980224609375, 4.1751708984375, 4.3701171875, 4.5650634765625, 4.760009765625, 4.9549560546875, 5.14990234375, 5.3448486328125, 5.539794921875, 5.7347412109375, 5.9296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 12.0, 19.0, 33.0, 70.0, 142.0, 268.0, 226.0, 104.0, 42.0, 24.0, 19.0, 12.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003711700439453125, -0.003595024347305298, -0.0034783482551574707, -0.0033616721630096436, -0.0032449960708618164, -0.0031283199787139893, -0.003011643886566162, -0.002894967794418335, -0.002778291702270508, -0.0026616156101226807, -0.0025449395179748535, -0.0024282634258270264, -0.0023115873336791992, -0.002194911241531372, -0.002078235149383545, -0.0019615590572357178, -0.0018448829650878906, -0.0017282068729400635, -0.0016115307807922363, -0.0014948546886444092, -0.001378178596496582, -0.0012615025043487549, -0.0011448264122009277, -0.0010281503200531006, -0.0009114742279052734, -0.0007947981357574463, -0.0006781220436096191, -0.000561445951461792, -0.00044476985931396484, -0.0003280937671661377, -0.00021141767501831055, -9.47415828704834e-05, 2.193450927734375e-05, 0.0001386106014251709, 0.00025528669357299805, 0.0003719627857208252, 0.0004886388778686523, 0.0006053149700164795, 0.0007219910621643066, 0.0008386671543121338, 0.0009553432464599609, 0.001072019338607788, 0.0011886954307556152, 0.0013053715229034424, 0.0014220476150512695, 0.0015387237071990967, 0.0016553997993469238, 0.001772075891494751, 0.0018887519836425781, 0.0020054280757904053, 0.0021221041679382324, 0.0022387802600860596, 0.0023554563522338867, 0.002472132444381714, 0.002588808536529541, 0.002705484628677368, 0.0028221607208251953, 0.0029388368129730225, 0.0030555129051208496, 0.0031721889972686768, 0.003288865089416504, 0.003405541181564331, 0.003522217273712158, 0.0036388933658599854, 0.0037555694580078125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 7.0, 9.0, 12.0, 22.0, 36.0, 53.0, 58.0, 137.0, 193.0, 356.0, 691.0, 1368.0, 2969.0, 6619.0, 17584.0, 56455.0, 244970.0, 575681.0, 96395.0, 27112.0, 9736.0, 4187.0, 1841.0, 925.0, 478.0, 267.0, 147.0, 79.0, 55.0, 40.0, 26.0, 18.0, 6.0, 7.0, 6.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.460205078125, -4.27587890625, -4.091552734375, -3.9072265625, -3.722900390625, -3.53857421875, -3.354248046875, -3.169921875, -2.985595703125, -2.80126953125, -2.616943359375, -2.4326171875, -2.248291015625, -2.06396484375, -1.879638671875, -1.6953125, -1.510986328125, -1.32666015625, -1.142333984375, -0.9580078125, -0.773681640625, -0.58935546875, -0.405029296875, -0.220703125, -0.036376953125, 0.14794921875, 0.332275390625, 0.5166015625, 0.700927734375, 0.88525390625, 1.069580078125, 1.25390625, 1.438232421875, 1.62255859375, 1.806884765625, 1.9912109375, 2.175537109375, 2.35986328125, 2.544189453125, 2.728515625, 2.912841796875, 3.09716796875, 3.281494140625, 3.4658203125, 3.650146484375, 3.83447265625, 4.018798828125, 4.203125, 4.387451171875, 4.57177734375, 4.756103515625, 4.9404296875, 5.124755859375, 5.30908203125, 5.493408203125, 5.677734375, 5.862060546875, 6.04638671875, 6.230712890625, 6.4150390625, 6.599365234375, 6.78369140625, 6.968017578125, 7.15234375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 8.0, 8.0, 12.0, 13.0, 22.0, 31.0, 11.0, 27.0, 35.0, 43.0, 47.0, 60.0, 72.0, 91.0, 66.0, 76.0, 46.0, 54.0, 43.0, 39.0, 36.0, 15.0, 30.0, 17.0, 21.0, 5.0, 8.0, 7.0, 8.0, 6.0, 9.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.2109375, -4.0753173828125, -3.939697265625, -3.8040771484375, -3.66845703125, -3.5328369140625, -3.397216796875, -3.2615966796875, -3.1259765625, -2.9903564453125, -2.854736328125, -2.7191162109375, -2.58349609375, -2.4478759765625, -2.312255859375, -2.1766357421875, -2.041015625, -1.9053955078125, -1.769775390625, -1.6341552734375, -1.49853515625, -1.3629150390625, -1.227294921875, -1.0916748046875, -0.9560546875, -0.8204345703125, -0.684814453125, -0.5491943359375, -0.41357421875, -0.2779541015625, -0.142333984375, -0.0067138671875, 0.12890625, 0.2645263671875, 0.400146484375, 0.5357666015625, 0.67138671875, 0.8070068359375, 0.942626953125, 1.0782470703125, 1.2138671875, 1.3494873046875, 1.485107421875, 1.6207275390625, 1.75634765625, 1.8919677734375, 2.027587890625, 2.1632080078125, 2.298828125, 2.4344482421875, 2.570068359375, 2.7056884765625, 2.84130859375, 2.9769287109375, 3.112548828125, 3.2481689453125, 3.3837890625, 3.5194091796875, 3.655029296875, 3.7906494140625, 3.92626953125, 4.0618896484375, 4.197509765625, 4.3331298828125, 4.46875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 27.0, 80.0, 330.0, 367.0, 113.0, 40.0, 13.0, 11.0, 7.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.26854705810547, -85.72735595703125, -77.1861572265625, -68.64496612548828, -60.10377502441406, -51.562583923339844, -43.02138900756836, -34.480194091796875, -25.939002990722656, -17.397809982299805, -8.856616973876953, -0.31542396545410156, 8.22576904296875, 16.76696014404297, 25.308155059814453, 33.84934997558594, 42.390541076660156, 50.931732177734375, 59.47292709350586, 68.01412200927734, 76.55531311035156, 85.09650421142578, 93.6376953125, 102.17889404296875, 110.72008514404297, 119.26127624511719, 127.80247497558594, 136.34365844726562, 144.88485717773438, 153.42605590820312, 161.9672393798828, 170.50843811035156, 179.04962158203125, 187.5908203125, 196.1320037841797, 204.67320251464844, 213.21438598632812, 221.75558471679688, 230.29678344726562, 238.83798217773438, 247.37916564941406, 255.9203643798828, 264.4615478515625, 273.00274658203125, 281.5439453125, 290.08514404296875, 298.6263122558594, 307.1675109863281, 315.7087097167969, 324.2499084472656, 332.7911071777344, 341.332275390625, 349.87347412109375, 358.4146728515625, 366.95587158203125, 375.4970703125, 384.03826904296875, 392.5794677734375, 401.12066650390625, 409.6618347167969, 418.2030334472656, 426.7442321777344, 435.2854309082031, 443.8266296386719, 452.3677978515625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 7.0, 9.0, 10.0, 8.0, 18.0, 20.0, 24.0, 29.0, 25.0, 50.0, 52.0, 51.0, 64.0, 105.0, 103.0, 96.0, 50.0, 41.0, 34.0, 48.0, 33.0, 25.0, 28.0, 19.0, 13.0, 11.0, 10.0, 4.0, 5.0, 6.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.69261169433594, -102.92444610595703, -99.15628051757812, -95.38811492919922, -91.61994934082031, -87.85177612304688, -84.0836181640625, -80.31544494628906, -76.54727935791016, -72.77911376953125, -69.01094818115234, -65.24278259277344, -61.474613189697266, -57.70644760131836, -53.93828201293945, -50.17011260986328, -46.40195083618164, -42.633785247802734, -38.86561965942383, -35.097450256347656, -31.32928466796875, -27.561119079589844, -23.792953491210938, -20.0247859954834, -16.256620407104492, -12.48845386505127, -8.720287322998047, -4.952121734619141, -1.183955192565918, 2.5842113494873047, 6.352376937866211, 10.12054443359375, 13.888710021972656, 17.656875610351562, 21.4250431060791, 25.193208694458008, 28.961376190185547, 32.72954177856445, 36.49770736694336, 40.26587677001953, 44.03404235839844, 47.802207946777344, 51.57037353515625, 55.338539123535156, 59.10670852661133, 62.874874114990234, 66.64303588867188, 70.41120910644531, 74.17936706542969, 77.9475326538086, 81.7156982421875, 85.4838638305664, 89.25202941894531, 93.02020263671875, 96.78836059570312, 100.55653381347656, 104.32469940185547, 108.09286499023438, 111.86103057861328, 115.62919616699219, 119.3973617553711, 123.16552734375, 126.93370056152344, 130.7018585205078, 134.47003173828125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 6.0, 11.0, 12.0, 17.0, 23.0, 38.0, 62.0, 59.0, 108.0, 154.0, 209.0, 347.0, 570.0, 1060.0, 2187.0, 5983.0, 31014.0, 534948.0, 3420365.0, 171642.0, 17085.0, 4354.0, 1801.0, 891.0, 477.0, 279.0, 180.0, 122.0, 86.0, 52.0, 42.0, 37.0, 20.0, 10.0, 7.0, 2.0, 6.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.9293212890625, -11.522705078125, -11.1160888671875, -10.70947265625, -10.3028564453125, -9.896240234375, -9.4896240234375, -9.0830078125, -8.6763916015625, -8.269775390625, -7.8631591796875, -7.45654296875, -7.0499267578125, -6.643310546875, -6.2366943359375, -5.830078125, -5.4234619140625, -5.016845703125, -4.6102294921875, -4.20361328125, -3.7969970703125, -3.390380859375, -2.9837646484375, -2.5771484375, -2.1705322265625, -1.763916015625, -1.3572998046875, -0.95068359375, -0.5440673828125, -0.137451171875, 0.2691650390625, 0.67578125, 1.0823974609375, 1.489013671875, 1.8956298828125, 2.30224609375, 2.7088623046875, 3.115478515625, 3.5220947265625, 3.9287109375, 4.3353271484375, 4.741943359375, 5.1485595703125, 5.55517578125, 5.9617919921875, 6.368408203125, 6.7750244140625, 7.181640625, 7.5882568359375, 7.994873046875, 8.4014892578125, 8.80810546875, 9.2147216796875, 9.621337890625, 10.0279541015625, 10.4345703125, 10.8411865234375, 11.247802734375, 11.6544189453125, 12.06103515625, 12.4676513671875, 12.874267578125, 13.2808837890625, 13.6875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 6.0, 2.0, 4.0, 4.0, 9.0, 14.0, 9.0, 14.0, 29.0, 23.0, 26.0, 28.0, 40.0, 39.0, 69.0, 46.0, 48.0, 55.0, 53.0, 56.0, 58.0, 55.0, 43.0, 40.0, 30.0, 39.0, 32.0, 21.0, 20.0, 15.0, 14.0, 16.0, 4.0, 9.0, 6.0, 3.0, 4.0, 0.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39453125, -5.20562744140625, -5.0167236328125, -4.82781982421875, -4.638916015625, -4.45001220703125, -4.2611083984375, -4.07220458984375, -3.88330078125, -3.69439697265625, -3.5054931640625, -3.31658935546875, -3.127685546875, -2.93878173828125, -2.7498779296875, -2.56097412109375, -2.3720703125, -2.18316650390625, -1.9942626953125, -1.80535888671875, -1.616455078125, -1.42755126953125, -1.2386474609375, -1.04974365234375, -0.86083984375, -0.67193603515625, -0.4830322265625, -0.29412841796875, -0.105224609375, 0.08367919921875, 0.2725830078125, 0.46148681640625, 0.650390625, 0.83929443359375, 1.0281982421875, 1.21710205078125, 1.406005859375, 1.59490966796875, 1.7838134765625, 1.97271728515625, 2.16162109375, 2.35052490234375, 2.5394287109375, 2.72833251953125, 2.917236328125, 3.10614013671875, 3.2950439453125, 3.48394775390625, 3.6728515625, 3.86175537109375, 4.0506591796875, 4.23956298828125, 4.428466796875, 4.61737060546875, 4.8062744140625, 4.99517822265625, 5.18408203125, 5.37298583984375, 5.5618896484375, 5.75079345703125, 5.939697265625, 6.12860107421875, 6.3175048828125, 6.50640869140625, 6.6953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 9.0, 5.0, 17.0, 26.0, 50.0, 156.0, 452.0, 1896.0, 12331.0, 3609746.0, 559983.0, 7625.0, 1378.0, 366.0, 120.0, 44.0, 18.0, 16.0, 6.0, 7.0, 4.0, 4.0, 2.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.75, -41.4501953125, -40.150390625, -38.8505859375, -37.55078125, -36.2509765625, -34.951171875, -33.6513671875, -32.3515625, -31.0517578125, -29.751953125, -28.4521484375, -27.15234375, -25.8525390625, -24.552734375, -23.2529296875, -21.953125, -20.6533203125, -19.353515625, -18.0537109375, -16.75390625, -15.4541015625, -14.154296875, -12.8544921875, -11.5546875, -10.2548828125, -8.955078125, -7.6552734375, -6.35546875, -5.0556640625, -3.755859375, -2.4560546875, -1.15625, 0.1435546875, 1.443359375, 2.7431640625, 4.04296875, 5.3427734375, 6.642578125, 7.9423828125, 9.2421875, 10.5419921875, 11.841796875, 13.1416015625, 14.44140625, 15.7412109375, 17.041015625, 18.3408203125, 19.640625, 20.9404296875, 22.240234375, 23.5400390625, 24.83984375, 26.1396484375, 27.439453125, 28.7392578125, 30.0390625, 31.3388671875, 32.638671875, 33.9384765625, 35.23828125, 36.5380859375, 37.837890625, 39.1376953125, 40.4375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 8.0, 8.0, 10.0, 11.0, 19.0, 29.0, 37.0, 77.0, 161.0, 352.0, 758.0, 1098.0, 717.0, 347.0, 186.0, 91.0, 52.0, 27.0, 31.0, 10.0, 12.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8515625, -12.3248291015625, -11.798095703125, -11.2713623046875, -10.74462890625, -10.2178955078125, -9.691162109375, -9.1644287109375, -8.6376953125, -8.1109619140625, -7.584228515625, -7.0574951171875, -6.53076171875, -6.0040283203125, -5.477294921875, -4.9505615234375, -4.423828125, -3.8970947265625, -3.370361328125, -2.8436279296875, -2.31689453125, -1.7901611328125, -1.263427734375, -0.7366943359375, -0.2099609375, 0.3167724609375, 0.843505859375, 1.3702392578125, 1.89697265625, 2.4237060546875, 2.950439453125, 3.4771728515625, 4.00390625, 4.5306396484375, 5.057373046875, 5.5841064453125, 6.11083984375, 6.6375732421875, 7.164306640625, 7.6910400390625, 8.2177734375, 8.7445068359375, 9.271240234375, 9.7979736328125, 10.32470703125, 10.8514404296875, 11.378173828125, 11.9049072265625, 12.431640625, 12.9583740234375, 13.485107421875, 14.0118408203125, 14.53857421875, 15.0653076171875, 15.592041015625, 16.1187744140625, 16.6455078125, 17.1722412109375, 17.698974609375, 18.2257080078125, 18.75244140625, 19.2791748046875, 19.805908203125, 20.3326416015625, 20.859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 15.0, 26.0, 59.0, 126.0, 211.0, 250.0, 139.0, 82.0, 39.0, 21.0, 9.0, 5.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.57237243652344, -87.4019546508789, -82.23153686523438, -77.06111145019531, -71.89069366455078, -66.72027587890625, -61.54985809326172, -56.37943649291992, -51.20901870727539, -46.03860092163086, -40.86817932128906, -35.69776153564453, -30.527341842651367, -25.356922149658203, -20.186504364013672, -15.016082763671875, -9.845664978027344, -4.675245761871338, 0.49517345428466797, 5.665592193603516, 10.83601188659668, 16.006431579589844, 21.176849365234375, 26.347270965576172, 31.517688751220703, 36.688106536865234, 41.85852813720703, 47.02894592285156, 52.199363708496094, 57.36978530883789, 62.54020309448242, 67.71062469482422, 72.88104248046875, 78.05146026611328, 83.22187805175781, 88.39230346679688, 93.5627212524414, 98.73313903808594, 103.90355682373047, 109.073974609375, 114.24440002441406, 119.4148178100586, 124.58523559570312, 129.7556610107422, 134.9260711669922, 140.09649658203125, 145.26690673828125, 150.4373321533203, 155.60775756835938, 160.77818298339844, 165.94859313964844, 171.1190185546875, 176.2894287109375, 181.45985412597656, 186.63027954101562, 191.80068969726562, 196.97109985351562, 202.1415252685547, 207.3119354248047, 212.48236083984375, 217.65277099609375, 222.8231964111328, 227.99362182617188, 233.16403198242188, 238.33445739746094]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 7.0, 9.0, 8.0, 16.0, 20.0, 27.0, 37.0, 27.0, 31.0, 51.0, 39.0, 43.0, 32.0, 38.0, 40.0, 43.0, 52.0, 40.0, 41.0, 30.0, 40.0, 36.0, 28.0, 46.0, 25.0, 23.0, 22.0, 18.0, 14.0, 19.0, 26.0, 25.0, 15.0, 7.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.33277130126953, -50.580684661865234, -48.8286018371582, -47.076515197753906, -45.324432373046875, -43.57234573364258, -41.82025909423828, -40.06817626953125, -38.31608963012695, -36.564002990722656, -34.811920166015625, -33.05983352661133, -31.307748794555664, -29.5556640625, -27.803577423095703, -26.05149269104004, -24.299407958984375, -22.54732322692871, -20.795238494873047, -19.04315185546875, -17.291067123413086, -15.538982391357422, -13.786896705627441, -12.034811019897461, -10.282726287841797, -8.530641555786133, -6.778555870056152, -5.02647066116333, -3.274385452270508, -1.5223007202148438, 0.22978496551513672, 1.9818706512451172, 3.7339515686035156, 5.486036777496338, 7.23812198638916, 8.99020767211914, 10.742292404174805, 12.494377136230469, 14.24646282196045, 15.99854850769043, 17.750633239746094, 19.502717971801758, 21.254802703857422, 23.00688934326172, 24.758974075317383, 26.511058807373047, 28.263145446777344, 30.015230178833008, 31.767314910888672, 33.51940155029297, 35.271484375, 37.0235710144043, 38.775657653808594, 40.527740478515625, 42.27982711791992, 44.03191375732422, 45.78399658203125, 47.53608322143555, 49.28816604614258, 51.040252685546875, 52.792335510253906, 54.5444221496582, 56.2965087890625, 58.04859161376953, 59.80067825317383]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 8.0, 9.0, 29.0, 30.0, 47.0, 63.0, 113.0, 161.0, 258.0, 401.0, 696.0, 1206.0, 2225.0, 4420.0, 9752.0, 22509.0, 58882.0, 180495.0, 426406.0, 221468.0, 71177.0, 26108.0, 11064.0, 5112.0, 2599.0, 1309.0, 731.0, 470.0, 278.0, 180.0, 101.0, 73.0, 49.0, 38.0, 30.0, 15.0, 8.0, 7.0, 6.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.80078125, -7.5614013671875, -7.322021484375, -7.0826416015625, -6.84326171875, -6.6038818359375, -6.364501953125, -6.1251220703125, -5.8857421875, -5.6463623046875, -5.406982421875, -5.1676025390625, -4.92822265625, -4.6888427734375, -4.449462890625, -4.2100830078125, -3.970703125, -3.7313232421875, -3.491943359375, -3.2525634765625, -3.01318359375, -2.7738037109375, -2.534423828125, -2.2950439453125, -2.0556640625, -1.8162841796875, -1.576904296875, -1.3375244140625, -1.09814453125, -0.8587646484375, -0.619384765625, -0.3800048828125, -0.140625, 0.0987548828125, 0.338134765625, 0.5775146484375, 0.81689453125, 1.0562744140625, 1.295654296875, 1.5350341796875, 1.7744140625, 2.0137939453125, 2.253173828125, 2.4925537109375, 2.73193359375, 2.9713134765625, 3.210693359375, 3.4500732421875, 3.689453125, 3.9288330078125, 4.168212890625, 4.4075927734375, 4.64697265625, 4.8863525390625, 5.125732421875, 5.3651123046875, 5.6044921875, 5.8438720703125, 6.083251953125, 6.3226318359375, 6.56201171875, 6.8013916015625, 7.040771484375, 7.2801513671875, 7.51953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 9.0, 12.0, 5.0, 13.0, 17.0, 18.0, 20.0, 25.0, 30.0, 36.0, 40.0, 44.0, 41.0, 51.0, 61.0, 63.0, 51.0, 56.0, 53.0, 47.0, 47.0, 51.0, 40.0, 31.0, 22.0, 15.0, 22.0, 13.0, 17.0, 10.0, 6.0, 7.0, 4.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16015625, -5.94891357421875, -5.7376708984375, -5.52642822265625, -5.315185546875, -5.10394287109375, -4.8927001953125, -4.68145751953125, -4.47021484375, -4.25897216796875, -4.0477294921875, -3.83648681640625, -3.625244140625, -3.41400146484375, -3.2027587890625, -2.99151611328125, -2.7802734375, -2.56903076171875, -2.3577880859375, -2.14654541015625, -1.935302734375, -1.72406005859375, -1.5128173828125, -1.30157470703125, -1.09033203125, -0.87908935546875, -0.6678466796875, -0.45660400390625, -0.245361328125, -0.03411865234375, 0.1771240234375, 0.38836669921875, 0.599609375, 0.81085205078125, 1.0220947265625, 1.23333740234375, 1.444580078125, 1.65582275390625, 1.8670654296875, 2.07830810546875, 2.28955078125, 2.50079345703125, 2.7120361328125, 2.92327880859375, 3.134521484375, 3.34576416015625, 3.5570068359375, 3.76824951171875, 3.9794921875, 4.19073486328125, 4.4019775390625, 4.61322021484375, 4.824462890625, 5.03570556640625, 5.2469482421875, 5.45819091796875, 5.66943359375, 5.88067626953125, 6.0919189453125, 6.30316162109375, 6.514404296875, 6.72564697265625, 6.9368896484375, 7.14813232421875, 7.359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 0.0, 5.0, 10.0, 9.0, 19.0, 23.0, 23.0, 47.0, 49.0, 92.0, 139.0, 272.0, 480.0, 1077.0, 2712.0, 9353.0, 44958.0, 572402.0, 363785.0, 39832.0, 8552.0, 2582.0, 969.0, 476.0, 240.0, 131.0, 97.0, 71.0, 39.0, 32.0, 25.0, 13.0, 6.0, 8.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3671875, -13.8712158203125, -13.375244140625, -12.8792724609375, -12.38330078125, -11.8873291015625, -11.391357421875, -10.8953857421875, -10.3994140625, -9.9034423828125, -9.407470703125, -8.9114990234375, -8.41552734375, -7.9195556640625, -7.423583984375, -6.9276123046875, -6.431640625, -5.9356689453125, -5.439697265625, -4.9437255859375, -4.44775390625, -3.9517822265625, -3.455810546875, -2.9598388671875, -2.4638671875, -1.9678955078125, -1.471923828125, -0.9759521484375, -0.47998046875, 0.0159912109375, 0.511962890625, 1.0079345703125, 1.50390625, 1.9998779296875, 2.495849609375, 2.9918212890625, 3.48779296875, 3.9837646484375, 4.479736328125, 4.9757080078125, 5.4716796875, 5.9676513671875, 6.463623046875, 6.9595947265625, 7.45556640625, 7.9515380859375, 8.447509765625, 8.9434814453125, 9.439453125, 9.9354248046875, 10.431396484375, 10.9273681640625, 11.42333984375, 11.9193115234375, 12.415283203125, 12.9112548828125, 13.4072265625, 13.9031982421875, 14.399169921875, 14.8951416015625, 15.39111328125, 15.8870849609375, 16.383056640625, 16.8790283203125, 17.375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 12.0, 12.0, 15.0, 30.0, 26.0, 33.0, 42.0, 47.0, 52.0, 66.0, 75.0, 63.0, 84.0, 67.0, 47.0, 73.0, 39.0, 45.0, 30.0, 33.0, 24.0, 17.0, 7.0, 14.0, 6.0, 11.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-34.46875, -33.456298828125, -32.44384765625, -31.431396484375, -30.4189453125, -29.406494140625, -28.39404296875, -27.381591796875, -26.369140625, -25.356689453125, -24.34423828125, -23.331787109375, -22.3193359375, -21.306884765625, -20.29443359375, -19.281982421875, -18.26953125, -17.257080078125, -16.24462890625, -15.232177734375, -14.2197265625, -13.207275390625, -12.19482421875, -11.182373046875, -10.169921875, -9.157470703125, -8.14501953125, -7.132568359375, -6.1201171875, -5.107666015625, -4.09521484375, -3.082763671875, -2.0703125, -1.057861328125, -0.04541015625, 0.967041015625, 1.9794921875, 2.991943359375, 4.00439453125, 5.016845703125, 6.029296875, 7.041748046875, 8.05419921875, 9.066650390625, 10.0791015625, 11.091552734375, 12.10400390625, 13.116455078125, 14.12890625, 15.141357421875, 16.15380859375, 17.166259765625, 18.1787109375, 19.191162109375, 20.20361328125, 21.216064453125, 22.228515625, 23.240966796875, 24.25341796875, 25.265869140625, 26.2783203125, 27.290771484375, 28.30322265625, 29.315673828125, 30.328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 11.0, 9.0, 11.0, 19.0, 25.0, 39.0, 51.0, 57.0, 128.0, 200.0, 302.0, 503.0, 836.0, 1575.0, 3092.0, 7239.0, 20081.0, 76122.0, 693370.0, 186964.0, 36614.0, 11539.0, 4703.0, 2236.0, 1125.0, 600.0, 383.0, 226.0, 167.0, 109.0, 63.0, 42.0, 31.0, 23.0, 20.0, 8.0, 9.0, 6.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.09466552734375, -4.9041748046875, -4.71368408203125, -4.523193359375, -4.33270263671875, -4.1422119140625, -3.95172119140625, -3.76123046875, -3.57073974609375, -3.3802490234375, -3.18975830078125, -2.999267578125, -2.80877685546875, -2.6182861328125, -2.42779541015625, -2.2373046875, -2.04681396484375, -1.8563232421875, -1.66583251953125, -1.475341796875, -1.28485107421875, -1.0943603515625, -0.90386962890625, -0.71337890625, -0.52288818359375, -0.3323974609375, -0.14190673828125, 0.048583984375, 0.23907470703125, 0.4295654296875, 0.62005615234375, 0.810546875, 1.00103759765625, 1.1915283203125, 1.38201904296875, 1.572509765625, 1.76300048828125, 1.9534912109375, 2.14398193359375, 2.33447265625, 2.52496337890625, 2.7154541015625, 2.90594482421875, 3.096435546875, 3.28692626953125, 3.4774169921875, 3.66790771484375, 3.8583984375, 4.04888916015625, 4.2393798828125, 4.42987060546875, 4.620361328125, 4.81085205078125, 5.0013427734375, 5.19183349609375, 5.38232421875, 5.57281494140625, 5.7633056640625, 5.95379638671875, 6.144287109375, 6.33477783203125, 6.5252685546875, 6.71575927734375, 6.90625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 6.0, 17.0, 20.0, 25.0, 51.0, 121.0, 246.0, 256.0, 121.0, 51.0, 30.0, 12.0, 10.0, 14.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032863616943359375, -0.003168851137161255, -0.0030513405799865723, -0.0029338300228118896, -0.002816319465637207, -0.0026988089084625244, -0.002581298351287842, -0.002463787794113159, -0.0023462772369384766, -0.002228766679763794, -0.0021112561225891113, -0.0019937455654144287, -0.001876235008239746, -0.0017587244510650635, -0.0016412138938903809, -0.0015237033367156982, -0.0014061927795410156, -0.001288682222366333, -0.0011711716651916504, -0.0010536611080169678, -0.0009361505508422852, -0.0008186399936676025, -0.0007011294364929199, -0.0005836188793182373, -0.0004661083221435547, -0.00034859776496887207, -0.00023108720779418945, -0.00011357665061950684, 3.933906555175781e-06, 0.0001214444637298584, 0.00023895502090454102, 0.00035646557807922363, 0.00047397613525390625, 0.0005914866924285889, 0.0007089972496032715, 0.0008265078067779541, 0.0009440183639526367, 0.0010615289211273193, 0.001179039478302002, 0.0012965500354766846, 0.0014140605926513672, 0.0015315711498260498, 0.0016490817070007324, 0.001766592264175415, 0.0018841028213500977, 0.0020016133785247803, 0.002119123935699463, 0.0022366344928741455, 0.002354145050048828, 0.0024716556072235107, 0.0025891661643981934, 0.002706676721572876, 0.0028241872787475586, 0.002941697835922241, 0.003059208393096924, 0.0031767189502716064, 0.003294229507446289, 0.0034117400646209717, 0.0035292506217956543, 0.003646761178970337, 0.0037642717361450195, 0.003881782293319702, 0.003999292850494385, 0.004116803407669067, 0.00423431396484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 6.0, 4.0, 6.0, 7.0, 17.0, 20.0, 37.0, 44.0, 67.0, 107.0, 204.0, 313.0, 648.0, 1312.0, 2936.0, 7640.0, 24363.0, 123091.0, 763814.0, 92124.0, 20221.0, 6433.0, 2609.0, 1125.0, 587.0, 290.0, 194.0, 113.0, 74.0, 39.0, 35.0, 19.0, 21.0, 16.0, 6.0, 4.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56640625, -7.33306884765625, -7.0997314453125, -6.86639404296875, -6.633056640625, -6.39971923828125, -6.1663818359375, -5.93304443359375, -5.69970703125, -5.46636962890625, -5.2330322265625, -4.99969482421875, -4.766357421875, -4.53302001953125, -4.2996826171875, -4.06634521484375, -3.8330078125, -3.59967041015625, -3.3663330078125, -3.13299560546875, -2.899658203125, -2.66632080078125, -2.4329833984375, -2.19964599609375, -1.96630859375, -1.73297119140625, -1.4996337890625, -1.26629638671875, -1.032958984375, -0.79962158203125, -0.5662841796875, -0.33294677734375, -0.099609375, 0.13372802734375, 0.3670654296875, 0.60040283203125, 0.833740234375, 1.06707763671875, 1.3004150390625, 1.53375244140625, 1.76708984375, 2.00042724609375, 2.2337646484375, 2.46710205078125, 2.700439453125, 2.93377685546875, 3.1671142578125, 3.40045166015625, 3.6337890625, 3.86712646484375, 4.1004638671875, 4.33380126953125, 4.567138671875, 4.80047607421875, 5.0338134765625, 5.26715087890625, 5.50048828125, 5.73382568359375, 5.9671630859375, 6.20050048828125, 6.433837890625, 6.66717529296875, 6.9005126953125, 7.13385009765625, 7.3671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 6.0, 9.0, 14.0, 16.0, 19.0, 39.0, 55.0, 75.0, 107.0, 139.0, 156.0, 96.0, 76.0, 53.0, 28.0, 29.0, 21.0, 16.0, 9.0, 7.0, 5.0, 2.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.28125, -7.0230712890625, -6.764892578125, -6.5067138671875, -6.24853515625, -5.9903564453125, -5.732177734375, -5.4739990234375, -5.2158203125, -4.9576416015625, -4.699462890625, -4.4412841796875, -4.18310546875, -3.9249267578125, -3.666748046875, -3.4085693359375, -3.150390625, -2.8922119140625, -2.634033203125, -2.3758544921875, -2.11767578125, -1.8594970703125, -1.601318359375, -1.3431396484375, -1.0849609375, -0.8267822265625, -0.568603515625, -0.3104248046875, -0.05224609375, 0.2059326171875, 0.464111328125, 0.7222900390625, 0.98046875, 1.2386474609375, 1.496826171875, 1.7550048828125, 2.01318359375, 2.2713623046875, 2.529541015625, 2.7877197265625, 3.0458984375, 3.3040771484375, 3.562255859375, 3.8204345703125, 4.07861328125, 4.3367919921875, 4.594970703125, 4.8531494140625, 5.111328125, 5.3695068359375, 5.627685546875, 5.8858642578125, 6.14404296875, 6.4022216796875, 6.660400390625, 6.9185791015625, 7.1767578125, 7.4349365234375, 7.693115234375, 7.9512939453125, 8.20947265625, 8.4676513671875, 8.725830078125, 8.9840087890625, 9.2421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 12.0, 17.0, 70.0, 107.0, 211.0, 321.0, 129.0, 58.0, 26.0, 14.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.88392639160156, -160.7493133544922, -155.6147003173828, -150.4801025390625, -145.34548950195312, -140.21087646484375, -135.07626342773438, -129.941650390625, -124.80704498291016, -119.67243194580078, -114.53782653808594, -109.40321350097656, -104.26860046386719, -99.13399505615234, -93.99938201904297, -88.86477661132812, -83.73016357421875, -78.59555053710938, -73.46094512939453, -68.32633209228516, -63.19172286987305, -58.05711364746094, -52.92250061035156, -47.78789138793945, -42.653282165527344, -37.518672943115234, -32.384063720703125, -27.24945068359375, -22.11484146118164, -16.98023223876953, -11.845621109008789, -6.711009979248047, -1.576385498046875, 3.558224678039551, 8.692834854125977, 13.827445030212402, 18.962055206298828, 24.096664428710938, 29.23127555847168, 34.36588668823242, 39.50049591064453, 44.63510513305664, 49.76971435546875, 54.904327392578125, 60.038936614990234, 65.17354583740234, 70.30815887451172, 75.44276428222656, 80.57737731933594, 85.71199035644531, 90.84659576416016, 95.98120880126953, 101.11581420898438, 106.25042724609375, 111.38504028320312, 116.5196533203125, 121.65425872802734, 126.78887176513672, 131.92347717285156, 137.05809020996094, 142.1927032470703, 147.32730102539062, 152.4619140625, 157.59652709960938, 162.73114013671875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 4.0, 3.0, 7.0, 5.0, 8.0, 8.0, 13.0, 7.0, 4.0, 7.0, 16.0, 12.0, 17.0, 23.0, 18.0, 20.0, 28.0, 27.0, 40.0, 45.0, 53.0, 86.0, 92.0, 80.0, 65.0, 29.0, 25.0, 30.0, 31.0, 28.0, 24.0, 17.0, 15.0, 13.0, 19.0, 12.0, 12.0, 10.0, 13.0, 14.0, 10.0, 0.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.20503234863281, -82.51416778564453, -79.82330322265625, -77.13243865966797, -74.44157409667969, -71.75070190429688, -69.0598373413086, -66.36897277832031, -63.67810821533203, -60.98724365234375, -58.29637908935547, -55.60551071166992, -52.91464614868164, -50.22378158569336, -47.53291320800781, -44.84204864501953, -42.15118408203125, -39.46031951904297, -36.76945495605469, -34.07858657836914, -31.38772201538086, -28.696857452392578, -26.005990982055664, -23.31512451171875, -20.62425994873047, -17.933395385742188, -15.242528915405273, -12.551663398742676, -9.860797882080078, -7.1699323654174805, -4.479066848754883, -1.7882003784179688, 0.9026718139648438, 3.5935373306274414, 6.284402847290039, 8.975268363952637, 11.666133880615234, 14.356999397277832, 17.04786491394043, 19.738731384277344, 22.429595947265625, 25.120460510253906, 27.81132698059082, 30.502193450927734, 33.193058013916016, 35.8839225769043, 38.574790954589844, 41.265655517578125, 43.956520080566406, 46.64738464355469, 49.33824920654297, 52.029117584228516, 54.7199821472168, 57.41084671020508, 60.101715087890625, 62.792579650878906, 65.48344421386719, 68.17430877685547, 70.86517333984375, 73.55603790283203, 76.24690246582031, 78.93777465820312, 81.6286392211914, 84.31950378417969, 87.01036834716797]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 8.0, 5.0, 11.0, 5.0, 16.0, 24.0, 29.0, 49.0, 46.0, 68.0, 121.0, 150.0, 214.0, 249.0, 396.0, 623.0, 918.0, 1517.0, 3490.0, 11432.0, 95589.0, 2347928.0, 1642530.0, 71985.0, 9806.0, 3009.0, 1454.0, 827.0, 491.0, 350.0, 256.0, 185.0, 122.0, 98.0, 67.0, 41.0, 51.0, 25.0, 30.0, 24.0, 12.0, 7.0, 7.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.7265625, -12.301513671875, -11.87646484375, -11.451416015625, -11.0263671875, -10.601318359375, -10.17626953125, -9.751220703125, -9.326171875, -8.901123046875, -8.47607421875, -8.051025390625, -7.6259765625, -7.200927734375, -6.77587890625, -6.350830078125, -5.92578125, -5.500732421875, -5.07568359375, -4.650634765625, -4.2255859375, -3.800537109375, -3.37548828125, -2.950439453125, -2.525390625, -2.100341796875, -1.67529296875, -1.250244140625, -0.8251953125, -0.400146484375, 0.02490234375, 0.449951171875, 0.875, 1.300048828125, 1.72509765625, 2.150146484375, 2.5751953125, 3.000244140625, 3.42529296875, 3.850341796875, 4.275390625, 4.700439453125, 5.12548828125, 5.550537109375, 5.9755859375, 6.400634765625, 6.82568359375, 7.250732421875, 7.67578125, 8.100830078125, 8.52587890625, 8.950927734375, 9.3759765625, 9.801025390625, 10.22607421875, 10.651123046875, 11.076171875, 11.501220703125, 11.92626953125, 12.351318359375, 12.7763671875, 13.201416015625, 13.62646484375, 14.051513671875, 14.4765625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 4.0, 7.0, 13.0, 13.0, 11.0, 11.0, 21.0, 21.0, 17.0, 14.0, 39.0, 31.0, 37.0, 52.0, 38.0, 43.0, 37.0, 54.0, 33.0, 53.0, 47.0, 52.0, 35.0, 37.0, 35.0, 29.0, 31.0, 18.0, 24.0, 20.0, 20.0, 14.0, 18.0, 12.0, 10.0, 3.0, 10.0, 4.0, 6.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.9921875, -5.818603515625, -5.64501953125, -5.471435546875, -5.2978515625, -5.124267578125, -4.95068359375, -4.777099609375, -4.603515625, -4.429931640625, -4.25634765625, -4.082763671875, -3.9091796875, -3.735595703125, -3.56201171875, -3.388427734375, -3.21484375, -3.041259765625, -2.86767578125, -2.694091796875, -2.5205078125, -2.346923828125, -2.17333984375, -1.999755859375, -1.826171875, -1.652587890625, -1.47900390625, -1.305419921875, -1.1318359375, -0.958251953125, -0.78466796875, -0.611083984375, -0.4375, -0.263916015625, -0.09033203125, 0.083251953125, 0.2568359375, 0.430419921875, 0.60400390625, 0.777587890625, 0.951171875, 1.124755859375, 1.29833984375, 1.471923828125, 1.6455078125, 1.819091796875, 1.99267578125, 2.166259765625, 2.33984375, 2.513427734375, 2.68701171875, 2.860595703125, 3.0341796875, 3.207763671875, 3.38134765625, 3.554931640625, 3.728515625, 3.902099609375, 4.07568359375, 4.249267578125, 4.4228515625, 4.596435546875, 4.77001953125, 4.943603515625, 5.1171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 15.0, 33.0, 56.0, 109.0, 255.0, 980.0, 47637.0, 4142188.0, 2434.0, 316.0, 138.0, 57.0, 29.0, 18.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.5, -95.9716796875, -92.443359375, -88.9150390625, -85.38671875, -81.8583984375, -78.330078125, -74.8017578125, -71.2734375, -67.7451171875, -64.216796875, -60.6884765625, -57.16015625, -53.6318359375, -50.103515625, -46.5751953125, -43.046875, -39.5185546875, -35.990234375, -32.4619140625, -28.93359375, -25.4052734375, -21.876953125, -18.3486328125, -14.8203125, -11.2919921875, -7.763671875, -4.2353515625, -0.70703125, 2.8212890625, 6.349609375, 9.8779296875, 13.40625, 16.9345703125, 20.462890625, 23.9912109375, 27.51953125, 31.0478515625, 34.576171875, 38.1044921875, 41.6328125, 45.1611328125, 48.689453125, 52.2177734375, 55.74609375, 59.2744140625, 62.802734375, 66.3310546875, 69.859375, 73.3876953125, 76.916015625, 80.4443359375, 83.97265625, 87.5009765625, 91.029296875, 94.5576171875, 98.0859375, 101.6142578125, 105.142578125, 108.6708984375, 112.19921875, 115.7275390625, 119.255859375, 122.7841796875, 126.3125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 17.0, 30.0, 58.0, 139.0, 411.0, 1449.0, 1320.0, 417.0, 126.0, 37.0, 29.0, 11.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-49.0, -47.955810546875, -46.91162109375, -45.867431640625, -44.8232421875, -43.779052734375, -42.73486328125, -41.690673828125, -40.646484375, -39.602294921875, -38.55810546875, -37.513916015625, -36.4697265625, -35.425537109375, -34.38134765625, -33.337158203125, -32.29296875, -31.248779296875, -30.20458984375, -29.160400390625, -28.1162109375, -27.072021484375, -26.02783203125, -24.983642578125, -23.939453125, -22.895263671875, -21.85107421875, -20.806884765625, -19.7626953125, -18.718505859375, -17.67431640625, -16.630126953125, -15.5859375, -14.541748046875, -13.49755859375, -12.453369140625, -11.4091796875, -10.364990234375, -9.32080078125, -8.276611328125, -7.232421875, -6.188232421875, -5.14404296875, -4.099853515625, -3.0556640625, -2.011474609375, -0.96728515625, 0.076904296875, 1.12109375, 2.165283203125, 3.20947265625, 4.253662109375, 5.2978515625, 6.342041015625, 7.38623046875, 8.430419921875, 9.474609375, 10.518798828125, 11.56298828125, 12.607177734375, 13.6513671875, 14.695556640625, 15.73974609375, 16.783935546875, 17.828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 9.0, 17.0, 25.0, 41.0, 79.0, 178.0, 272.0, 209.0, 89.0, 40.0, 17.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-386.29156494140625, -378.1650695800781, -370.0385437011719, -361.91204833984375, -353.7855224609375, -345.6590270996094, -337.53253173828125, -329.406005859375, -321.2795104980469, -313.15301513671875, -305.0264892578125, -296.8999938964844, -288.77349853515625, -280.64697265625, -272.5204772949219, -264.3939514160156, -256.2674560546875, -248.1409454345703, -240.01443481445312, -231.887939453125, -223.7614288330078, -215.63491821289062, -207.5084228515625, -199.3819122314453, -191.25540161132812, -183.12889099121094, -175.00238037109375, -166.87588500976562, -158.74937438964844, -150.62286376953125, -142.49636840820312, -134.36985778808594, -126.24331665039062, -118.11680603027344, -109.99030303955078, -101.86380004882812, -93.73728942871094, -85.61077880859375, -77.4842758178711, -69.35777282714844, -61.23126220703125, -53.10475540161133, -44.978248596191406, -36.851741790771484, -28.725234985351562, -20.59872817993164, -12.472221374511719, -4.345714569091797, 3.780792236328125, 11.907299041748047, 20.03380584716797, 28.16031265258789, 36.28681945800781, 44.413326263427734, 52.539833068847656, 60.66633987426758, 68.7928466796875, 76.91935729980469, 85.04586029052734, 93.17236328125, 101.29887390136719, 109.42538452148438, 117.55188751220703, 125.67839050292969, 133.80490112304688]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 1.0, 4.0, 4.0, 3.0, 3.0, 6.0, 3.0, 13.0, 19.0, 10.0, 13.0, 25.0, 15.0, 25.0, 38.0, 26.0, 57.0, 40.0, 51.0, 58.0, 65.0, 53.0, 50.0, 44.0, 47.0, 44.0, 43.0, 42.0, 24.0, 32.0, 30.0, 22.0, 14.0, 14.0, 14.0, 8.0, 9.0, 6.0, 10.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.1110954284668, -59.762718200683594, -57.414337158203125, -55.065956115722656, -52.71757888793945, -50.36920166015625, -48.02082061767578, -45.67243957519531, -43.32406234741211, -40.975685119628906, -38.62730407714844, -36.27892303466797, -33.930545806884766, -31.58216667175293, -29.233787536621094, -26.885408401489258, -24.537029266357422, -22.188650131225586, -19.84027099609375, -17.491891860961914, -15.143512725830078, -12.795133590698242, -10.446754455566406, -8.09837532043457, -5.749996185302734, -3.4016170501708984, -1.0532379150390625, 1.2951412200927734, 3.6435203552246094, 5.991899490356445, 8.340278625488281, 10.688657760620117, 13.037033081054688, 15.385412216186523, 17.73379135131836, 20.082170486450195, 22.43054962158203, 24.778928756713867, 27.127307891845703, 29.47568702697754, 31.824066162109375, 34.172447204589844, 36.52082443237305, 38.86920166015625, 41.21758270263672, 43.56596374511719, 45.91434097290039, 48.262718200683594, 50.61109924316406, 52.95948028564453, 55.307857513427734, 57.65623474121094, 60.004615783691406, 62.352996826171875, 64.70137023925781, 67.04975128173828, 69.39813232421875, 71.74651336669922, 74.09489440917969, 76.44326782226562, 78.7916488647461, 81.14002990722656, 83.4884033203125, 85.83678436279297, 88.18516540527344]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 2.0, 14.0, 15.0, 17.0, 24.0, 29.0, 38.0, 70.0, 126.0, 192.0, 293.0, 449.0, 867.0, 1513.0, 2786.0, 5390.0, 11458.0, 26175.0, 66154.0, 188627.0, 410748.0, 208442.0, 71656.0, 28648.0, 12468.0, 5798.0, 2807.0, 1502.0, 863.0, 490.0, 311.0, 193.0, 112.0, 87.0, 54.0, 44.0, 26.0, 22.0, 11.0, 9.0, 4.0, 8.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.7265625, -7.4962158203125, -7.265869140625, -7.0355224609375, -6.80517578125, -6.5748291015625, -6.344482421875, -6.1141357421875, -5.8837890625, -5.6534423828125, -5.423095703125, -5.1927490234375, -4.96240234375, -4.7320556640625, -4.501708984375, -4.2713623046875, -4.041015625, -3.8106689453125, -3.580322265625, -3.3499755859375, -3.11962890625, -2.8892822265625, -2.658935546875, -2.4285888671875, -2.1982421875, -1.9678955078125, -1.737548828125, -1.5072021484375, -1.27685546875, -1.0465087890625, -0.816162109375, -0.5858154296875, -0.35546875, -0.1251220703125, 0.105224609375, 0.3355712890625, 0.56591796875, 0.7962646484375, 1.026611328125, 1.2569580078125, 1.4873046875, 1.7176513671875, 1.947998046875, 2.1783447265625, 2.40869140625, 2.6390380859375, 2.869384765625, 3.0997314453125, 3.330078125, 3.5604248046875, 3.790771484375, 4.0211181640625, 4.25146484375, 4.4818115234375, 4.712158203125, 4.9425048828125, 5.1728515625, 5.4031982421875, 5.633544921875, 5.8638916015625, 6.09423828125, 6.3245849609375, 6.554931640625, 6.7852783203125, 7.015625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 2.0, 4.0, 3.0, 10.0, 8.0, 11.0, 11.0, 14.0, 20.0, 27.0, 25.0, 26.0, 35.0, 45.0, 36.0, 44.0, 43.0, 45.0, 36.0, 49.0, 46.0, 45.0, 37.0, 55.0, 41.0, 30.0, 48.0, 34.0, 28.0, 26.0, 18.0, 12.0, 16.0, 17.0, 11.0, 12.0, 5.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.4453125, -6.22857666015625, -6.0118408203125, -5.79510498046875, -5.578369140625, -5.36163330078125, -5.1448974609375, -4.92816162109375, -4.71142578125, -4.49468994140625, -4.2779541015625, -4.06121826171875, -3.844482421875, -3.62774658203125, -3.4110107421875, -3.19427490234375, -2.9775390625, -2.76080322265625, -2.5440673828125, -2.32733154296875, -2.110595703125, -1.89385986328125, -1.6771240234375, -1.46038818359375, -1.24365234375, -1.02691650390625, -0.8101806640625, -0.59344482421875, -0.376708984375, -0.15997314453125, 0.0567626953125, 0.27349853515625, 0.490234375, 0.70697021484375, 0.9237060546875, 1.14044189453125, 1.357177734375, 1.57391357421875, 1.7906494140625, 2.00738525390625, 2.22412109375, 2.44085693359375, 2.6575927734375, 2.87432861328125, 3.091064453125, 3.30780029296875, 3.5245361328125, 3.74127197265625, 3.9580078125, 4.17474365234375, 4.3914794921875, 4.60821533203125, 4.824951171875, 5.04168701171875, 5.2584228515625, 5.47515869140625, 5.69189453125, 5.90863037109375, 6.1253662109375, 6.34210205078125, 6.558837890625, 6.77557373046875, 6.9923095703125, 7.20904541015625, 7.42578125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 9.0, 3.0, 13.0, 10.0, 19.0, 19.0, 32.0, 28.0, 31.0, 69.0, 109.0, 146.0, 280.0, 448.0, 939.0, 2127.0, 6213.0, 23792.0, 162689.0, 765563.0, 65708.0, 13128.0, 3986.0, 1493.0, 697.0, 372.0, 199.0, 118.0, 77.0, 48.0, 51.0, 37.0, 19.0, 21.0, 16.0, 9.0, 6.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.640625, -17.076904296875, -16.51318359375, -15.949462890625, -15.3857421875, -14.822021484375, -14.25830078125, -13.694580078125, -13.130859375, -12.567138671875, -12.00341796875, -11.439697265625, -10.8759765625, -10.312255859375, -9.74853515625, -9.184814453125, -8.62109375, -8.057373046875, -7.49365234375, -6.929931640625, -6.3662109375, -5.802490234375, -5.23876953125, -4.675048828125, -4.111328125, -3.547607421875, -2.98388671875, -2.420166015625, -1.8564453125, -1.292724609375, -0.72900390625, -0.165283203125, 0.3984375, 0.962158203125, 1.52587890625, 2.089599609375, 2.6533203125, 3.217041015625, 3.78076171875, 4.344482421875, 4.908203125, 5.471923828125, 6.03564453125, 6.599365234375, 7.1630859375, 7.726806640625, 8.29052734375, 8.854248046875, 9.41796875, 9.981689453125, 10.54541015625, 11.109130859375, 11.6728515625, 12.236572265625, 12.80029296875, 13.364013671875, 13.927734375, 14.491455078125, 15.05517578125, 15.618896484375, 16.1826171875, 16.746337890625, 17.31005859375, 17.873779296875, 18.4375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 6.0, 2.0, 2.0, 6.0, 12.0, 12.0, 8.0, 13.0, 17.0, 22.0, 24.0, 35.0, 32.0, 37.0, 45.0, 59.0, 50.0, 62.0, 52.0, 63.0, 57.0, 52.0, 44.0, 43.0, 55.0, 25.0, 31.0, 30.0, 11.0, 23.0, 10.0, 7.0, 8.0, 6.0, 11.0, 3.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.46875, -29.48046875, -28.4921875, -27.50390625, -26.515625, -25.52734375, -24.5390625, -23.55078125, -22.5625, -21.57421875, -20.5859375, -19.59765625, -18.609375, -17.62109375, -16.6328125, -15.64453125, -14.65625, -13.66796875, -12.6796875, -11.69140625, -10.703125, -9.71484375, -8.7265625, -7.73828125, -6.75, -5.76171875, -4.7734375, -3.78515625, -2.796875, -1.80859375, -0.8203125, 0.16796875, 1.15625, 2.14453125, 3.1328125, 4.12109375, 5.109375, 6.09765625, 7.0859375, 8.07421875, 9.0625, 10.05078125, 11.0390625, 12.02734375, 13.015625, 14.00390625, 14.9921875, 15.98046875, 16.96875, 17.95703125, 18.9453125, 19.93359375, 20.921875, 21.91015625, 22.8984375, 23.88671875, 24.875, 25.86328125, 26.8515625, 27.83984375, 28.828125, 29.81640625, 30.8046875, 31.79296875, 32.78125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 11.0, 13.0, 29.0, 71.0, 229.0, 730.0, 4150.0, 66712.0, 948434.0, 25047.0, 2322.0, 497.0, 154.0, 62.0, 34.0, 15.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0625, -10.626220703125, -10.18994140625, -9.753662109375, -9.3173828125, -8.881103515625, -8.44482421875, -8.008544921875, -7.572265625, -7.135986328125, -6.69970703125, -6.263427734375, -5.8271484375, -5.390869140625, -4.95458984375, -4.518310546875, -4.08203125, -3.645751953125, -3.20947265625, -2.773193359375, -2.3369140625, -1.900634765625, -1.46435546875, -1.028076171875, -0.591796875, -0.155517578125, 0.28076171875, 0.717041015625, 1.1533203125, 1.589599609375, 2.02587890625, 2.462158203125, 2.8984375, 3.334716796875, 3.77099609375, 4.207275390625, 4.6435546875, 5.079833984375, 5.51611328125, 5.952392578125, 6.388671875, 6.824951171875, 7.26123046875, 7.697509765625, 8.1337890625, 8.570068359375, 9.00634765625, 9.442626953125, 9.87890625, 10.315185546875, 10.75146484375, 11.187744140625, 11.6240234375, 12.060302734375, 12.49658203125, 12.932861328125, 13.369140625, 13.805419921875, 14.24169921875, 14.677978515625, 15.1142578125, 15.550537109375, 15.98681640625, 16.423095703125, 16.859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 14.0, 19.0, 18.0, 12.0, 27.0, 55.0, 55.0, 98.0, 152.0, 178.0, 116.0, 80.0, 55.0, 32.0, 21.0, 15.0, 21.0, 10.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.00232696533203125, -0.002271801233291626, -0.002216637134552002, -0.002161473035812378, -0.002106308937072754, -0.00205114483833313, -0.001995980739593506, -0.0019408166408538818, -0.0018856525421142578, -0.0018304884433746338, -0.0017753243446350098, -0.0017201602458953857, -0.0016649961471557617, -0.0016098320484161377, -0.0015546679496765137, -0.0014995038509368896, -0.0014443397521972656, -0.0013891756534576416, -0.0013340115547180176, -0.0012788474559783936, -0.0012236833572387695, -0.0011685192584991455, -0.0011133551597595215, -0.0010581910610198975, -0.0010030269622802734, -0.0009478628635406494, -0.0008926987648010254, -0.0008375346660614014, -0.0007823705673217773, -0.0007272064685821533, -0.0006720423698425293, -0.0006168782711029053, -0.0005617141723632812, -0.0005065500736236572, -0.0004513859748840332, -0.0003962218761444092, -0.00034105777740478516, -0.00028589367866516113, -0.0002307295799255371, -0.00017556548118591309, -0.00012040138244628906, -6.523728370666504e-05, -1.0073184967041016e-05, 4.509091377258301e-05, 0.00010025501251220703, 0.00015541911125183105, 0.00021058320999145508, 0.0002657473087310791, 0.0003209114074707031, 0.00037607550621032715, 0.00043123960494995117, 0.0004864037036895752, 0.0005415678024291992, 0.0005967319011688232, 0.0006518959999084473, 0.0007070600986480713, 0.0007622241973876953, 0.0008173882961273193, 0.0008725523948669434, 0.0009277164936065674, 0.0009828805923461914, 0.0010380446910858154, 0.0010932087898254395, 0.0011483728885650635, 0.0012035369873046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 10.0, 17.0, 41.0, 68.0, 140.0, 351.0, 1175.0, 6971.0, 172398.0, 849620.0, 15030.0, 1838.0, 504.0, 200.0, 85.0, 37.0, 29.0, 12.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.53125, -12.086181640625, -11.64111328125, -11.196044921875, -10.7509765625, -10.305908203125, -9.86083984375, -9.415771484375, -8.970703125, -8.525634765625, -8.08056640625, -7.635498046875, -7.1904296875, -6.745361328125, -6.30029296875, -5.855224609375, -5.41015625, -4.965087890625, -4.52001953125, -4.074951171875, -3.6298828125, -3.184814453125, -2.73974609375, -2.294677734375, -1.849609375, -1.404541015625, -0.95947265625, -0.514404296875, -0.0693359375, 0.375732421875, 0.82080078125, 1.265869140625, 1.7109375, 2.156005859375, 2.60107421875, 3.046142578125, 3.4912109375, 3.936279296875, 4.38134765625, 4.826416015625, 5.271484375, 5.716552734375, 6.16162109375, 6.606689453125, 7.0517578125, 7.496826171875, 7.94189453125, 8.386962890625, 8.83203125, 9.277099609375, 9.72216796875, 10.167236328125, 10.6123046875, 11.057373046875, 11.50244140625, 11.947509765625, 12.392578125, 12.837646484375, 13.28271484375, 13.727783203125, 14.1728515625, 14.617919921875, 15.06298828125, 15.508056640625, 15.953125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 5.0, 8.0, 10.0, 14.0, 21.0, 39.0, 51.0, 97.0, 139.0, 186.0, 174.0, 93.0, 60.0, 28.0, 27.0, 14.0, 12.0, 6.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2734375, -6.9638671875, -6.654296875, -6.3447265625, -6.03515625, -5.7255859375, -5.416015625, -5.1064453125, -4.796875, -4.4873046875, -4.177734375, -3.8681640625, -3.55859375, -3.2490234375, -2.939453125, -2.6298828125, -2.3203125, -2.0107421875, -1.701171875, -1.3916015625, -1.08203125, -0.7724609375, -0.462890625, -0.1533203125, 0.15625, 0.4658203125, 0.775390625, 1.0849609375, 1.39453125, 1.7041015625, 2.013671875, 2.3232421875, 2.6328125, 2.9423828125, 3.251953125, 3.5615234375, 3.87109375, 4.1806640625, 4.490234375, 4.7998046875, 5.109375, 5.4189453125, 5.728515625, 6.0380859375, 6.34765625, 6.6572265625, 6.966796875, 7.2763671875, 7.5859375, 7.8955078125, 8.205078125, 8.5146484375, 8.82421875, 9.1337890625, 9.443359375, 9.7529296875, 10.0625, 10.3720703125, 10.681640625, 10.9912109375, 11.30078125, 11.6103515625, 11.919921875, 12.2294921875, 12.5390625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 51.0, 212.0, 559.0, 133.0, 27.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-357.4536437988281, -345.2993469238281, -333.1450500488281, -320.9907531738281, -308.8364562988281, -296.6821594238281, -284.52789306640625, -272.37359619140625, -260.21929931640625, -248.06500244140625, -235.91070556640625, -223.75640869140625, -211.60211181640625, -199.44781494140625, -187.2935333251953, -175.1392364501953, -162.98492431640625, -150.83062744140625, -138.67633056640625, -126.52204132080078, -114.36774444580078, -102.21344757080078, -90.05915832519531, -77.90486145019531, -65.75056457519531, -53.59626770019531, -41.44197463989258, -29.287681579589844, -17.133384704589844, -4.979087829589844, 7.175201416015625, 19.329498291015625, 31.483795166015625, 43.638092041015625, 55.79238510131836, 67.9466781616211, 80.1009750366211, 92.2552719116211, 104.40956115722656, 116.56385803222656, 128.71815490722656, 140.87245178222656, 153.02674865722656, 165.1810302734375, 177.3353271484375, 189.4896240234375, 201.6439208984375, 213.7982177734375, 225.9525146484375, 238.1068115234375, 250.2611083984375, 262.4154052734375, 274.5697021484375, 286.7239990234375, 298.8782958984375, 311.0325927734375, 323.1868896484375, 335.3411865234375, 347.4954833984375, 359.6497802734375, 371.8040771484375, 383.9583740234375, 396.1126708984375, 408.2669677734375, 420.4212341308594]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 5.0, 3.0, 4.0, 4.0, 6.0, 11.0, 5.0, 14.0, 7.0, 18.0, 14.0, 16.0, 18.0, 16.0, 28.0, 30.0, 34.0, 35.0, 42.0, 89.0, 160.0, 83.0, 57.0, 39.0, 43.0, 33.0, 27.0, 27.0, 20.0, 13.0, 16.0, 18.0, 12.0, 15.0, 10.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.95846557617188, -127.90067291259766, -123.8428726196289, -119.78507995605469, -115.72727966308594, -111.66948699951172, -107.6116943359375, -103.55389404296875, -99.49609375, -95.43830108642578, -91.38050079345703, -87.32270812988281, -83.26490783691406, -79.20711517333984, -75.14932250976562, -71.09152221679688, -67.03372955322266, -62.97593307495117, -58.91813659667969, -54.86034393310547, -50.80254364013672, -46.7447509765625, -42.686954498291016, -38.62915802001953, -34.57136154174805, -30.513565063476562, -26.455768585205078, -22.397974014282227, -18.340177536010742, -14.282381057739258, -10.224586486816406, -6.166790008544922, -2.1089859008789062, 1.94881010055542, 6.006606101989746, 10.064401626586914, 14.122198104858398, 18.179994583129883, 22.237789154052734, 26.29558563232422, 30.353382110595703, 34.41117858886719, 38.46897506713867, 42.526771545410156, 46.584564208984375, 50.642364501953125, 54.700157165527344, 58.75795364379883, 62.81575012207031, 66.87354278564453, 70.93134307861328, 74.9891357421875, 79.04693603515625, 83.10472869873047, 87.16252136230469, 91.22032165527344, 95.27812194824219, 99.3359146118164, 103.39371490478516, 107.45150756835938, 111.50930786132812, 115.56710052490234, 119.62489318847656, 123.68269348144531, 127.74048614501953]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 7.0, 7.0, 12.0, 15.0, 17.0, 31.0, 33.0, 41.0, 60.0, 66.0, 120.0, 167.0, 293.0, 568.0, 1312.0, 3466.0, 13038.0, 123960.0, 2451229.0, 1509959.0, 74584.0, 10021.0, 2867.0, 1098.0, 518.0, 275.0, 158.0, 94.0, 67.0, 59.0, 37.0, 27.0, 25.0, 13.0, 14.0, 8.0, 9.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.25, -21.612548828125, -20.97509765625, -20.337646484375, -19.7001953125, -19.062744140625, -18.42529296875, -17.787841796875, -17.150390625, -16.512939453125, -15.87548828125, -15.238037109375, -14.6005859375, -13.963134765625, -13.32568359375, -12.688232421875, -12.05078125, -11.413330078125, -10.77587890625, -10.138427734375, -9.5009765625, -8.863525390625, -8.22607421875, -7.588623046875, -6.951171875, -6.313720703125, -5.67626953125, -5.038818359375, -4.4013671875, -3.763916015625, -3.12646484375, -2.489013671875, -1.8515625, -1.214111328125, -0.57666015625, 0.060791015625, 0.6982421875, 1.335693359375, 1.97314453125, 2.610595703125, 3.248046875, 3.885498046875, 4.52294921875, 5.160400390625, 5.7978515625, 6.435302734375, 7.07275390625, 7.710205078125, 8.34765625, 8.985107421875, 9.62255859375, 10.260009765625, 10.8974609375, 11.534912109375, 12.17236328125, 12.809814453125, 13.447265625, 14.084716796875, 14.72216796875, 15.359619140625, 15.9970703125, 16.634521484375, 17.27197265625, 17.909423828125, 18.546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 11.0, 5.0, 13.0, 13.0, 20.0, 35.0, 27.0, 24.0, 46.0, 39.0, 52.0, 52.0, 53.0, 56.0, 60.0, 62.0, 70.0, 70.0, 45.0, 26.0, 43.0, 43.0, 37.0, 31.0, 13.0, 16.0, 7.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.3546142578125, -9.092041015625, -8.8294677734375, -8.56689453125, -8.3043212890625, -8.041748046875, -7.7791748046875, -7.5166015625, -7.2540283203125, -6.991455078125, -6.7288818359375, -6.46630859375, -6.2037353515625, -5.941162109375, -5.6785888671875, -5.416015625, -5.1534423828125, -4.890869140625, -4.6282958984375, -4.36572265625, -4.1031494140625, -3.840576171875, -3.5780029296875, -3.3154296875, -3.0528564453125, -2.790283203125, -2.5277099609375, -2.26513671875, -2.0025634765625, -1.739990234375, -1.4774169921875, -1.21484375, -0.9522705078125, -0.689697265625, -0.4271240234375, -0.16455078125, 0.0980224609375, 0.360595703125, 0.6231689453125, 0.8857421875, 1.1483154296875, 1.410888671875, 1.6734619140625, 1.93603515625, 2.1986083984375, 2.461181640625, 2.7237548828125, 2.986328125, 3.2489013671875, 3.511474609375, 3.7740478515625, 4.03662109375, 4.2991943359375, 4.561767578125, 4.8243408203125, 5.0869140625, 5.3494873046875, 5.612060546875, 5.8746337890625, 6.13720703125, 6.3997802734375, 6.662353515625, 6.9249267578125, 7.1875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 3.0, 10.0, 11.0, 15.0, 21.0, 33.0, 71.0, 111.0, 221.0, 441.0, 1110.0, 4686.0, 109177.0, 4052202.0, 21803.0, 2676.0, 843.0, 369.0, 186.0, 98.0, 60.0, 46.0, 23.0, 17.0, 18.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.15625, -52.09716796875, -50.0380859375, -47.97900390625, -45.919921875, -43.86083984375, -41.8017578125, -39.74267578125, -37.68359375, -35.62451171875, -33.5654296875, -31.50634765625, -29.447265625, -27.38818359375, -25.3291015625, -23.27001953125, -21.2109375, -19.15185546875, -17.0927734375, -15.03369140625, -12.974609375, -10.91552734375, -8.8564453125, -6.79736328125, -4.73828125, -2.67919921875, -0.6201171875, 1.43896484375, 3.498046875, 5.55712890625, 7.6162109375, 9.67529296875, 11.734375, 13.79345703125, 15.8525390625, 17.91162109375, 19.970703125, 22.02978515625, 24.0888671875, 26.14794921875, 28.20703125, 30.26611328125, 32.3251953125, 34.38427734375, 36.443359375, 38.50244140625, 40.5615234375, 42.62060546875, 44.6796875, 46.73876953125, 48.7978515625, 50.85693359375, 52.916015625, 54.97509765625, 57.0341796875, 59.09326171875, 61.15234375, 63.21142578125, 65.2705078125, 67.32958984375, 69.388671875, 71.44775390625, 73.5068359375, 75.56591796875, 77.625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 9.0, 16.0, 38.0, 49.0, 95.0, 180.0, 359.0, 720.0, 1089.0, 689.0, 366.0, 203.0, 104.0, 63.0, 34.0, 19.0, 14.0, 6.0, 6.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.30322265625, -31.1689453125, -30.03466796875, -28.900390625, -27.76611328125, -26.6318359375, -25.49755859375, -24.36328125, -23.22900390625, -22.0947265625, -20.96044921875, -19.826171875, -18.69189453125, -17.5576171875, -16.42333984375, -15.2890625, -14.15478515625, -13.0205078125, -11.88623046875, -10.751953125, -9.61767578125, -8.4833984375, -7.34912109375, -6.21484375, -5.08056640625, -3.9462890625, -2.81201171875, -1.677734375, -0.54345703125, 0.5908203125, 1.72509765625, 2.859375, 3.99365234375, 5.1279296875, 6.26220703125, 7.396484375, 8.53076171875, 9.6650390625, 10.79931640625, 11.93359375, 13.06787109375, 14.2021484375, 15.33642578125, 16.470703125, 17.60498046875, 18.7392578125, 19.87353515625, 21.0078125, 22.14208984375, 23.2763671875, 24.41064453125, 25.544921875, 26.67919921875, 27.8134765625, 28.94775390625, 30.08203125, 31.21630859375, 32.3505859375, 33.48486328125, 34.619140625, 35.75341796875, 36.8876953125, 38.02197265625, 39.15625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 3.0, 10.0, 17.0, 18.0, 37.0, 49.0, 75.0, 122.0, 181.0, 146.0, 125.0, 69.0, 30.0, 27.0, 25.0, 7.0, 17.0, 10.0, 5.0, 5.0, 5.0, 2.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-231.99697875976562, -225.3108367919922, -218.62469482421875, -211.9385528564453, -205.25241088867188, -198.56626892089844, -191.880126953125, -185.19398498535156, -178.50784301757812, -171.8217010498047, -165.13555908203125, -158.4494171142578, -151.76327514648438, -145.07713317871094, -138.3909912109375, -131.70484924316406, -125.01870727539062, -118.33256530761719, -111.64642333984375, -104.96028137207031, -98.27413940429688, -91.58799743652344, -84.90185546875, -78.21571350097656, -71.52957153320312, -64.84342956542969, -58.15728759765625, -51.47114562988281, -44.785003662109375, -38.09886169433594, -31.4127197265625, -24.726577758789062, -18.040435791015625, -11.354293823242188, -4.66815185546875, 2.0179901123046875, 8.704132080078125, 15.390274047851562, 22.076416015625, 28.762557983398438, 35.448699951171875, 42.13484191894531, 48.82098388671875, 55.50712585449219, 62.193267822265625, 68.87940979003906, 75.5655517578125, 82.25169372558594, 88.93783569335938, 95.62397766113281, 102.31011962890625, 108.99626159667969, 115.68240356445312, 122.36854553222656, 129.0546875, 135.74082946777344, 142.42697143554688, 149.1131134033203, 155.79925537109375, 162.4853973388672, 169.17153930664062, 175.85768127441406, 182.5438232421875, 189.22996520996094, 195.91610717773438]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 7.0, 6.0, 15.0, 16.0, 29.0, 26.0, 28.0, 22.0, 28.0, 44.0, 53.0, 38.0, 51.0, 58.0, 71.0, 61.0, 61.0, 59.0, 48.0, 34.0, 42.0, 32.0, 15.0, 30.0, 18.0, 21.0, 16.0, 13.0, 11.0, 7.0, 7.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-137.24017333984375, -133.484619140625, -129.7290802001953, -125.97352600097656, -122.21797943115234, -118.4624252319336, -114.70687866210938, -110.95132446289062, -107.1957778930664, -103.44023132324219, -99.68467712402344, -95.92913055419922, -92.173583984375, -88.41802978515625, -84.66248321533203, -80.90693664550781, -77.15138244628906, -73.39583587646484, -69.6402816772461, -65.88473510742188, -62.12918472290039, -58.373634338378906, -54.61808776855469, -50.8625373840332, -47.10699462890625, -43.351444244384766, -39.59589767456055, -35.84034729003906, -32.08479690551758, -28.329248428344727, -24.573699951171875, -20.81814956665039, -17.062599182128906, -13.307049751281738, -9.55150032043457, -5.795951843261719, -2.040402412414551, 1.7151470184326172, 5.470695495605469, 9.226245880126953, 12.981794357299805, 16.737342834472656, 20.49289321899414, 24.248441696166992, 28.003990173339844, 31.759540557861328, 35.51509094238281, 39.27063751220703, 43.026187896728516, 46.78173828125, 50.53728485107422, 54.2928352355957, 58.04838562011719, 61.803932189941406, 65.55947875976562, 69.31503295898438, 73.0705795288086, 76.82612609863281, 80.58168029785156, 84.33722686767578, 88.0927734375, 91.84832763671875, 95.60387420654297, 99.35942077636719, 103.11497497558594]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 13.0, 5.0, 11.0, 17.0, 27.0, 36.0, 35.0, 74.0, 111.0, 177.0, 265.0, 434.0, 726.0, 1256.0, 2380.0, 4951.0, 11144.0, 32869.0, 148365.0, 641122.0, 149714.0, 33251.0, 11144.0, 4848.0, 2395.0, 1274.0, 711.0, 415.0, 271.0, 167.0, 108.0, 70.0, 43.0, 34.0, 27.0, 18.0, 10.0, 14.0, 6.0, 9.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.671875, -15.2041015625, -14.736328125, -14.2685546875, -13.80078125, -13.3330078125, -12.865234375, -12.3974609375, -11.9296875, -11.4619140625, -10.994140625, -10.5263671875, -10.05859375, -9.5908203125, -9.123046875, -8.6552734375, -8.1875, -7.7197265625, -7.251953125, -6.7841796875, -6.31640625, -5.8486328125, -5.380859375, -4.9130859375, -4.4453125, -3.9775390625, -3.509765625, -3.0419921875, -2.57421875, -2.1064453125, -1.638671875, -1.1708984375, -0.703125, -0.2353515625, 0.232421875, 0.7001953125, 1.16796875, 1.6357421875, 2.103515625, 2.5712890625, 3.0390625, 3.5068359375, 3.974609375, 4.4423828125, 4.91015625, 5.3779296875, 5.845703125, 6.3134765625, 6.78125, 7.2490234375, 7.716796875, 8.1845703125, 8.65234375, 9.1201171875, 9.587890625, 10.0556640625, 10.5234375, 10.9912109375, 11.458984375, 11.9267578125, 12.39453125, 12.8623046875, 13.330078125, 13.7978515625, 14.265625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 10.0, 21.0, 14.0, 45.0, 49.0, 48.0, 57.0, 65.0, 69.0, 66.0, 65.0, 79.0, 80.0, 72.0, 52.0, 51.0, 35.0, 27.0, 21.0, 17.0, 14.0, 4.0, 15.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.402587890625, -11.96923828125, -11.535888671875, -11.1025390625, -10.669189453125, -10.23583984375, -9.802490234375, -9.369140625, -8.935791015625, -8.50244140625, -8.069091796875, -7.6357421875, -7.202392578125, -6.76904296875, -6.335693359375, -5.90234375, -5.468994140625, -5.03564453125, -4.602294921875, -4.1689453125, -3.735595703125, -3.30224609375, -2.868896484375, -2.435546875, -2.002197265625, -1.56884765625, -1.135498046875, -0.7021484375, -0.268798828125, 0.16455078125, 0.597900390625, 1.03125, 1.464599609375, 1.89794921875, 2.331298828125, 2.7646484375, 3.197998046875, 3.63134765625, 4.064697265625, 4.498046875, 4.931396484375, 5.36474609375, 5.798095703125, 6.2314453125, 6.664794921875, 7.09814453125, 7.531494140625, 7.96484375, 8.398193359375, 8.83154296875, 9.264892578125, 9.6982421875, 10.131591796875, 10.56494140625, 10.998291015625, 11.431640625, 11.864990234375, 12.29833984375, 12.731689453125, 13.1650390625, 13.598388671875, 14.03173828125, 14.465087890625, 14.8984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 3.0, 14.0, 13.0, 14.0, 30.0, 50.0, 85.0, 101.0, 178.0, 392.0, 805.0, 2360.0, 10193.0, 119616.0, 883088.0, 24967.0, 4201.0, 1216.0, 527.0, 239.0, 159.0, 89.0, 50.0, 37.0, 37.0, 22.0, 13.0, 8.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.546875, -20.75537109375, -19.9638671875, -19.17236328125, -18.380859375, -17.58935546875, -16.7978515625, -16.00634765625, -15.21484375, -14.42333984375, -13.6318359375, -12.84033203125, -12.048828125, -11.25732421875, -10.4658203125, -9.67431640625, -8.8828125, -8.09130859375, -7.2998046875, -6.50830078125, -5.716796875, -4.92529296875, -4.1337890625, -3.34228515625, -2.55078125, -1.75927734375, -0.9677734375, -0.17626953125, 0.615234375, 1.40673828125, 2.1982421875, 2.98974609375, 3.78125, 4.57275390625, 5.3642578125, 6.15576171875, 6.947265625, 7.73876953125, 8.5302734375, 9.32177734375, 10.11328125, 10.90478515625, 11.6962890625, 12.48779296875, 13.279296875, 14.07080078125, 14.8623046875, 15.65380859375, 16.4453125, 17.23681640625, 18.0283203125, 18.81982421875, 19.611328125, 20.40283203125, 21.1943359375, 21.98583984375, 22.77734375, 23.56884765625, 24.3603515625, 25.15185546875, 25.943359375, 26.73486328125, 27.5263671875, 28.31787109375, 29.109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 3.0, 8.0, 10.0, 5.0, 5.0, 7.0, 8.0, 13.0, 13.0, 17.0, 18.0, 22.0, 18.0, 24.0, 31.0, 32.0, 50.0, 50.0, 51.0, 66.0, 74.0, 48.0, 58.0, 55.0, 44.0, 30.0, 35.0, 25.0, 32.0, 19.0, 18.0, 11.0, 18.0, 10.0, 9.0, 9.0, 7.0, 9.0, 6.0, 11.0, 3.0, 5.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-31.25, -30.320068359375, -29.39013671875, -28.460205078125, -27.5302734375, -26.600341796875, -25.67041015625, -24.740478515625, -23.810546875, -22.880615234375, -21.95068359375, -21.020751953125, -20.0908203125, -19.160888671875, -18.23095703125, -17.301025390625, -16.37109375, -15.441162109375, -14.51123046875, -13.581298828125, -12.6513671875, -11.721435546875, -10.79150390625, -9.861572265625, -8.931640625, -8.001708984375, -7.07177734375, -6.141845703125, -5.2119140625, -4.281982421875, -3.35205078125, -2.422119140625, -1.4921875, -0.562255859375, 0.36767578125, 1.297607421875, 2.2275390625, 3.157470703125, 4.08740234375, 5.017333984375, 5.947265625, 6.877197265625, 7.80712890625, 8.737060546875, 9.6669921875, 10.596923828125, 11.52685546875, 12.456787109375, 13.38671875, 14.316650390625, 15.24658203125, 16.176513671875, 17.1064453125, 18.036376953125, 18.96630859375, 19.896240234375, 20.826171875, 21.756103515625, 22.68603515625, 23.615966796875, 24.5458984375, 25.475830078125, 26.40576171875, 27.335693359375, 28.265625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 2.0, 3.0, 7.0, 9.0, 10.0, 15.0, 23.0, 37.0, 50.0, 86.0, 144.0, 298.0, 690.0, 1949.0, 7065.0, 45415.0, 951027.0, 33029.0, 5889.0, 1551.0, 586.0, 271.0, 144.0, 79.0, 52.0, 30.0, 23.0, 13.0, 13.0, 12.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.6875, -8.419677734375, -8.15185546875, -7.884033203125, -7.6162109375, -7.348388671875, -7.08056640625, -6.812744140625, -6.544921875, -6.277099609375, -6.00927734375, -5.741455078125, -5.4736328125, -5.205810546875, -4.93798828125, -4.670166015625, -4.40234375, -4.134521484375, -3.86669921875, -3.598876953125, -3.3310546875, -3.063232421875, -2.79541015625, -2.527587890625, -2.259765625, -1.991943359375, -1.72412109375, -1.456298828125, -1.1884765625, -0.920654296875, -0.65283203125, -0.385009765625, -0.1171875, 0.150634765625, 0.41845703125, 0.686279296875, 0.9541015625, 1.221923828125, 1.48974609375, 1.757568359375, 2.025390625, 2.293212890625, 2.56103515625, 2.828857421875, 3.0966796875, 3.364501953125, 3.63232421875, 3.900146484375, 4.16796875, 4.435791015625, 4.70361328125, 4.971435546875, 5.2392578125, 5.507080078125, 5.77490234375, 6.042724609375, 6.310546875, 6.578369140625, 6.84619140625, 7.114013671875, 7.3818359375, 7.649658203125, 7.91748046875, 8.185302734375, 8.453125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 8.0, 10.0, 13.0, 29.0, 21.0, 42.0, 56.0, 154.0, 245.0, 177.0, 77.0, 52.0, 29.0, 17.0, 17.0, 8.0, 6.0, 7.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0017910003662109375, -0.001715153455734253, -0.0016393065452575684, -0.0015634596347808838, -0.0014876127243041992, -0.0014117658138275146, -0.00133591890335083, -0.0012600719928741455, -0.001184225082397461, -0.0011083781719207764, -0.0010325312614440918, -0.0009566843509674072, -0.0008808374404907227, -0.0008049905300140381, -0.0007291436195373535, -0.0006532967090606689, -0.0005774497985839844, -0.0005016028881072998, -0.00042575597763061523, -0.00034990906715393066, -0.0002740621566772461, -0.00019821524620056152, -0.00012236833572387695, -4.652142524719238e-05, 2.9325485229492188e-05, 0.00010517239570617676, 0.00018101930618286133, 0.0002568662166595459, 0.00033271312713623047, 0.00040856003761291504, 0.0004844069480895996, 0.0005602538585662842, 0.0006361007690429688, 0.0007119476795196533, 0.0007877945899963379, 0.0008636415004730225, 0.000939488410949707, 0.0010153353214263916, 0.0010911822319030762, 0.0011670291423797607, 0.0012428760528564453, 0.0013187229633331299, 0.0013945698738098145, 0.001470416784286499, 0.0015462636947631836, 0.0016221106052398682, 0.0016979575157165527, 0.0017738044261932373, 0.0018496513366699219, 0.0019254982471466064, 0.002001345157623291, 0.0020771920680999756, 0.00215303897857666, 0.0022288858890533447, 0.0023047327995300293, 0.002380579710006714, 0.0024564266204833984, 0.002532273530960083, 0.0026081204414367676, 0.002683967351913452, 0.0027598142623901367, 0.0028356611728668213, 0.002911508083343506, 0.0029873549938201904, 0.003063201904296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 10.0, 5.0, 9.0, 8.0, 13.0, 28.0, 30.0, 46.0, 60.0, 83.0, 148.0, 221.0, 360.0, 645.0, 1211.0, 2720.0, 7926.0, 46439.0, 936887.0, 39231.0, 7278.0, 2597.0, 1103.0, 548.0, 321.0, 199.0, 115.0, 81.0, 69.0, 44.0, 30.0, 18.0, 16.0, 11.0, 9.0, 7.0, 5.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4921875, -7.2379150390625, -6.983642578125, -6.7293701171875, -6.47509765625, -6.2208251953125, -5.966552734375, -5.7122802734375, -5.4580078125, -5.2037353515625, -4.949462890625, -4.6951904296875, -4.44091796875, -4.1866455078125, -3.932373046875, -3.6781005859375, -3.423828125, -3.1695556640625, -2.915283203125, -2.6610107421875, -2.40673828125, -2.1524658203125, -1.898193359375, -1.6439208984375, -1.3896484375, -1.1353759765625, -0.881103515625, -0.6268310546875, -0.37255859375, -0.1182861328125, 0.135986328125, 0.3902587890625, 0.64453125, 0.8988037109375, 1.153076171875, 1.4073486328125, 1.66162109375, 1.9158935546875, 2.170166015625, 2.4244384765625, 2.6787109375, 2.9329833984375, 3.187255859375, 3.4415283203125, 3.69580078125, 3.9500732421875, 4.204345703125, 4.4586181640625, 4.712890625, 4.9671630859375, 5.221435546875, 5.4757080078125, 5.72998046875, 5.9842529296875, 6.238525390625, 6.4927978515625, 6.7470703125, 7.0013427734375, 7.255615234375, 7.5098876953125, 7.76416015625, 8.0184326171875, 8.272705078125, 8.5269775390625, 8.78125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 12.0, 3.0, 6.0, 7.0, 7.0, 9.0, 7.0, 21.0, 14.0, 31.0, 39.0, 48.0, 88.0, 124.0, 154.0, 127.0, 92.0, 50.0, 46.0, 30.0, 19.0, 11.0, 8.0, 4.0, 8.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.7734375, -5.58978271484375, -5.4061279296875, -5.22247314453125, -5.038818359375, -4.85516357421875, -4.6715087890625, -4.48785400390625, -4.30419921875, -4.12054443359375, -3.9368896484375, -3.75323486328125, -3.569580078125, -3.38592529296875, -3.2022705078125, -3.01861572265625, -2.8349609375, -2.65130615234375, -2.4676513671875, -2.28399658203125, -2.100341796875, -1.91668701171875, -1.7330322265625, -1.54937744140625, -1.36572265625, -1.18206787109375, -0.9984130859375, -0.81475830078125, -0.631103515625, -0.44744873046875, -0.2637939453125, -0.08013916015625, 0.103515625, 0.28717041015625, 0.4708251953125, 0.65447998046875, 0.838134765625, 1.02178955078125, 1.2054443359375, 1.38909912109375, 1.57275390625, 1.75640869140625, 1.9400634765625, 2.12371826171875, 2.307373046875, 2.49102783203125, 2.6746826171875, 2.85833740234375, 3.0419921875, 3.22564697265625, 3.4093017578125, 3.59295654296875, 3.776611328125, 3.96026611328125, 4.1439208984375, 4.32757568359375, 4.51123046875, 4.69488525390625, 4.8785400390625, 5.06219482421875, 5.245849609375, 5.42950439453125, 5.6131591796875, 5.79681396484375, 5.98046875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 24.0, 37.0, 73.0, 151.0, 485.0, 96.0, 49.0, 27.0, 13.0, 12.0, 6.0, 2.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.74563598632812, -201.07403564453125, -195.4024200439453, -189.73081970214844, -184.0592041015625, -178.38760375976562, -172.71600341796875, -167.04440307617188, -161.37278747558594, -155.70118713378906, -150.02957153320312, -144.35797119140625, -138.68637084960938, -133.01475524902344, -127.34315490722656, -121.67154693603516, -115.99993896484375, -110.32833099365234, -104.65672302246094, -98.98512268066406, -93.31351470947266, -87.64190673828125, -81.97030639648438, -76.29869842529297, -70.62709045410156, -64.95548248291016, -59.283878326416016, -53.612274169921875, -47.94066619873047, -42.26905822753906, -36.59745407104492, -30.92584991455078, -25.254257202148438, -19.582651138305664, -13.91104507446289, -8.239439010620117, -2.5678329467773438, 3.1037731170654297, 8.775379180908203, 14.446983337402344, 20.11859130859375, 25.790197372436523, 31.461803436279297, 37.13340759277344, 42.805015563964844, 48.47662353515625, 54.14822769165039, 59.81983184814453, 65.49143981933594, 71.16304779052734, 76.83465576171875, 82.50625610351562, 88.17786407470703, 93.84947204589844, 99.52107238769531, 105.19268035888672, 110.86428833007812, 116.53589630126953, 122.20750427246094, 127.87910461425781, 133.55072021484375, 139.22232055664062, 144.8939208984375, 150.56552124023438, 156.2371368408203]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 9.0, 4.0, 4.0, 4.0, 9.0, 4.0, 9.0, 15.0, 17.0, 19.0, 10.0, 28.0, 16.0, 23.0, 34.0, 40.0, 134.0, 275.0, 99.0, 32.0, 20.0, 23.0, 26.0, 22.0, 21.0, 13.0, 10.0, 24.0, 12.0, 8.0, 9.0, 4.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-96.91108703613281, -93.6082534790039, -90.30542755126953, -87.00259399414062, -83.69976806640625, -80.39693450927734, -77.09410095214844, -73.79127502441406, -70.48844146728516, -67.18560791015625, -63.882781982421875, -60.57994842529297, -57.27711868286133, -53.97428894042969, -50.67145919799805, -47.368629455566406, -44.065799713134766, -40.762969970703125, -37.460140228271484, -34.157310485839844, -30.854476928710938, -27.551647186279297, -24.248817443847656, -20.945985794067383, -17.643156051635742, -14.340325355529785, -11.037494659423828, -7.7346649169921875, -4.4318342208862305, -1.1290035247802734, 2.173826217651367, 5.476657867431641, 8.779487609863281, 12.082318305969238, 15.385149002075195, 18.687978744506836, 21.99081039428711, 25.29364013671875, 28.59646987915039, 31.899301528930664, 35.20213317871094, 38.50496292114258, 41.80779266357422, 45.110626220703125, 48.413455963134766, 51.716285705566406, 55.01911544799805, 58.32194519042969, 61.62477493286133, 64.92760467529297, 68.23043823242188, 71.53326416015625, 74.83609771728516, 78.13893127441406, 81.44175720214844, 84.74459075927734, 88.04741668701172, 91.35025024414062, 94.653076171875, 97.9559097290039, 101.25873565673828, 104.56156921386719, 107.86439514160156, 111.16722869873047, 114.47006225585938]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 5.0, 4.0, 10.0, 15.0, 12.0, 11.0, 17.0, 24.0, 24.0, 35.0, 41.0, 44.0, 36.0, 105.0, 232.0, 105.0, 41.0, 33.0, 38.0, 28.0, 13.0, 29.0, 21.0, 13.0, 10.0, 13.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.703125, -7.3748779296875, -7.046630859375, -6.7183837890625, -6.39013671875, -6.0618896484375, -5.733642578125, -5.4053955078125, -5.0771484375, -4.7489013671875, -4.420654296875, -4.0924072265625, -3.76416015625, -3.4359130859375, -3.107666015625, -2.7794189453125, -2.451171875, -2.1229248046875, -1.794677734375, -1.4664306640625, -1.13818359375, -0.8099365234375, -0.481689453125, -0.1534423828125, 0.1748046875, 0.5030517578125, 0.831298828125, 1.1595458984375, 1.48779296875, 1.8160400390625, 2.144287109375, 2.4725341796875, 2.80078125, 3.1290283203125, 3.457275390625, 3.7855224609375, 4.11376953125, 4.4420166015625, 4.770263671875, 5.0985107421875, 5.4267578125, 5.7550048828125, 6.083251953125, 6.4114990234375, 6.73974609375, 7.0679931640625, 7.396240234375, 7.7244873046875, 8.052734375, 8.3809814453125, 8.709228515625, 9.0374755859375, 9.36572265625, 9.6939697265625, 10.022216796875, 10.3504638671875, 10.6787109375, 11.0069580078125, 11.335205078125, 11.6634521484375, 11.99169921875, 12.3199462890625, 12.648193359375, 12.9764404296875, 13.3046875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 10.0, 20.0, 38.0, 58.0, 142.0, 384.0, 1134.0, 7844.0, 8360771.0, 15697.0, 1660.0, 438.0, 187.0, 78.0, 38.0, 29.0, 15.0, 4.0, 7.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-169.37770080566406, -165.74429321289062, -162.11087036132812, -158.4774627685547, -154.8440399169922, -151.21063232421875, -147.57720947265625, -143.9438018798828, -140.3103790283203, -136.67697143554688, -133.04354858398438, -129.41014099121094, -125.77671813964844, -122.14330291748047, -118.5098876953125, -114.87648010253906, -111.2430648803711, -107.60964965820312, -103.97623443603516, -100.34281921386719, -96.70940399169922, -93.07598876953125, -89.44258117675781, -85.80915832519531, -82.17575073242188, -78.5423355102539, -74.90892028808594, -71.27550506591797, -67.64208984375, -64.00867462158203, -60.37526321411133, -56.74184799194336, -53.108436584472656, -49.47502136230469, -45.84160614013672, -42.20819091796875, -38.57477569580078, -34.94136047363281, -31.30794906616211, -27.67453384399414, -24.041118621826172, -20.407703399658203, -16.774288177490234, -13.140874862670898, -9.50745964050293, -5.874044418334961, -2.240631103515625, 1.3927841186523438, 5.0261993408203125, 8.659614562988281, 12.293028831481934, 15.926443099975586, 19.559858322143555, 23.193273544311523, 26.82668685913086, 30.460102081298828, 34.0935173034668, 37.726932525634766, 41.360347747802734, 44.99375915527344, 48.627174377441406, 52.260589599609375, 55.894004821777344, 59.52742004394531, 63.16083526611328]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 5.0, 7.0, 3.0, 0.0, 5.0, 7.0, 11.0, 12.0, 2.0, 2.0, 2.0, 2.0, 9.0, 5.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-125.534912109375, -122.53495025634766, -119.53499603271484, -116.5350341796875, -113.53507995605469, -110.53511810302734, -107.53515625, -104.53520202636719, -101.53524017333984, -98.5352783203125, -95.53532409667969, -92.53536224365234, -89.53540802001953, -86.53544616699219, -83.53549194335938, -80.53553009033203, -77.53556823730469, -74.53560638427734, -71.53565216064453, -68.53569030761719, -65.53573608398438, -62.53577423095703, -59.53581619262695, -56.535858154296875, -53.53590393066406, -50.535945892333984, -47.535987854003906, -44.53602600097656, -41.536067962646484, -38.536109924316406, -35.53615188598633, -32.53619384765625, -29.536231994628906, -26.536273956298828, -23.536314010620117, -20.53635597229004, -17.536396026611328, -14.53643798828125, -11.536479949951172, -8.536520004272461, -5.536561965942383, -2.5366032123565674, 0.46335554122924805, 3.4633140563964844, 6.463273048400879, 9.463232040405273, 12.463190078735352, 15.463150024414062, 18.46310806274414, 21.46306610107422, 24.46302604675293, 27.462984085083008, 30.46294403076172, 33.4629020690918, 36.462860107421875, 39.46282196044922, 42.46277618408203, 45.46273422241211, 48.46269226074219, 51.46265411376953, 54.46261215209961, 57.46257019042969, 60.462528228759766, 63.462486267089844, 66.46244812011719]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 6.0, 9.0, 13.0, 11.0, 13.0, 16.0, 24.0, 28.0, 29.0, 48.0, 53.0, 45.0, 41.0, 52.0, 59.0, 65.0, 76.0, 49.0, 54.0, 47.0, 38.0, 38.0, 30.0, 30.0, 25.0, 12.0, 12.0, 14.0, 18.0, 7.0, 4.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.40899658203125, -4.2711181640625, -4.13323974609375, -3.995361328125, -3.85748291015625, -3.7196044921875, -3.58172607421875, -3.44384765625, -3.30596923828125, -3.1680908203125, -3.03021240234375, -2.892333984375, -2.75445556640625, -2.6165771484375, -2.47869873046875, -2.3408203125, -2.20294189453125, -2.0650634765625, -1.92718505859375, -1.789306640625, -1.65142822265625, -1.5135498046875, -1.37567138671875, -1.23779296875, -1.09991455078125, -0.9620361328125, -0.82415771484375, -0.686279296875, -0.54840087890625, -0.4105224609375, -0.27264404296875, -0.134765625, 0.00311279296875, 0.1409912109375, 0.27886962890625, 0.416748046875, 0.55462646484375, 0.6925048828125, 0.83038330078125, 0.96826171875, 1.10614013671875, 1.2440185546875, 1.38189697265625, 1.519775390625, 1.65765380859375, 1.7955322265625, 1.93341064453125, 2.0712890625, 2.20916748046875, 2.3470458984375, 2.48492431640625, 2.622802734375, 2.76068115234375, 2.8985595703125, 3.03643798828125, 3.17431640625, 3.31219482421875, 3.4500732421875, 3.58795166015625, 3.725830078125, 3.86370849609375, 4.0015869140625, 4.13946533203125, 4.27734375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 5.0, 5.0, 21.0, 23.0, 27.0, 40.0, 73.0, 136.0, 219.0, 420.0, 818.0, 2011.0, 5917.0, 23315.0, 131211.0, 283343.0, 58907.0, 11697.0, 3353.0, 1322.0, 582.0, 315.0, 167.0, 122.0, 75.0, 48.0, 27.0, 15.0, 11.0, 13.0, 6.0, 4.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-100.1875, -97.083984375, -93.98046875, -90.876953125, -87.7734375, -84.669921875, -81.56640625, -78.462890625, -75.359375, -72.255859375, -69.15234375, -66.048828125, -62.9453125, -59.841796875, -56.73828125, -53.634765625, -50.53125, -47.427734375, -44.32421875, -41.220703125, -38.1171875, -35.013671875, -31.91015625, -28.806640625, -25.703125, -22.599609375, -19.49609375, -16.392578125, -13.2890625, -10.185546875, -7.08203125, -3.978515625, -0.875, 2.228515625, 5.33203125, 8.435546875, 11.5390625, 14.642578125, 17.74609375, 20.849609375, 23.953125, 27.056640625, 30.16015625, 33.263671875, 36.3671875, 39.470703125, 42.57421875, 45.677734375, 48.78125, 51.884765625, 54.98828125, 58.091796875, 61.1953125, 64.298828125, 67.40234375, 70.505859375, 73.609375, 76.712890625, 79.81640625, 82.919921875, 86.0234375, 89.126953125, 92.23046875, 95.333984375, 98.4375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 3.0, 8.0, 8.0, 3.0, 6.0, 12.0, 17.0, 18.0, 11.0, 27.0, 28.0, 34.0, 43.0, 48.0, 45.0, 59.0, 63.0, 61.0, 53.0, 54.0, 69.0, 49.0, 49.0, 31.0, 37.0, 34.0, 23.0, 22.0, 19.0, 13.0, 12.0, 9.0, 6.0, 3.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-10.6875, -10.40191650390625, -10.1163330078125, -9.83074951171875, -9.545166015625, -9.25958251953125, -8.9739990234375, -8.68841552734375, -8.40283203125, -8.11724853515625, -7.8316650390625, -7.54608154296875, -7.260498046875, -6.97491455078125, -6.6893310546875, -6.40374755859375, -6.1181640625, -5.83258056640625, -5.5469970703125, -5.26141357421875, -4.975830078125, -4.69024658203125, -4.4046630859375, -4.11907958984375, -3.83349609375, -3.54791259765625, -3.2623291015625, -2.97674560546875, -2.691162109375, -2.40557861328125, -2.1199951171875, -1.83441162109375, -1.548828125, -1.26324462890625, -0.9776611328125, -0.69207763671875, -0.406494140625, -0.12091064453125, 0.1646728515625, 0.45025634765625, 0.73583984375, 1.02142333984375, 1.3070068359375, 1.59259033203125, 1.878173828125, 2.16375732421875, 2.4493408203125, 2.73492431640625, 3.0205078125, 3.30609130859375, 3.5916748046875, 3.87725830078125, 4.162841796875, 4.44842529296875, 4.7340087890625, 5.01959228515625, 5.30517578125, 5.59075927734375, 5.8763427734375, 6.16192626953125, 6.447509765625, 6.73309326171875, 7.0186767578125, 7.30426025390625, 7.58984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 11.0, 20.0, 15.0, 39.0, 87.0, 99.0, 96.0, 46.0, 23.0, 15.0, 9.0, 13.0, 3.0, 7.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.67760467529297, -80.07489013671875, -77.47216796875, -74.86945343017578, -72.26673889160156, -69.66401672363281, -67.0613021850586, -64.45858764648438, -61.855865478515625, -59.25314712524414, -56.650428771972656, -54.04771423339844, -51.44499588012695, -48.84227752685547, -46.23956298828125, -43.636844635009766, -41.03412628173828, -38.4314079284668, -35.82868957519531, -33.225975036621094, -30.62325668334961, -28.020538330078125, -25.417821884155273, -22.815105438232422, -20.212387084960938, -17.609668731689453, -15.006952285766602, -12.404234886169434, -9.801517486572266, -7.198800086975098, -4.59608268737793, -1.9933662414550781, 0.609344482421875, 3.212061882019043, 5.814779281616211, 8.417496681213379, 11.020214080810547, 13.622931480407715, 16.225648880004883, 18.828365325927734, 21.43108367919922, 24.033802032470703, 26.636518478393555, 29.239234924316406, 31.84195327758789, 34.444671630859375, 37.047386169433594, 39.65010452270508, 42.25282287597656, 44.85554122924805, 47.45825958251953, 50.06097412109375, 52.663692474365234, 55.26641082763672, 57.86912536621094, 60.47184371948242, 63.074562072753906, 65.67727661132812, 68.27999877929688, 70.8827133178711, 73.48542785644531, 76.08815002441406, 78.69086456298828, 81.2935791015625, 83.89630126953125]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 0.0, 5.0, 6.0, 17.0, 17.0, 17.0, 46.0, 57.0, 92.0, 70.0, 44.0, 40.0, 10.0, 6.0, 6.0, 4.0, 3.0, 3.0, 5.0, 2.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.68903350830078, -47.28626251220703, -45.88349533081055, -44.4807243347168, -43.07795333862305, -41.67518615722656, -40.27241516113281, -38.86964416503906, -37.46687698364258, -36.06410598754883, -34.661338806152344, -33.258567810058594, -31.855798721313477, -30.45302963256836, -29.05025863647461, -27.647489547729492, -26.244718551635742, -24.841949462890625, -23.439178466796875, -22.036409378051758, -20.63364028930664, -19.23086929321289, -17.828100204467773, -16.425331115722656, -15.022561073303223, -13.619791030883789, -12.217021942138672, -10.814251899719238, -9.411481857299805, -8.008712768554688, -6.605942726135254, -5.203173637390137, -3.800403594970703, -2.3976340293884277, -0.9948642253875732, 0.40790557861328125, 1.8106751441955566, 3.213444709777832, 4.616214752197266, 6.018983840942383, 7.421753883361816, 8.82452392578125, 10.227293014526367, 11.6300630569458, 13.032833099365234, 14.435602188110352, 15.838372230529785, 17.24114227294922, 18.643911361694336, 20.046680450439453, 21.449451446533203, 22.85222053527832, 24.254989624023438, 25.657760620117188, 27.060529708862305, 28.463298797607422, 29.866069793701172, 31.26883888244629, 32.671607971191406, 34.074378967285156, 35.477149963378906, 36.87991714477539, 38.28268814086914, 39.685455322265625, 41.088226318359375]}, "eval/loss": 0.7765135765075684, "eval/wer": 0.13639428798095993, "eval/runtime": 828.6657, "eval/samples_per_second": 3.188, "eval/steps_per_second": 0.399} \ No newline at end of file +{"train/loss": 0.4546, "train/learning_rate": 7.340845070422535e-06, "train/epoch": 19.17, "train/global_step": 17096, "_runtime": 106531, "_timestamp": 1648051110, "_step": 17106, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 5.0, 4.0, 5.0, 8.0, 10.0, 12.0, 9.0, 13.0, 14.0, 24.0, 23.0, 20.0, 30.0, 35.0, 34.0, 24.0, 20.0, 25.0, 40.0, 47.0, 31.0, 50.0, 36.0, 39.0, 41.0, 33.0, 30.0, 25.0, 39.0, 28.0, 29.0, 28.0, 22.0, 24.0, 17.0, 19.0, 18.0, 16.0, 15.0, 10.0, 9.0, 12.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-6.029391288757324, -5.889625549316406, -5.74985933303833, -5.610093593597412, -5.470327854156494, -5.330561637878418, -5.1907958984375, -5.051030158996582, -4.911263942718506, -4.771498203277588, -4.631731986999512, -4.491966247558594, -4.352200508117676, -4.2124342918396, -4.072668552398682, -3.9329025745391846, -3.7931368350982666, -3.6533708572387695, -3.5136051177978516, -3.3738391399383545, -3.2340731620788574, -3.0943074226379395, -2.9545414447784424, -2.8147754669189453, -2.6750097274780273, -2.5352437496185303, -2.3954780101776123, -2.2557120323181152, -2.115946054458618, -1.9761801958084106, -1.8364143371582031, -1.696648359298706, -1.5568821430206299, -1.4171162843704224, -1.2773503065109253, -1.1375844478607178, -0.9978185296058655, -0.8580526113510132, -0.7182867527008057, -0.5785208344459534, -0.4387549161911011, -0.2989889979362488, -0.15922310948371887, -0.019457221031188965, 0.12030869722366333, 0.2600746154785156, 0.39984047412872314, 0.5396063923835754, 0.6793723106384277, 0.81913822889328, 0.9589041471481323, 1.0986700057983398, 1.238435983657837, 1.3782018423080444, 1.517967700958252, 1.657733678817749, 1.7974995374679565, 1.937265396118164, 2.077031373977661, 2.216797351837158, 2.356563091278076, 2.4963290691375732, 2.6360950469970703, 2.7758607864379883, 2.9156267642974854]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 11.0, 9.0, 13.0, 8.0, 17.0, 19.0, 20.0, 13.0, 23.0, 32.0, 24.0, 32.0, 33.0, 30.0, 31.0, 30.0, 42.0, 36.0, 35.0, 40.0, 47.0, 26.0, 34.0, 40.0, 37.0, 37.0, 41.0, 34.0, 31.0, 23.0, 14.0, 28.0, 21.0, 17.0, 11.0, 10.0, 9.0, 4.0, 10.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.518879413604736, -4.373701572418213, -4.228523254394531, -4.083345413208008, -3.9381673336029053, -3.7929892539978027, -3.6478111743927, -3.5026330947875977, -3.357455253601074, -3.2122771739959717, -3.067099094390869, -2.9219212532043457, -2.776743173599243, -2.6315650939941406, -2.486387014389038, -2.3412089347839355, -2.196030855178833, -2.0508527755737305, -1.9056748151779175, -1.760496735572815, -1.615318775177002, -1.4701406955718994, -1.3249626159667969, -1.1797846555709839, -1.0346065759658813, -0.8894285559654236, -0.7442505359649658, -0.5990724563598633, -0.4538944363594055, -0.30871641635894775, -0.16353833675384521, -0.018360376358032227, 0.1268177032470703, 0.2719957232475281, 0.4171737730503082, 0.5623518228530884, 0.7075298428535461, 0.8527078628540039, 0.9978859424591064, 1.1430639028549194, 1.288241982460022, 1.4334200620651245, 1.5785980224609375, 1.72377610206604, 1.8689541816711426, 2.014132022857666, 2.1593103408813477, 2.304488182067871, 2.4496662616729736, 2.594844341278076, 2.7400224208831787, 2.8852005004882812, 3.0303783416748047, 3.1755564212799072, 3.3207345008850098, 3.465912342071533, 3.611090660095215, 3.7562687397003174, 3.90144681930542, 4.046624660491943, 4.191802978515625, 4.336980819702148, 4.482158660888672, 4.6273369789123535, 4.772514820098877]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 9.0, 8.0, 10.0, 21.0, 31.0, 44.0, 86.0, 159.0, 236.0, 352.0, 628.0, 998.0, 1594.0, 2705.0, 4333.0, 7189.0, 11697.0, 19060.0, 31794.0, 52286.0, 83858.0, 136184.0, 214006.0, 328789.0, 467884.0, 592811.0, 622318.0, 530161.0, 390312.0, 261023.0, 166246.0, 104286.0, 63957.0, 38569.0, 23874.0, 14436.0, 8748.0, 5384.0, 3182.0, 1962.0, 1194.0, 704.0, 481.0, 269.0, 158.0, 116.0, 51.0, 36.0, 15.0, 14.0, 9.0, 5.0, 6.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75, -5.55975341796875, -5.3695068359375, -5.17926025390625, -4.989013671875, -4.79876708984375, -4.6085205078125, -4.41827392578125, -4.22802734375, -4.03778076171875, -3.8475341796875, -3.65728759765625, -3.467041015625, -3.27679443359375, -3.0865478515625, -2.89630126953125, -2.7060546875, -2.51580810546875, -2.3255615234375, -2.13531494140625, -1.945068359375, -1.75482177734375, -1.5645751953125, -1.37432861328125, -1.18408203125, -0.99383544921875, -0.8035888671875, -0.61334228515625, -0.423095703125, -0.23284912109375, -0.0426025390625, 0.14764404296875, 0.337890625, 0.52813720703125, 0.7183837890625, 0.90863037109375, 1.098876953125, 1.28912353515625, 1.4793701171875, 1.66961669921875, 1.85986328125, 2.05010986328125, 2.2403564453125, 2.43060302734375, 2.620849609375, 2.81109619140625, 3.0013427734375, 3.19158935546875, 3.3818359375, 3.57208251953125, 3.7623291015625, 3.95257568359375, 4.142822265625, 4.33306884765625, 4.5233154296875, 4.71356201171875, 4.90380859375, 5.09405517578125, 5.2843017578125, 5.47454833984375, 5.664794921875, 5.85504150390625, 6.0452880859375, 6.23553466796875, 6.42578125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 10.0, 4.0, 13.0, 13.0, 24.0, 24.0, 30.0, 21.0, 31.0, 31.0, 45.0, 35.0, 35.0, 45.0, 36.0, 43.0, 51.0, 51.0, 41.0, 51.0, 40.0, 42.0, 30.0, 39.0, 32.0, 23.0, 32.0, 33.0, 23.0, 14.0, 13.0, 10.0, 9.0, 5.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.08984375, -5.9052734375, -5.720703125, -5.5361328125, -5.3515625, -5.1669921875, -4.982421875, -4.7978515625, -4.61328125, -4.4287109375, -4.244140625, -4.0595703125, -3.875, -3.6904296875, -3.505859375, -3.3212890625, -3.13671875, -2.9521484375, -2.767578125, -2.5830078125, -2.3984375, -2.2138671875, -2.029296875, -1.8447265625, -1.66015625, -1.4755859375, -1.291015625, -1.1064453125, -0.921875, -0.7373046875, -0.552734375, -0.3681640625, -0.18359375, 0.0009765625, 0.185546875, 0.3701171875, 0.5546875, 0.7392578125, 0.923828125, 1.1083984375, 1.29296875, 1.4775390625, 1.662109375, 1.8466796875, 2.03125, 2.2158203125, 2.400390625, 2.5849609375, 2.76953125, 2.9541015625, 3.138671875, 3.3232421875, 3.5078125, 3.6923828125, 3.876953125, 4.0615234375, 4.24609375, 4.4306640625, 4.615234375, 4.7998046875, 4.984375, 5.1689453125, 5.353515625, 5.5380859375, 5.72265625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 16.0, 22.0, 28.0, 37.0, 55.0, 95.0, 133.0, 217.0, 363.0, 584.0, 884.0, 1514.0, 2567.0, 4092.0, 6955.0, 11722.0, 19988.0, 32872.0, 55144.0, 89683.0, 143099.0, 222204.0, 326090.0, 448266.0, 551612.0, 580791.0, 517513.0, 400439.0, 282793.0, 187994.0, 119648.0, 74028.0, 44890.0, 27102.0, 16293.0, 9798.0, 5839.0, 3531.0, 2122.0, 1206.0, 755.0, 465.0, 289.0, 189.0, 118.0, 81.0, 60.0, 34.0, 22.0, 23.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0], "bins": [-5.56640625, -5.39410400390625, -5.2218017578125, -5.04949951171875, -4.877197265625, -4.70489501953125, -4.5325927734375, -4.36029052734375, -4.18798828125, -4.01568603515625, -3.8433837890625, -3.67108154296875, -3.498779296875, -3.32647705078125, -3.1541748046875, -2.98187255859375, -2.8095703125, -2.63726806640625, -2.4649658203125, -2.29266357421875, -2.120361328125, -1.94805908203125, -1.7757568359375, -1.60345458984375, -1.43115234375, -1.25885009765625, -1.0865478515625, -0.91424560546875, -0.741943359375, -0.56964111328125, -0.3973388671875, -0.22503662109375, -0.052734375, 0.11956787109375, 0.2918701171875, 0.46417236328125, 0.636474609375, 0.80877685546875, 0.9810791015625, 1.15338134765625, 1.32568359375, 1.49798583984375, 1.6702880859375, 1.84259033203125, 2.014892578125, 2.18719482421875, 2.3594970703125, 2.53179931640625, 2.7041015625, 2.87640380859375, 3.0487060546875, 3.22100830078125, 3.393310546875, 3.56561279296875, 3.7379150390625, 3.91021728515625, 4.08251953125, 4.25482177734375, 4.4271240234375, 4.59942626953125, 4.771728515625, 4.94403076171875, 5.1163330078125, 5.28863525390625, 5.4609375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 11.0, 18.0, 18.0, 37.0, 31.0, 43.0, 50.0, 71.0, 87.0, 107.0, 135.0, 147.0, 196.0, 185.0, 204.0, 238.0, 232.0, 256.0, 255.0, 271.0, 238.0, 232.0, 191.0, 155.0, 143.0, 108.0, 83.0, 70.0, 53.0, 57.0, 32.0, 28.0, 19.0, 13.0, 14.0, 11.0, 10.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.93359375, -2.851348876953125, -2.76910400390625, -2.686859130859375, -2.6046142578125, -2.522369384765625, -2.44012451171875, -2.357879638671875, -2.275634765625, -2.193389892578125, -2.11114501953125, -2.028900146484375, -1.9466552734375, -1.864410400390625, -1.78216552734375, -1.699920654296875, -1.61767578125, -1.535430908203125, -1.45318603515625, -1.370941162109375, -1.2886962890625, -1.206451416015625, -1.12420654296875, -1.041961669921875, -0.959716796875, -0.877471923828125, -0.79522705078125, -0.712982177734375, -0.6307373046875, -0.548492431640625, -0.46624755859375, -0.384002685546875, -0.3017578125, -0.219512939453125, -0.13726806640625, -0.055023193359375, 0.0272216796875, 0.109466552734375, 0.19171142578125, 0.273956298828125, 0.356201171875, 0.438446044921875, 0.52069091796875, 0.602935791015625, 0.6851806640625, 0.767425537109375, 0.84967041015625, 0.931915283203125, 1.01416015625, 1.096405029296875, 1.17864990234375, 1.260894775390625, 1.3431396484375, 1.425384521484375, 1.50762939453125, 1.589874267578125, 1.672119140625, 1.754364013671875, 1.83660888671875, 1.918853759765625, 2.0010986328125, 2.083343505859375, 2.16558837890625, 2.247833251953125, 2.330078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 7.0, 8.0, 10.0, 13.0, 9.0, 16.0, 20.0, 12.0, 15.0, 29.0, 20.0, 22.0, 32.0, 34.0, 41.0, 44.0, 48.0, 46.0, 50.0, 33.0, 54.0, 36.0, 36.0, 37.0, 39.0, 37.0, 24.0, 27.0, 34.0, 15.0, 21.0, 21.0, 14.0, 19.0, 13.0, 12.0, 13.0, 9.0, 5.0, 6.0, 2.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.7683515548706055, -5.592494010925293, -5.416636943817139, -5.240779876708984, -5.064922332763672, -4.889064788818359, -4.713207721710205, -4.537350654602051, -4.361493110656738, -4.185635566711426, -4.0097784996032715, -3.833921194076538, -3.6580638885498047, -3.4822065830230713, -3.306349277496338, -3.1304919719696045, -2.954634666442871, -2.7787773609161377, -2.6029200553894043, -2.427062749862671, -2.2512054443359375, -2.075348138809204, -1.8994908332824707, -1.7236335277557373, -1.547776222229004, -1.3719189167022705, -1.196061611175537, -1.0202043056488037, -0.8443470001220703, -0.6684896945953369, -0.4926323890686035, -0.3167750835418701, -0.14091777801513672, 0.03493952751159668, 0.21079683303833008, 0.3866541385650635, 0.5625114440917969, 0.7383687496185303, 0.9142260551452637, 1.090083360671997, 1.2659406661987305, 1.4417979717254639, 1.6176552772521973, 1.7935125827789307, 1.969369888305664, 2.1452271938323975, 2.321084499359131, 2.4969418048858643, 2.6727991104125977, 2.848656415939331, 3.0245137214660645, 3.200371026992798, 3.3762283325195312, 3.5520856380462646, 3.727942943572998, 3.9038002490997314, 4.079657554626465, 4.255515098571777, 4.431372165679932, 4.607229232788086, 4.783086776733398, 4.958944320678711, 5.134801387786865, 5.3106584548950195, 5.486515998840332]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 3.0, 6.0, 2.0, 6.0, 4.0, 8.0, 7.0, 17.0, 14.0, 29.0, 21.0, 28.0, 31.0, 27.0, 25.0, 32.0, 35.0, 36.0, 50.0, 27.0, 44.0, 37.0, 39.0, 48.0, 34.0, 39.0, 46.0, 33.0, 40.0, 23.0, 39.0, 35.0, 25.0, 17.0, 16.0, 15.0, 22.0, 11.0, 11.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.509216785430908, -6.32017183303833, -6.131126880645752, -5.942081451416016, -5.7530364990234375, -5.563991546630859, -5.374946594238281, -5.185901641845703, -4.996856689453125, -4.807811737060547, -4.618766784667969, -4.429721832275391, -4.240676403045654, -4.051631450653076, -3.862586498260498, -3.67354154586792, -3.4844961166381836, -3.2954511642456055, -3.1064059734344482, -2.91736102104187, -2.728315830230713, -2.5392708778381348, -2.3502259254455566, -2.1611809730529785, -1.9721357822418213, -1.7830907106399536, -1.594045639038086, -1.4050006866455078, -1.2159556150436401, -1.0269105434417725, -0.8378655910491943, -0.6488205194473267, -0.459775447845459, -0.2707304060459137, -0.08168536424636841, 0.10735964775085449, 0.29640471935272217, 0.48544979095458984, 0.674494743347168, 0.8635398149490356, 1.0525848865509033, 1.241629958152771, 1.4306750297546387, 1.6197199821472168, 1.8087650537490845, 1.9978101253509521, 2.1868550777435303, 2.3759002685546875, 2.5649452209472656, 2.7539901733398438, 2.943035364151001, 3.132080316543579, 3.3211255073547363, 3.5101704597473145, 3.6992154121398926, 3.8882603645324707, 4.077305793762207, 4.266350746154785, 4.455395698547363, 4.644440650939941, 4.833486080169678, 5.022531032562256, 5.211575984954834, 5.400620937347412, 5.58966588973999]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 4.0, 3.0, 12.0, 15.0, 37.0, 48.0, 83.0, 111.0, 156.0, 232.0, 320.0, 515.0, 741.0, 1249.0, 1942.0, 3121.0, 4914.0, 8151.0, 13503.0, 23342.0, 38986.0, 65457.0, 102804.0, 148938.0, 177780.0, 159231.0, 113739.0, 72447.0, 44429.0, 26482.0, 15408.0, 9193.0, 5611.0, 3529.0, 2085.0, 1365.0, 922.0, 530.0, 377.0, 254.0, 156.0, 102.0, 80.0, 54.0, 28.0, 20.0, 17.0, 13.0, 8.0, 2.0, 6.0, 2.0, 3.0], "bins": [-2.77734375, -2.699371337890625, -2.62139892578125, -2.543426513671875, -2.4654541015625, -2.387481689453125, -2.30950927734375, -2.231536865234375, -2.153564453125, -2.075592041015625, -1.99761962890625, -1.919647216796875, -1.8416748046875, -1.763702392578125, -1.68572998046875, -1.607757568359375, -1.52978515625, -1.451812744140625, -1.37384033203125, -1.295867919921875, -1.2178955078125, -1.139923095703125, -1.06195068359375, -0.983978271484375, -0.906005859375, -0.828033447265625, -0.75006103515625, -0.672088623046875, -0.5941162109375, -0.516143798828125, -0.43817138671875, -0.360198974609375, -0.2822265625, -0.204254150390625, -0.12628173828125, -0.048309326171875, 0.0296630859375, 0.107635498046875, 0.18560791015625, 0.263580322265625, 0.341552734375, 0.419525146484375, 0.49749755859375, 0.575469970703125, 0.6534423828125, 0.731414794921875, 0.80938720703125, 0.887359619140625, 0.96533203125, 1.043304443359375, 1.12127685546875, 1.199249267578125, 1.2772216796875, 1.355194091796875, 1.43316650390625, 1.511138916015625, 1.589111328125, 1.667083740234375, 1.74505615234375, 1.823028564453125, 1.9010009765625, 1.978973388671875, 2.05694580078125, 2.134918212890625, 2.212890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 3.0, 11.0, 19.0, 7.0, 12.0, 25.0, 26.0, 24.0, 23.0, 22.0, 28.0, 46.0, 47.0, 42.0, 38.0, 43.0, 38.0, 42.0, 45.0, 44.0, 40.0, 41.0, 40.0, 42.0, 36.0, 36.0, 30.0, 28.0, 22.0, 19.0, 13.0, 17.0, 11.0, 10.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-7.6171875, -7.4090576171875, -7.200927734375, -6.9927978515625, -6.78466796875, -6.5765380859375, -6.368408203125, -6.1602783203125, -5.9521484375, -5.7440185546875, -5.535888671875, -5.3277587890625, -5.11962890625, -4.9114990234375, -4.703369140625, -4.4952392578125, -4.287109375, -4.0789794921875, -3.870849609375, -3.6627197265625, -3.45458984375, -3.2464599609375, -3.038330078125, -2.8302001953125, -2.6220703125, -2.4139404296875, -2.205810546875, -1.9976806640625, -1.78955078125, -1.5814208984375, -1.373291015625, -1.1651611328125, -0.95703125, -0.7489013671875, -0.540771484375, -0.3326416015625, -0.12451171875, 0.0836181640625, 0.291748046875, 0.4998779296875, 0.7080078125, 0.9161376953125, 1.124267578125, 1.3323974609375, 1.54052734375, 1.7486572265625, 1.956787109375, 2.1649169921875, 2.373046875, 2.5811767578125, 2.789306640625, 2.9974365234375, 3.20556640625, 3.4136962890625, 3.621826171875, 3.8299560546875, 4.0380859375, 4.2462158203125, 4.454345703125, 4.6624755859375, 4.87060546875, 5.0787353515625, 5.286865234375, 5.4949951171875, 5.703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 13.0, 12.0, 24.0, 25.0, 47.0, 59.0, 63.0, 129.0, 193.0, 396.0, 724.0, 1621.0, 3937.0, 10298.0, 30547.0, 657716.0, 301257.0, 26046.0, 9003.0, 3449.0, 1407.0, 650.0, 322.0, 190.0, 127.0, 82.0, 55.0, 36.0, 25.0, 27.0, 14.0, 9.0, 12.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.27734375, -7.04205322265625, -6.8067626953125, -6.57147216796875, -6.336181640625, -6.10089111328125, -5.8656005859375, -5.63031005859375, -5.39501953125, -5.15972900390625, -4.9244384765625, -4.68914794921875, -4.453857421875, -4.21856689453125, -3.9832763671875, -3.74798583984375, -3.5126953125, -3.27740478515625, -3.0421142578125, -2.80682373046875, -2.571533203125, -2.33624267578125, -2.1009521484375, -1.86566162109375, -1.63037109375, -1.39508056640625, -1.1597900390625, -0.92449951171875, -0.689208984375, -0.45391845703125, -0.2186279296875, 0.01666259765625, 0.251953125, 0.48724365234375, 0.7225341796875, 0.95782470703125, 1.193115234375, 1.42840576171875, 1.6636962890625, 1.89898681640625, 2.13427734375, 2.36956787109375, 2.6048583984375, 2.84014892578125, 3.075439453125, 3.31072998046875, 3.5460205078125, 3.78131103515625, 4.0166015625, 4.25189208984375, 4.4871826171875, 4.72247314453125, 4.957763671875, 5.19305419921875, 5.4283447265625, 5.66363525390625, 5.89892578125, 6.13421630859375, 6.3695068359375, 6.60479736328125, 6.840087890625, 7.07537841796875, 7.3106689453125, 7.54595947265625, 7.78125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 6.0, 8.0, 13.0, 9.0, 10.0, 19.0, 17.0, 18.0, 23.0, 25.0, 30.0, 29.0, 32.0, 45.0, 33.0, 43.0, 33.0, 34.0, 44.0, 36.0, 48.0, 45.0, 33.0, 34.0, 38.0, 37.0, 23.0, 40.0, 22.0, 23.0, 27.0, 21.0, 11.0, 10.0, 12.0, 15.0, 6.0, 10.0, 4.0, 4.0, 6.0, 7.0, 6.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.0848388671875, -3.947021484375, -3.8092041015625, -3.67138671875, -3.5335693359375, -3.395751953125, -3.2579345703125, -3.1201171875, -2.9822998046875, -2.844482421875, -2.7066650390625, -2.56884765625, -2.4310302734375, -2.293212890625, -2.1553955078125, -2.017578125, -1.8797607421875, -1.741943359375, -1.6041259765625, -1.46630859375, -1.3284912109375, -1.190673828125, -1.0528564453125, -0.9150390625, -0.7772216796875, -0.639404296875, -0.5015869140625, -0.36376953125, -0.2259521484375, -0.088134765625, 0.0496826171875, 0.1875, 0.3253173828125, 0.463134765625, 0.6009521484375, 0.73876953125, 0.8765869140625, 1.014404296875, 1.1522216796875, 1.2900390625, 1.4278564453125, 1.565673828125, 1.7034912109375, 1.84130859375, 1.9791259765625, 2.116943359375, 2.2547607421875, 2.392578125, 2.5303955078125, 2.668212890625, 2.8060302734375, 2.94384765625, 3.0816650390625, 3.219482421875, 3.3572998046875, 3.4951171875, 3.6329345703125, 3.770751953125, 3.9085693359375, 4.04638671875, 4.1842041015625, 4.322021484375, 4.4598388671875, 4.59765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 5.0, 9.0, 9.0, 8.0, 28.0, 17.0, 32.0, 47.0, 52.0, 83.0, 125.0, 212.0, 309.0, 628.0, 1312.0, 2686.0, 6158.0, 14560.0, 38345.0, 781046.0, 158828.0, 25049.0, 10370.0, 4419.0, 1991.0, 939.0, 502.0, 277.0, 161.0, 112.0, 77.0, 33.0, 30.0, 24.0, 27.0, 10.0, 5.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95654296875, -0.9244461059570312, -0.8923492431640625, -0.8602523803710938, -0.828155517578125, -0.7960586547851562, -0.7639617919921875, -0.7318649291992188, -0.69976806640625, -0.6676712036132812, -0.6355743408203125, -0.6034774780273438, -0.571380615234375, -0.5392837524414062, -0.5071868896484375, -0.47509002685546875, -0.4429931640625, -0.41089630126953125, -0.3787994384765625, -0.34670257568359375, -0.314605712890625, -0.28250885009765625, -0.2504119873046875, -0.21831512451171875, -0.18621826171875, -0.15412139892578125, -0.1220245361328125, -0.08992767333984375, -0.057830810546875, -0.02573394775390625, 0.0063629150390625, 0.03845977783203125, 0.070556640625, 0.10265350341796875, 0.1347503662109375, 0.16684722900390625, 0.198944091796875, 0.23104095458984375, 0.2631378173828125, 0.29523468017578125, 0.32733154296875, 0.35942840576171875, 0.3915252685546875, 0.42362213134765625, 0.455718994140625, 0.48781585693359375, 0.5199127197265625, 0.5520095825195312, 0.5841064453125, 0.6162033081054688, 0.6483001708984375, 0.6803970336914062, 0.712493896484375, 0.7445907592773438, 0.7766876220703125, 0.8087844848632812, 0.84088134765625, 0.8729782104492188, 0.9050750732421875, 0.9371719360351562, 0.969268798828125, 1.0013656616210938, 1.0334625244140625, 1.0655593872070312, 1.09765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 18.0, 12.0, 21.0, 35.0, 32.0, 41.0, 54.0, 84.0, 62.0, 82.0, 63.0, 84.0, 58.0, 79.0, 49.0, 43.0, 31.0, 29.0, 30.0, 14.0, 12.0, 11.0, 10.0, 4.0, 8.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.37905502319336e-05, -7.163360714912415e-05, -6.94766640663147e-05, -6.731972098350525e-05, -6.51627779006958e-05, -6.300583481788635e-05, -6.0848891735076904e-05, -5.8691948652267456e-05, -5.653500556945801e-05, -5.437806248664856e-05, -5.222111940383911e-05, -5.006417632102966e-05, -4.7907233238220215e-05, -4.5750290155410767e-05, -4.359334707260132e-05, -4.143640398979187e-05, -3.927946090698242e-05, -3.7122517824172974e-05, -3.4965574741363525e-05, -3.280863165855408e-05, -3.065168857574463e-05, -2.849474549293518e-05, -2.6337802410125732e-05, -2.4180859327316284e-05, -2.2023916244506836e-05, -1.9866973161697388e-05, -1.771003007888794e-05, -1.555308699607849e-05, -1.3396143913269043e-05, -1.1239200830459595e-05, -9.082257747650146e-06, -6.925314664840698e-06, -4.76837158203125e-06, -2.6114284992218018e-06, -4.544854164123535e-07, 1.7024576663970947e-06, 3.859400749206543e-06, 6.016343832015991e-06, 8.17328691482544e-06, 1.0330229997634888e-05, 1.2487173080444336e-05, 1.4644116163253784e-05, 1.6801059246063232e-05, 1.895800232887268e-05, 2.111494541168213e-05, 2.3271888494491577e-05, 2.5428831577301025e-05, 2.7585774660110474e-05, 2.9742717742919922e-05, 3.189966082572937e-05, 3.405660390853882e-05, 3.6213546991348267e-05, 3.8370490074157715e-05, 4.052743315696716e-05, 4.268437623977661e-05, 4.484131932258606e-05, 4.699826240539551e-05, 4.9155205488204956e-05, 5.1312148571014404e-05, 5.346909165382385e-05, 5.56260347366333e-05, 5.778297781944275e-05, 5.99399209022522e-05, 6.209686398506165e-05, 6.42538070678711e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 13.0, 18.0, 25.0, 42.0, 63.0, 93.0, 159.0, 201.0, 312.0, 465.0, 729.0, 1070.0, 1611.0, 2406.0, 3834.0, 5670.0, 8650.0, 13456.0, 21308.0, 32770.0, 50227.0, 76584.0, 111685.0, 149653.0, 158867.0, 133180.0, 95138.0, 63476.0, 41421.0, 26534.0, 16986.0, 10904.0, 7268.0, 4517.0, 3109.0, 1946.0, 1409.0, 909.0, 588.0, 385.0, 288.0, 207.0, 136.0, 90.0, 61.0, 20.0, 27.0, 10.0, 9.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.64501953125, -0.625030517578125, -0.60504150390625, -0.585052490234375, -0.5650634765625, -0.545074462890625, -0.52508544921875, -0.505096435546875, -0.485107421875, -0.465118408203125, -0.44512939453125, -0.425140380859375, -0.4051513671875, -0.385162353515625, -0.36517333984375, -0.345184326171875, -0.3251953125, -0.305206298828125, -0.28521728515625, -0.265228271484375, -0.2452392578125, -0.225250244140625, -0.20526123046875, -0.185272216796875, -0.165283203125, -0.145294189453125, -0.12530517578125, -0.105316162109375, -0.0853271484375, -0.065338134765625, -0.04534912109375, -0.025360107421875, -0.00537109375, 0.014617919921875, 0.03460693359375, 0.054595947265625, 0.0745849609375, 0.094573974609375, 0.11456298828125, 0.134552001953125, 0.154541015625, 0.174530029296875, 0.19451904296875, 0.214508056640625, 0.2344970703125, 0.254486083984375, 0.27447509765625, 0.294464111328125, 0.314453125, 0.334442138671875, 0.35443115234375, 0.374420166015625, 0.3944091796875, 0.414398193359375, 0.43438720703125, 0.454376220703125, 0.474365234375, 0.494354248046875, 0.51434326171875, 0.534332275390625, 0.5543212890625, 0.574310302734375, 0.59429931640625, 0.614288330078125, 0.63427734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 6.0, 5.0, 3.0, 6.0, 11.0, 10.0, 25.0, 15.0, 16.0, 33.0, 22.0, 26.0, 37.0, 34.0, 53.0, 66.0, 57.0, 58.0, 54.0, 61.0, 67.0, 58.0, 43.0, 45.0, 34.0, 32.0, 16.0, 17.0, 13.0, 15.0, 9.0, 8.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 8.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2386474609375, -0.2302074432373047, -0.22176742553710938, -0.21332740783691406, -0.20488739013671875, -0.19644737243652344, -0.18800735473632812, -0.1795673370361328, -0.1711273193359375, -0.1626873016357422, -0.15424728393554688, -0.14580726623535156, -0.13736724853515625, -0.12892723083496094, -0.12048721313476562, -0.11204719543457031, -0.103607177734375, -0.09516716003417969, -0.08672714233398438, -0.07828712463378906, -0.06984710693359375, -0.06140708923339844, -0.052967071533203125, -0.04452705383300781, -0.0360870361328125, -0.027647018432617188, -0.019207000732421875, -0.010766983032226562, -0.00232696533203125, 0.0061130523681640625, 0.014553070068359375, 0.022993087768554688, 0.03143310546875, 0.03987312316894531, 0.048313140869140625, 0.05675315856933594, 0.06519317626953125, 0.07363319396972656, 0.08207321166992188, 0.09051322937011719, 0.0989532470703125, 0.10739326477050781, 0.11583328247070312, 0.12427330017089844, 0.13271331787109375, 0.14115333557128906, 0.14959335327148438, 0.1580333709716797, 0.166473388671875, 0.1749134063720703, 0.18335342407226562, 0.19179344177246094, 0.20023345947265625, 0.20867347717285156, 0.21711349487304688, 0.2255535125732422, 0.2339935302734375, 0.2424335479736328, 0.2508735656738281, 0.25931358337402344, 0.26775360107421875, 0.27619361877441406, 0.2846336364746094, 0.2930736541748047, 0.301513671875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 5.0, 5.0, 7.0, 6.0, 9.0, 7.0, 12.0, 14.0, 20.0, 18.0, 16.0, 22.0, 22.0, 23.0, 25.0, 30.0, 32.0, 40.0, 43.0, 49.0, 45.0, 37.0, 35.0, 48.0, 40.0, 32.0, 34.0, 40.0, 31.0, 25.0, 34.0, 18.0, 27.0, 22.0, 14.0, 16.0, 16.0, 17.0, 12.0, 15.0, 6.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.479739189147949, -5.315057277679443, -5.150375843048096, -4.98569393157959, -4.821012020111084, -4.656330108642578, -4.4916486740112305, -4.326966762542725, -4.162284851074219, -3.997603178024292, -3.832921266555786, -3.6682395935058594, -3.5035576820373535, -3.3388760089874268, -3.1741943359375, -3.009512424468994, -2.8448309898376465, -2.6801493167877197, -2.515467405319214, -2.350785732269287, -2.1861038208007812, -2.0214221477508545, -1.8567404747009277, -1.6920586824417114, -1.5273768901824951, -1.3626950979232788, -1.1980133056640625, -1.0333316326141357, -0.8686498403549194, -0.7039680480957031, -0.5392863154411316, -0.37460458278656006, -0.20992231369018555, -0.045240551233291626, 0.1194412112236023, 0.2841229736804962, 0.44880473613739014, 0.6134865283966064, 0.778168261051178, 0.9428499937057495, 1.1075317859649658, 1.2722135782241821, 1.4368953704833984, 1.6015770435333252, 1.7662588357925415, 1.9309406280517578, 2.0956223011016846, 2.2603039741516113, 2.424985885620117, 2.589667558670044, 2.75434947013855, 2.9190311431884766, 3.0837130546569824, 3.248394727706909, 3.413076400756836, 3.577758312225342, 3.7424399852752686, 3.9071216583251953, 4.071803569793701, 4.236485481262207, 4.401166915893555, 4.5658488273620605, 4.730530738830566, 4.895212173461914, 5.05989408493042]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 4.0, 3.0, 6.0, 7.0, 9.0, 16.0, 15.0, 27.0, 26.0, 26.0, 22.0, 36.0, 20.0, 26.0, 39.0, 36.0, 43.0, 35.0, 44.0, 35.0, 36.0, 48.0, 36.0, 34.0, 46.0, 38.0, 29.0, 37.0, 30.0, 37.0, 21.0, 21.0, 20.0, 13.0, 21.0, 13.0, 11.0, 7.0, 8.0, 7.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-6.290111541748047, -6.106261730194092, -5.922411918640137, -5.738562107086182, -5.554712295532227, -5.3708624839782715, -5.187012672424316, -5.0031633377075195, -4.819313049316406, -4.635463237762451, -4.451613426208496, -4.267763614654541, -4.083913803100586, -3.900063991546631, -3.716214418411255, -3.5323646068573, -3.348515033721924, -3.1646652221679688, -2.9808154106140137, -2.7969655990600586, -2.6131157875061035, -2.4292659759521484, -2.2454164028167725, -2.0615665912628174, -1.8777167797088623, -1.6938669681549072, -1.5100171566009521, -1.3261674642562866, -1.1423176527023315, -0.9584678411483765, -0.7746181488037109, -0.5907683372497559, -0.4069185256958008, -0.2230687439441681, -0.0392189621925354, 0.1446307897567749, 0.32848060131073, 0.5123304128646851, 0.6961801052093506, 0.8800299167633057, 1.0638797283172607, 1.2477295398712158, 1.431579351425171, 1.6154290437698364, 1.7992788553237915, 1.9831286668777466, 2.166978359222412, 2.350828170776367, 2.5346779823303223, 2.7185277938842773, 2.9023776054382324, 3.0862274169921875, 3.2700772285461426, 3.4539270401000977, 3.6377766132354736, 3.8216264247894287, 4.005475997924805, 4.18932580947876, 4.373175621032715, 4.55702543258667, 4.740875244140625, 4.92472505569458, 5.108574867248535, 5.292424201965332, 5.476274490356445]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 9.0, 7.0, 22.0, 33.0, 63.0, 102.0, 135.0, 237.0, 328.0, 590.0, 832.0, 1337.0, 1924.0, 2941.0, 4205.0, 6309.0, 9201.0, 12558.0, 17892.0, 24148.0, 32070.0, 41010.0, 50865.0, 61669.0, 71577.0, 80015.0, 83360.0, 85203.0, 82441.0, 75622.0, 66344.0, 56545.0, 45746.0, 36345.0, 27795.0, 20395.0, 15019.0, 10698.0, 7415.0, 5143.0, 3496.0, 2374.0, 1581.0, 1043.0, 689.0, 463.0, 283.0, 190.0, 108.0, 71.0, 50.0, 25.0, 15.0, 8.0, 9.0, 3.0, 6.0, 1.0, 1.0], "bins": [-3.78125, -3.663970947265625, -3.54669189453125, -3.429412841796875, -3.3121337890625, -3.194854736328125, -3.07757568359375, -2.960296630859375, -2.843017578125, -2.725738525390625, -2.60845947265625, -2.491180419921875, -2.3739013671875, -2.256622314453125, -2.13934326171875, -2.022064208984375, -1.90478515625, -1.787506103515625, -1.67022705078125, -1.552947998046875, -1.4356689453125, -1.318389892578125, -1.20111083984375, -1.083831787109375, -0.966552734375, -0.849273681640625, -0.73199462890625, -0.614715576171875, -0.4974365234375, -0.380157470703125, -0.26287841796875, -0.145599365234375, -0.0283203125, 0.088958740234375, 0.20623779296875, 0.323516845703125, 0.4407958984375, 0.558074951171875, 0.67535400390625, 0.792633056640625, 0.909912109375, 1.027191162109375, 1.14447021484375, 1.261749267578125, 1.3790283203125, 1.496307373046875, 1.61358642578125, 1.730865478515625, 1.84814453125, 1.965423583984375, 2.08270263671875, 2.199981689453125, 2.3172607421875, 2.434539794921875, 2.55181884765625, 2.669097900390625, 2.786376953125, 2.903656005859375, 3.02093505859375, 3.138214111328125, 3.2554931640625, 3.372772216796875, 3.49005126953125, 3.607330322265625, 3.724609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 10.0, 14.0, 23.0, 13.0, 19.0, 22.0, 21.0, 27.0, 29.0, 26.0, 28.0, 27.0, 28.0, 33.0, 35.0, 36.0, 45.0, 39.0, 44.0, 42.0, 29.0, 34.0, 38.0, 38.0, 35.0, 29.0, 33.0, 23.0, 23.0, 31.0, 18.0, 14.0, 22.0, 11.0, 12.0, 9.0, 9.0, 5.0, 6.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.94921875, -5.7694091796875, -5.589599609375, -5.4097900390625, -5.22998046875, -5.0501708984375, -4.870361328125, -4.6905517578125, -4.5107421875, -4.3309326171875, -4.151123046875, -3.9713134765625, -3.79150390625, -3.6116943359375, -3.431884765625, -3.2520751953125, -3.072265625, -2.8924560546875, -2.712646484375, -2.5328369140625, -2.35302734375, -2.1732177734375, -1.993408203125, -1.8135986328125, -1.6337890625, -1.4539794921875, -1.274169921875, -1.0943603515625, -0.91455078125, -0.7347412109375, -0.554931640625, -0.3751220703125, -0.1953125, -0.0155029296875, 0.164306640625, 0.3441162109375, 0.52392578125, 0.7037353515625, 0.883544921875, 1.0633544921875, 1.2431640625, 1.4229736328125, 1.602783203125, 1.7825927734375, 1.96240234375, 2.1422119140625, 2.322021484375, 2.5018310546875, 2.681640625, 2.8614501953125, 3.041259765625, 3.2210693359375, 3.40087890625, 3.5806884765625, 3.760498046875, 3.9403076171875, 4.1201171875, 4.2999267578125, 4.479736328125, 4.6595458984375, 4.83935546875, 5.0191650390625, 5.198974609375, 5.3787841796875, 5.55859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 6.0, 16.0, 22.0, 38.0, 57.0, 77.0, 110.0, 175.0, 299.0, 424.0, 674.0, 984.0, 1491.0, 2252.0, 3415.0, 4993.0, 7737.0, 11043.0, 15940.0, 22290.0, 30193.0, 40864.0, 52453.0, 65242.0, 77314.0, 86425.0, 91998.0, 92617.0, 87487.0, 79168.0, 67215.0, 54704.0, 42645.0, 32093.0, 23330.0, 16777.0, 11490.0, 8125.0, 5489.0, 3752.0, 2418.0, 1603.0, 1073.0, 694.0, 464.0, 325.0, 229.0, 129.0, 77.0, 39.0, 40.0, 24.0, 13.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.71875, -4.5618896484375, -4.405029296875, -4.2481689453125, -4.09130859375, -3.9344482421875, -3.777587890625, -3.6207275390625, -3.4638671875, -3.3070068359375, -3.150146484375, -2.9932861328125, -2.83642578125, -2.6795654296875, -2.522705078125, -2.3658447265625, -2.208984375, -2.0521240234375, -1.895263671875, -1.7384033203125, -1.58154296875, -1.4246826171875, -1.267822265625, -1.1109619140625, -0.9541015625, -0.7972412109375, -0.640380859375, -0.4835205078125, -0.32666015625, -0.1697998046875, -0.012939453125, 0.1439208984375, 0.30078125, 0.4576416015625, 0.614501953125, 0.7713623046875, 0.92822265625, 1.0850830078125, 1.241943359375, 1.3988037109375, 1.5556640625, 1.7125244140625, 1.869384765625, 2.0262451171875, 2.18310546875, 2.3399658203125, 2.496826171875, 2.6536865234375, 2.810546875, 2.9674072265625, 3.124267578125, 3.2811279296875, 3.43798828125, 3.5948486328125, 3.751708984375, 3.9085693359375, 4.0654296875, 4.2222900390625, 4.379150390625, 4.5360107421875, 4.69287109375, 4.8497314453125, 5.006591796875, 5.1634521484375, 5.3203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 10.0, 6.0, 11.0, 18.0, 8.0, 17.0, 16.0, 16.0, 15.0, 29.0, 31.0, 38.0, 36.0, 32.0, 36.0, 35.0, 40.0, 41.0, 51.0, 46.0, 49.0, 45.0, 34.0, 35.0, 27.0, 37.0, 46.0, 28.0, 25.0, 24.0, 20.0, 16.0, 20.0, 13.0, 11.0, 12.0, 6.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.923828125, -3.799591064453125, -3.67535400390625, -3.551116943359375, -3.4268798828125, -3.302642822265625, -3.17840576171875, -3.054168701171875, -2.929931640625, -2.805694580078125, -2.68145751953125, -2.557220458984375, -2.4329833984375, -2.308746337890625, -2.18450927734375, -2.060272216796875, -1.93603515625, -1.811798095703125, -1.68756103515625, -1.563323974609375, -1.4390869140625, -1.314849853515625, -1.19061279296875, -1.066375732421875, -0.942138671875, -0.817901611328125, -0.69366455078125, -0.569427490234375, -0.4451904296875, -0.320953369140625, -0.19671630859375, -0.072479248046875, 0.0517578125, 0.175994873046875, 0.30023193359375, 0.424468994140625, 0.5487060546875, 0.672943115234375, 0.79718017578125, 0.921417236328125, 1.045654296875, 1.169891357421875, 1.29412841796875, 1.418365478515625, 1.5426025390625, 1.666839599609375, 1.79107666015625, 1.915313720703125, 2.03955078125, 2.163787841796875, 2.28802490234375, 2.412261962890625, 2.5364990234375, 2.660736083984375, 2.78497314453125, 2.909210205078125, 3.033447265625, 3.157684326171875, 3.28192138671875, 3.406158447265625, 3.5303955078125, 3.654632568359375, 3.77886962890625, 3.903106689453125, 4.02734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 4.0, 21.0, 15.0, 39.0, 46.0, 76.0, 123.0, 215.0, 371.0, 635.0, 1047.0, 1855.0, 3242.0, 5511.0, 9425.0, 15599.0, 26261.0, 41312.0, 63442.0, 88980.0, 115986.0, 133644.0, 135575.0, 120627.0, 96641.0, 69235.0, 46206.0, 29159.0, 18000.0, 10477.0, 6210.0, 3541.0, 2037.0, 1177.0, 755.0, 437.0, 253.0, 146.0, 94.0, 58.0, 36.0, 13.0, 14.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.853515625, -1.795806884765625, -1.73809814453125, -1.680389404296875, -1.6226806640625, -1.564971923828125, -1.50726318359375, -1.449554443359375, -1.391845703125, -1.334136962890625, -1.27642822265625, -1.218719482421875, -1.1610107421875, -1.103302001953125, -1.04559326171875, -0.987884521484375, -0.93017578125, -0.872467041015625, -0.81475830078125, -0.757049560546875, -0.6993408203125, -0.641632080078125, -0.58392333984375, -0.526214599609375, -0.468505859375, -0.410797119140625, -0.35308837890625, -0.295379638671875, -0.2376708984375, -0.179962158203125, -0.12225341796875, -0.064544677734375, -0.0068359375, 0.050872802734375, 0.10858154296875, 0.166290283203125, 0.2239990234375, 0.281707763671875, 0.33941650390625, 0.397125244140625, 0.454833984375, 0.512542724609375, 0.57025146484375, 0.627960205078125, 0.6856689453125, 0.743377685546875, 0.80108642578125, 0.858795166015625, 0.91650390625, 0.974212646484375, 1.03192138671875, 1.089630126953125, 1.1473388671875, 1.205047607421875, 1.26275634765625, 1.320465087890625, 1.378173828125, 1.435882568359375, 1.49359130859375, 1.551300048828125, 1.6090087890625, 1.666717529296875, 1.72442626953125, 1.782135009765625, 1.83984375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 6.0, 6.0, 8.0, 10.0, 15.0, 21.0, 29.0, 28.0, 38.0, 43.0, 39.0, 40.0, 34.0, 63.0, 65.0, 57.0, 76.0, 55.0, 54.0, 70.0, 29.0, 49.0, 32.0, 20.0, 20.0, 22.0, 13.0, 16.0, 9.0, 13.0, 7.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00025010108947753906, -0.0002415291965007782, -0.00023295730352401733, -0.00022438541054725647, -0.0002158135175704956, -0.00020724162459373474, -0.00019866973161697388, -0.000190097838640213, -0.00018152594566345215, -0.00017295405268669128, -0.00016438215970993042, -0.00015581026673316956, -0.0001472383737564087, -0.00013866648077964783, -0.00013009458780288696, -0.0001215226948261261, -0.00011295080184936523, -0.00010437890887260437, -9.58070158958435e-05, -8.723512291908264e-05, -7.866322994232178e-05, -7.009133696556091e-05, -6.151944398880005e-05, -5.2947551012039185e-05, -4.437565803527832e-05, -3.5803765058517456e-05, -2.7231872081756592e-05, -1.8659979104995728e-05, -1.0088086128234863e-05, -1.516193151473999e-06, 7.055699825286865e-06, 1.562759280204773e-05, 2.4199485778808594e-05, 3.277137875556946e-05, 4.134327173233032e-05, 4.9915164709091187e-05, 5.848705768585205e-05, 6.705895066261292e-05, 7.563084363937378e-05, 8.420273661613464e-05, 9.277462959289551e-05, 0.00010134652256965637, 0.00010991841554641724, 0.0001184903085231781, 0.00012706220149993896, 0.00013563409447669983, 0.0001442059874534607, 0.00015277788043022156, 0.00016134977340698242, 0.00016992166638374329, 0.00017849355936050415, 0.00018706545233726501, 0.00019563734531402588, 0.00020420923829078674, 0.0002127811312675476, 0.00022135302424430847, 0.00022992491722106934, 0.0002384968101978302, 0.00024706870317459106, 0.00025564059615135193, 0.0002642124891281128, 0.00027278438210487366, 0.0002813562750816345, 0.0002899281680583954, 0.00029850006103515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 5.0, 11.0, 12.0, 18.0, 34.0, 35.0, 74.0, 127.0, 208.0, 306.0, 513.0, 776.0, 1239.0, 1954.0, 3132.0, 4980.0, 7820.0, 12407.0, 19257.0, 28652.0, 41544.0, 58146.0, 76219.0, 93717.0, 108409.0, 113129.0, 110268.0, 96412.0, 78703.0, 60183.0, 43663.0, 30114.0, 20248.0, 13363.0, 8466.0, 5323.0, 3384.0, 2175.0, 1338.0, 797.0, 493.0, 351.0, 186.0, 143.0, 88.0, 48.0, 32.0, 28.0, 15.0, 11.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.4091796875, -1.3615264892578125, -1.313873291015625, -1.2662200927734375, -1.21856689453125, -1.1709136962890625, -1.123260498046875, -1.0756072998046875, -1.0279541015625, -0.9803009033203125, -0.932647705078125, -0.8849945068359375, -0.83734130859375, -0.7896881103515625, -0.742034912109375, -0.6943817138671875, -0.646728515625, -0.5990753173828125, -0.551422119140625, -0.5037689208984375, -0.45611572265625, -0.4084625244140625, -0.360809326171875, -0.3131561279296875, -0.2655029296875, -0.2178497314453125, -0.170196533203125, -0.1225433349609375, -0.07489013671875, -0.0272369384765625, 0.020416259765625, 0.0680694580078125, 0.11572265625, 0.1633758544921875, 0.211029052734375, 0.2586822509765625, 0.30633544921875, 0.3539886474609375, 0.401641845703125, 0.4492950439453125, 0.4969482421875, 0.5446014404296875, 0.592254638671875, 0.6399078369140625, 0.68756103515625, 0.7352142333984375, 0.782867431640625, 0.8305206298828125, 0.878173828125, 0.9258270263671875, 0.973480224609375, 1.0211334228515625, 1.06878662109375, 1.1164398193359375, 1.164093017578125, 1.2117462158203125, 1.2593994140625, 1.3070526123046875, 1.354705810546875, 1.4023590087890625, 1.45001220703125, 1.4976654052734375, 1.545318603515625, 1.5929718017578125, 1.640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 5.0, 8.0, 7.0, 7.0, 15.0, 10.0, 13.0, 25.0, 23.0, 30.0, 33.0, 26.0, 27.0, 40.0, 36.0, 49.0, 35.0, 44.0, 29.0, 44.0, 46.0, 40.0, 43.0, 44.0, 39.0, 25.0, 34.0, 31.0, 24.0, 21.0, 20.0, 20.0, 7.0, 18.0, 13.0, 11.0, 10.0, 8.0, 6.0, 3.0, 6.0, 2.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.69970703125, -0.6800460815429688, -0.6603851318359375, -0.6407241821289062, -0.621063232421875, -0.6014022827148438, -0.5817413330078125, -0.5620803833007812, -0.54241943359375, -0.5227584838867188, -0.5030975341796875, -0.48343658447265625, -0.463775634765625, -0.44411468505859375, -0.4244537353515625, -0.40479278564453125, -0.3851318359375, -0.36547088623046875, -0.3458099365234375, -0.32614898681640625, -0.306488037109375, -0.28682708740234375, -0.2671661376953125, -0.24750518798828125, -0.22784423828125, -0.20818328857421875, -0.1885223388671875, -0.16886138916015625, -0.149200439453125, -0.12953948974609375, -0.1098785400390625, -0.09021759033203125, -0.070556640625, -0.05089569091796875, -0.0312347412109375, -0.01157379150390625, 0.008087158203125, 0.02774810791015625, 0.0474090576171875, 0.06707000732421875, 0.08673095703125, 0.10639190673828125, 0.1260528564453125, 0.14571380615234375, 0.165374755859375, 0.18503570556640625, 0.2046966552734375, 0.22435760498046875, 0.2440185546875, 0.26367950439453125, 0.2833404541015625, 0.30300140380859375, 0.322662353515625, 0.34232330322265625, 0.3619842529296875, 0.38164520263671875, 0.40130615234375, 0.42096710205078125, 0.4406280517578125, 0.46028900146484375, 0.479949951171875, 0.49961090087890625, 0.5192718505859375, 0.5389328002929688, 0.55859375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 5.0, 11.0, 8.0, 11.0, 12.0, 18.0, 19.0, 27.0, 9.0, 20.0, 29.0, 27.0, 31.0, 25.0, 39.0, 39.0, 49.0, 47.0, 40.0, 31.0, 48.0, 46.0, 33.0, 41.0, 34.0, 48.0, 40.0, 24.0, 37.0, 25.0, 16.0, 18.0, 13.0, 18.0, 10.0, 10.0, 8.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.98337459564209, -5.800719261169434, -5.6180644035339355, -5.4354095458984375, -5.252754211425781, -5.070098876953125, -4.887444019317627, -4.704789161682129, -4.522133827209473, -4.339478492736816, -4.156823635101318, -3.974168539047241, -3.791513442993164, -3.608858346939087, -3.4262032508850098, -3.2435481548309326, -3.0608930587768555, -2.8782379627227783, -2.695582866668701, -2.512927770614624, -2.330272674560547, -2.1476175785064697, -1.9649624824523926, -1.7823073863983154, -1.5996522903442383, -1.4169971942901611, -1.234342098236084, -1.0516870021820068, -0.8690319061279297, -0.6863768100738525, -0.5037217140197754, -0.32106661796569824, -0.1384119987487793, 0.04424309730529785, 0.226898193359375, 0.40955328941345215, 0.5922083854675293, 0.7748634815216064, 0.9575185775756836, 1.1401736736297607, 1.322828769683838, 1.505483865737915, 1.6881389617919922, 1.8707940578460693, 2.0534491539001465, 2.2361042499542236, 2.418759346008301, 2.601414442062378, 2.784069538116455, 2.9667246341705322, 3.1493797302246094, 3.3320348262786865, 3.5146899223327637, 3.697345018386841, 3.880000114440918, 4.062655448913574, 4.245310306549072, 4.42796516418457, 4.610620498657227, 4.793275833129883, 4.975930690765381, 5.158585548400879, 5.341240882873535, 5.523896217346191, 5.7065510749816895]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 8.0, 13.0, 9.0, 7.0, 9.0, 16.0, 14.0, 23.0, 16.0, 26.0, 26.0, 27.0, 31.0, 25.0, 28.0, 33.0, 43.0, 37.0, 35.0, 33.0, 42.0, 34.0, 30.0, 32.0, 38.0, 38.0, 37.0, 35.0, 27.0, 39.0, 27.0, 25.0, 21.0, 12.0, 12.0, 12.0, 14.0, 13.0, 3.0, 9.0, 4.0, 5.0, 9.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0], "bins": [-5.853611469268799, -5.679995536804199, -5.5063796043396, -5.332763671875, -5.1591477394104, -4.985531806945801, -4.811915874481201, -4.638299942016602, -4.464684009552002, -4.291068077087402, -4.117452144622803, -3.943836212158203, -3.7702202796936035, -3.596604347229004, -3.4229884147644043, -3.2493724822998047, -3.075756549835205, -2.9021406173706055, -2.728524684906006, -2.5549087524414062, -2.3812928199768066, -2.207676887512207, -2.0340609550476074, -1.8604450225830078, -1.6868290901184082, -1.5132131576538086, -1.339597225189209, -1.1659812927246094, -0.9923653602600098, -0.8187494277954102, -0.6451334953308105, -0.47151756286621094, -0.29790210723876953, -0.12428617477416992, 0.04932975769042969, 0.2229456901550293, 0.3965616226196289, 0.5701775550842285, 0.7437934875488281, 0.9174094200134277, 1.0910253524780273, 1.264641284942627, 1.4382572174072266, 1.6118731498718262, 1.7854890823364258, 1.9591050148010254, 2.132720947265625, 2.3063368797302246, 2.479952812194824, 2.653568744659424, 2.8271846771240234, 3.000800609588623, 3.1744165420532227, 3.3480324745178223, 3.521648406982422, 3.6952643394470215, 3.868880271911621, 4.042496204376221, 4.21611213684082, 4.38972806930542, 4.5633440017700195, 4.736959934234619, 4.910575866699219, 5.084191799163818, 5.257807731628418]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 18.0, 12.0, 35.0, 50.0, 61.0, 124.0, 168.0, 301.0, 456.0, 690.0, 1118.0, 1874.0, 2963.0, 4837.0, 8021.0, 13156.0, 21114.0, 35078.0, 57500.0, 93202.0, 147593.0, 231835.0, 348101.0, 477223.0, 575470.0, 588448.0, 506452.0, 379331.0, 258825.0, 167850.0, 105097.0, 64542.0, 40111.0, 24482.0, 14845.0, 8986.0, 5569.0, 3293.0, 2018.0, 1257.0, 786.0, 509.0, 318.0, 208.0, 127.0, 84.0, 53.0, 37.0, 22.0, 10.0, 11.0, 8.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.79022216796875, -4.6312255859375, -4.47222900390625, -4.313232421875, -4.15423583984375, -3.9952392578125, -3.83624267578125, -3.67724609375, -3.51824951171875, -3.3592529296875, -3.20025634765625, -3.041259765625, -2.88226318359375, -2.7232666015625, -2.56427001953125, -2.4052734375, -2.24627685546875, -2.0872802734375, -1.92828369140625, -1.769287109375, -1.61029052734375, -1.4512939453125, -1.29229736328125, -1.13330078125, -0.97430419921875, -0.8153076171875, -0.65631103515625, -0.497314453125, -0.33831787109375, -0.1793212890625, -0.02032470703125, 0.138671875, 0.29766845703125, 0.4566650390625, 0.61566162109375, 0.774658203125, 0.93365478515625, 1.0926513671875, 1.25164794921875, 1.41064453125, 1.56964111328125, 1.7286376953125, 1.88763427734375, 2.046630859375, 2.20562744140625, 2.3646240234375, 2.52362060546875, 2.6826171875, 2.84161376953125, 3.0006103515625, 3.15960693359375, 3.318603515625, 3.47760009765625, 3.6365966796875, 3.79559326171875, 3.95458984375, 4.11358642578125, 4.2725830078125, 4.43157958984375, 4.590576171875, 4.74957275390625, 4.9085693359375, 5.06756591796875, 5.2265625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 4.0, 2.0, 3.0, 10.0, 6.0, 11.0, 7.0, 20.0, 11.0, 18.0, 28.0, 15.0, 24.0, 18.0, 31.0, 31.0, 27.0, 27.0, 43.0, 38.0, 40.0, 33.0, 36.0, 30.0, 43.0, 37.0, 31.0, 33.0, 44.0, 30.0, 32.0, 31.0, 31.0, 22.0, 17.0, 30.0, 19.0, 5.0, 13.0, 8.0, 13.0, 2.0, 6.0, 12.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0], "bins": [-4.9140625, -4.76434326171875, -4.6146240234375, -4.46490478515625, -4.315185546875, -4.16546630859375, -4.0157470703125, -3.86602783203125, -3.71630859375, -3.56658935546875, -3.4168701171875, -3.26715087890625, -3.117431640625, -2.96771240234375, -2.8179931640625, -2.66827392578125, -2.5185546875, -2.36883544921875, -2.2191162109375, -2.06939697265625, -1.919677734375, -1.76995849609375, -1.6202392578125, -1.47052001953125, -1.32080078125, -1.17108154296875, -1.0213623046875, -0.87164306640625, -0.721923828125, -0.57220458984375, -0.4224853515625, -0.27276611328125, -0.123046875, 0.02667236328125, 0.1763916015625, 0.32611083984375, 0.475830078125, 0.62554931640625, 0.7752685546875, 0.92498779296875, 1.07470703125, 1.22442626953125, 1.3741455078125, 1.52386474609375, 1.673583984375, 1.82330322265625, 1.9730224609375, 2.12274169921875, 2.2724609375, 2.42218017578125, 2.5718994140625, 2.72161865234375, 2.871337890625, 3.02105712890625, 3.1707763671875, 3.32049560546875, 3.47021484375, 3.61993408203125, 3.7696533203125, 3.91937255859375, 4.069091796875, 4.21881103515625, 4.3685302734375, 4.51824951171875, 4.66796875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 11.0, 11.0, 18.0, 24.0, 38.0, 54.0, 88.0, 133.0, 238.0, 400.0, 652.0, 1107.0, 1865.0, 3185.0, 5335.0, 9336.0, 16677.0, 28663.0, 49058.0, 83321.0, 139945.0, 224787.0, 341310.0, 478825.0, 590086.0, 613491.0, 529014.0, 394323.0, 265385.0, 169622.0, 102457.0, 60764.0, 35521.0, 20462.0, 11712.0, 6876.0, 3941.0, 2256.0, 1379.0, 750.0, 457.0, 270.0, 170.0, 111.0, 65.0, 32.0, 15.0, 21.0, 5.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.375, -5.20269775390625, -5.0303955078125, -4.85809326171875, -4.685791015625, -4.51348876953125, -4.3411865234375, -4.16888427734375, -3.99658203125, -3.82427978515625, -3.6519775390625, -3.47967529296875, -3.307373046875, -3.13507080078125, -2.9627685546875, -2.79046630859375, -2.6181640625, -2.44586181640625, -2.2735595703125, -2.10125732421875, -1.928955078125, -1.75665283203125, -1.5843505859375, -1.41204833984375, -1.23974609375, -1.06744384765625, -0.8951416015625, -0.72283935546875, -0.550537109375, -0.37823486328125, -0.2059326171875, -0.03363037109375, 0.138671875, 0.31097412109375, 0.4832763671875, 0.65557861328125, 0.827880859375, 1.00018310546875, 1.1724853515625, 1.34478759765625, 1.51708984375, 1.68939208984375, 1.8616943359375, 2.03399658203125, 2.206298828125, 2.37860107421875, 2.5509033203125, 2.72320556640625, 2.8955078125, 3.06781005859375, 3.2401123046875, 3.41241455078125, 3.584716796875, 3.75701904296875, 3.9293212890625, 4.10162353515625, 4.27392578125, 4.44622802734375, 4.6185302734375, 4.79083251953125, 4.963134765625, 5.13543701171875, 5.3077392578125, 5.48004150390625, 5.65234375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 8.0, 10.0, 13.0, 19.0, 22.0, 36.0, 33.0, 60.0, 48.0, 78.0, 66.0, 85.0, 123.0, 125.0, 162.0, 136.0, 170.0, 167.0, 193.0, 214.0, 222.0, 214.0, 192.0, 217.0, 178.0, 173.0, 154.0, 117.0, 125.0, 110.0, 114.0, 87.0, 89.0, 64.0, 50.0, 38.0, 28.0, 21.0, 28.0, 16.0, 14.0, 3.0, 9.0, 10.0, 5.0, 3.0, 3.0, 3.0, 5.0, 1.0], "bins": [-2.2890625, -2.2235870361328125, -2.158111572265625, -2.0926361083984375, -2.02716064453125, -1.9616851806640625, -1.896209716796875, -1.8307342529296875, -1.7652587890625, -1.6997833251953125, -1.634307861328125, -1.5688323974609375, -1.50335693359375, -1.4378814697265625, -1.372406005859375, -1.3069305419921875, -1.241455078125, -1.1759796142578125, -1.110504150390625, -1.0450286865234375, -0.97955322265625, -0.9140777587890625, -0.848602294921875, -0.7831268310546875, -0.7176513671875, -0.6521759033203125, -0.586700439453125, -0.5212249755859375, -0.45574951171875, -0.3902740478515625, -0.324798583984375, -0.2593231201171875, -0.19384765625, -0.1283721923828125, -0.062896728515625, 0.0025787353515625, 0.06805419921875, 0.1335296630859375, 0.199005126953125, 0.2644805908203125, 0.3299560546875, 0.3954315185546875, 0.460906982421875, 0.5263824462890625, 0.59185791015625, 0.6573333740234375, 0.722808837890625, 0.7882843017578125, 0.853759765625, 0.9192352294921875, 0.984710693359375, 1.0501861572265625, 1.11566162109375, 1.1811370849609375, 1.246612548828125, 1.3120880126953125, 1.3775634765625, 1.4430389404296875, 1.508514404296875, 1.5739898681640625, 1.63946533203125, 1.7049407958984375, 1.770416259765625, 1.8358917236328125, 1.9013671875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 7.0, 7.0, 8.0, 4.0, 18.0, 19.0, 17.0, 11.0, 20.0, 22.0, 29.0, 37.0, 33.0, 31.0, 33.0, 35.0, 50.0, 41.0, 60.0, 32.0, 39.0, 35.0, 43.0, 40.0, 36.0, 43.0, 45.0, 26.0, 31.0, 30.0, 17.0, 25.0, 10.0, 16.0, 10.0, 6.0, 9.0, 6.0, 6.0, 4.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.955866813659668, -4.770491600036621, -4.585116863250732, -4.3997416496276855, -4.214366912841797, -4.02899169921875, -3.8436167240142822, -3.6582417488098145, -3.4728667736053467, -3.287491798400879, -3.102116823196411, -2.9167418479919434, -2.7313666343688965, -2.545991897583008, -2.360616683959961, -2.175241708755493, -1.9898667335510254, -1.8044917583465576, -1.6191167831420898, -1.4337416887283325, -1.2483667135238647, -1.062991738319397, -0.8776166439056396, -0.6922416687011719, -0.5068666934967041, -0.32149168848991394, -0.13611668348312378, 0.04925835132598877, 0.23463332653045654, 0.4200083017349243, 0.6053833961486816, 0.7907583713531494, 0.9761338233947754, 1.1615087985992432, 1.346883773803711, 1.5322588682174683, 1.717633843421936, 1.9030088186264038, 2.088383913040161, 2.273758888244629, 2.4591338634490967, 2.6445088386535645, 2.8298838138580322, 3.0152587890625, 3.200634002685547, 3.3860087394714355, 3.5713839530944824, 3.75675892829895, 3.942133903503418, 4.127509117126465, 4.3128838539123535, 4.4982590675354, 4.683633804321289, 4.869009017944336, 5.054384231567383, 5.2397589683532715, 5.42513370513916, 5.610508918762207, 5.795883655548096, 5.981258869171143, 6.166633605957031, 6.352008819580078, 6.537384033203125, 6.722758769989014, 6.9081339836120605]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 11.0, 6.0, 8.0, 14.0, 10.0, 12.0, 17.0, 14.0, 20.0, 16.0, 22.0, 32.0, 29.0, 25.0, 33.0, 44.0, 28.0, 48.0, 35.0, 35.0, 47.0, 35.0, 50.0, 30.0, 46.0, 28.0, 38.0, 27.0, 30.0, 34.0, 21.0, 23.0, 19.0, 15.0, 15.0, 14.0, 11.0, 9.0, 6.0, 6.0, 5.0, 5.0, 5.0, 0.0, 5.0, 5.0, 6.0, 1.0, 4.0, 1.0], "bins": [-6.0176568031311035, -5.845104217529297, -5.672552108764648, -5.499999523162842, -5.327446937561035, -5.154894828796387, -4.98234224319458, -4.809789657592773, -4.637237548828125, -4.464684963226318, -4.29213285446167, -4.119580268859863, -3.9470279216766357, -3.774475574493408, -3.6019229888916016, -3.429370641708374, -3.2568182945251465, -3.084265947341919, -2.9117136001586914, -2.7391610145568848, -2.5666086673736572, -2.3940563201904297, -2.221503734588623, -2.0489513874053955, -1.876399040222168, -1.7038466930389404, -1.5312942266464233, -1.3587417602539062, -1.1861894130706787, -1.0136370658874512, -0.8410845994949341, -0.668532133102417, -0.49597978591918945, -0.32342737913131714, -0.15087497234344482, 0.02167743444442749, 0.1942298412322998, 0.3667822480201721, 0.5393346548080444, 0.7118871212005615, 0.8844394683837891, 1.0569918155670166, 1.2295442819595337, 1.4020967483520508, 1.5746490955352783, 1.7472014427185059, 1.919753909111023, 2.09230637550354, 2.2648587226867676, 2.437411069869995, 2.6099634170532227, 2.7825160026550293, 2.955068349838257, 3.1276206970214844, 3.300173282623291, 3.4727256298065186, 3.645277976989746, 3.8178303241729736, 3.990382671356201, 4.162935256958008, 4.335487365722656, 4.508039951324463, 4.6805925369262695, 4.853144645690918, 5.025697231292725]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 9.0, 9.0, 25.0, 43.0, 57.0, 87.0, 191.0, 286.0, 440.0, 742.0, 1183.0, 1845.0, 2801.0, 4506.0, 6637.0, 9757.0, 14487.0, 20240.0, 27887.0, 37458.0, 48808.0, 61528.0, 73562.0, 84484.0, 91561.0, 93310.0, 90729.0, 81747.0, 70804.0, 58281.0, 46660.0, 35157.0, 26103.0, 18350.0, 13132.0, 8914.0, 5889.0, 3924.0, 2549.0, 1636.0, 1044.0, 669.0, 400.0, 252.0, 153.0, 97.0, 57.0, 29.0, 17.0, 11.0, 13.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.942718505859375, -1.87176513671875, -1.800811767578125, -1.7298583984375, -1.658905029296875, -1.58795166015625, -1.516998291015625, -1.446044921875, -1.375091552734375, -1.30413818359375, -1.233184814453125, -1.1622314453125, -1.091278076171875, -1.02032470703125, -0.949371337890625, -0.87841796875, -0.807464599609375, -0.73651123046875, -0.665557861328125, -0.5946044921875, -0.523651123046875, -0.45269775390625, -0.381744384765625, -0.310791015625, -0.239837646484375, -0.16888427734375, -0.097930908203125, -0.0269775390625, 0.043975830078125, 0.11492919921875, 0.185882568359375, 0.2568359375, 0.327789306640625, 0.39874267578125, 0.469696044921875, 0.5406494140625, 0.611602783203125, 0.68255615234375, 0.753509521484375, 0.824462890625, 0.895416259765625, 0.96636962890625, 1.037322998046875, 1.1082763671875, 1.179229736328125, 1.25018310546875, 1.321136474609375, 1.39208984375, 1.463043212890625, 1.53399658203125, 1.604949951171875, 1.6759033203125, 1.746856689453125, 1.81781005859375, 1.888763427734375, 1.959716796875, 2.030670166015625, 2.10162353515625, 2.172576904296875, 2.2435302734375, 2.314483642578125, 2.38543701171875, 2.456390380859375, 2.52734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 7.0, 9.0, 18.0, 13.0, 12.0, 19.0, 15.0, 13.0, 23.0, 22.0, 28.0, 37.0, 37.0, 29.0, 43.0, 40.0, 42.0, 40.0, 30.0, 39.0, 43.0, 46.0, 42.0, 35.0, 46.0, 40.0, 32.0, 22.0, 18.0, 24.0, 26.0, 17.0, 17.0, 16.0, 9.0, 8.0, 1.0, 4.0, 4.0, 5.0, 6.0, 3.0, 9.0, 0.0, 3.0, 2.0, 2.0, 2.0], "bins": [-5.8046875, -5.6390380859375, -5.473388671875, -5.3077392578125, -5.14208984375, -4.9764404296875, -4.810791015625, -4.6451416015625, -4.4794921875, -4.3138427734375, -4.148193359375, -3.9825439453125, -3.81689453125, -3.6512451171875, -3.485595703125, -3.3199462890625, -3.154296875, -2.9886474609375, -2.822998046875, -2.6573486328125, -2.49169921875, -2.3260498046875, -2.160400390625, -1.9947509765625, -1.8291015625, -1.6634521484375, -1.497802734375, -1.3321533203125, -1.16650390625, -1.0008544921875, -0.835205078125, -0.6695556640625, -0.50390625, -0.3382568359375, -0.172607421875, -0.0069580078125, 0.15869140625, 0.3243408203125, 0.489990234375, 0.6556396484375, 0.8212890625, 0.9869384765625, 1.152587890625, 1.3182373046875, 1.48388671875, 1.6495361328125, 1.815185546875, 1.9808349609375, 2.146484375, 2.3121337890625, 2.477783203125, 2.6434326171875, 2.80908203125, 2.9747314453125, 3.140380859375, 3.3060302734375, 3.4716796875, 3.6373291015625, 3.802978515625, 3.9686279296875, 4.13427734375, 4.2999267578125, 4.465576171875, 4.6312255859375, 4.796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 5.0, 5.0, 3.0, 6.0, 11.0, 14.0, 10.0, 12.0, 20.0, 25.0, 43.0, 42.0, 67.0, 97.0, 128.0, 189.0, 276.0, 406.0, 554.0, 897.0, 1262.0, 1888.0, 2840.0, 4097.0, 6073.0, 8964.0, 12939.0, 19818.0, 39984.0, 369479.0, 467618.0, 47250.0, 20936.0, 13536.0, 9395.0, 6392.0, 4261.0, 2831.0, 2002.0, 1341.0, 920.0, 595.0, 401.0, 272.0, 200.0, 129.0, 93.0, 70.0, 42.0, 23.0, 23.0, 24.0, 13.0, 7.0, 12.0, 10.0, 7.0, 3.0, 4.0, 1.0, 2.0], "bins": [-6.09765625, -5.9132080078125, -5.728759765625, -5.5443115234375, -5.35986328125, -5.1754150390625, -4.990966796875, -4.8065185546875, -4.6220703125, -4.4376220703125, -4.253173828125, -4.0687255859375, -3.88427734375, -3.6998291015625, -3.515380859375, -3.3309326171875, -3.146484375, -2.9620361328125, -2.777587890625, -2.5931396484375, -2.40869140625, -2.2242431640625, -2.039794921875, -1.8553466796875, -1.6708984375, -1.4864501953125, -1.302001953125, -1.1175537109375, -0.93310546875, -0.7486572265625, -0.564208984375, -0.3797607421875, -0.1953125, -0.0108642578125, 0.173583984375, 0.3580322265625, 0.54248046875, 0.7269287109375, 0.911376953125, 1.0958251953125, 1.2802734375, 1.4647216796875, 1.649169921875, 1.8336181640625, 2.01806640625, 2.2025146484375, 2.386962890625, 2.5714111328125, 2.755859375, 2.9403076171875, 3.124755859375, 3.3092041015625, 3.49365234375, 3.6781005859375, 3.862548828125, 4.0469970703125, 4.2314453125, 4.4158935546875, 4.600341796875, 4.7847900390625, 4.96923828125, 5.1536865234375, 5.338134765625, 5.5225830078125, 5.70703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 8.0, 13.0, 4.0, 9.0, 10.0, 13.0, 21.0, 26.0, 34.0, 20.0, 32.0, 32.0, 39.0, 36.0, 29.0, 35.0, 38.0, 41.0, 35.0, 56.0, 39.0, 46.0, 37.0, 29.0, 37.0, 25.0, 31.0, 29.0, 29.0, 18.0, 17.0, 20.0, 15.0, 11.0, 15.0, 6.0, 10.0, 8.0, 6.0, 6.0, 6.0, 6.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.609375, -5.43267822265625, -5.2559814453125, -5.07928466796875, -4.902587890625, -4.72589111328125, -4.5491943359375, -4.37249755859375, -4.19580078125, -4.01910400390625, -3.8424072265625, -3.66571044921875, -3.489013671875, -3.31231689453125, -3.1356201171875, -2.95892333984375, -2.7822265625, -2.60552978515625, -2.4288330078125, -2.25213623046875, -2.075439453125, -1.89874267578125, -1.7220458984375, -1.54534912109375, -1.36865234375, -1.19195556640625, -1.0152587890625, -0.83856201171875, -0.661865234375, -0.48516845703125, -0.3084716796875, -0.13177490234375, 0.044921875, 0.22161865234375, 0.3983154296875, 0.57501220703125, 0.751708984375, 0.92840576171875, 1.1051025390625, 1.28179931640625, 1.45849609375, 1.63519287109375, 1.8118896484375, 1.98858642578125, 2.165283203125, 2.34197998046875, 2.5186767578125, 2.69537353515625, 2.8720703125, 3.04876708984375, 3.2254638671875, 3.40216064453125, 3.578857421875, 3.75555419921875, 3.9322509765625, 4.10894775390625, 4.28564453125, 4.46234130859375, 4.6390380859375, 4.81573486328125, 4.992431640625, 5.16912841796875, 5.3458251953125, 5.52252197265625, 5.69921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 13.0, 33.0, 44.0, 60.0, 118.0, 217.0, 426.0, 800.0, 1670.0, 4525.0, 20376.0, 943439.0, 64395.0, 7673.0, 2475.0, 1072.0, 540.0, 286.0, 151.0, 86.0, 46.0, 34.0, 22.0, 9.0, 6.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9375, -15.5257568359375, -15.114013671875, -14.7022705078125, -14.29052734375, -13.8787841796875, -13.467041015625, -13.0552978515625, -12.6435546875, -12.2318115234375, -11.820068359375, -11.4083251953125, -10.99658203125, -10.5848388671875, -10.173095703125, -9.7613525390625, -9.349609375, -8.9378662109375, -8.526123046875, -8.1143798828125, -7.70263671875, -7.2908935546875, -6.879150390625, -6.4674072265625, -6.0556640625, -5.6439208984375, -5.232177734375, -4.8204345703125, -4.40869140625, -3.9969482421875, -3.585205078125, -3.1734619140625, -2.76171875, -2.3499755859375, -1.938232421875, -1.5264892578125, -1.11474609375, -0.7030029296875, -0.291259765625, 0.1204833984375, 0.5322265625, 0.9439697265625, 1.355712890625, 1.7674560546875, 2.17919921875, 2.5909423828125, 3.002685546875, 3.4144287109375, 3.826171875, 4.2379150390625, 4.649658203125, 5.0614013671875, 5.47314453125, 5.8848876953125, 6.296630859375, 6.7083740234375, 7.1201171875, 7.5318603515625, 7.943603515625, 8.3553466796875, 8.76708984375, 9.1788330078125, 9.590576171875, 10.0023193359375, 10.4140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 7.0, 11.0, 14.0, 22.0, 22.0, 38.0, 58.0, 122.0, 122.0, 147.0, 117.0, 85.0, 76.0, 36.0, 32.0, 14.0, 13.0, 8.0, 13.0, 9.0, 6.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0017156600952148438, -0.0016712695360183716, -0.0016268789768218994, -0.0015824884176254272, -0.001538097858428955, -0.001493707299232483, -0.0014493167400360107, -0.0014049261808395386, -0.0013605356216430664, -0.0013161450624465942, -0.001271754503250122, -0.00122736394405365, -0.0011829733848571777, -0.0011385828256607056, -0.0010941922664642334, -0.0010498017072677612, -0.001005411148071289, -0.0009610205888748169, -0.0009166300296783447, -0.0008722394704818726, -0.0008278489112854004, -0.0007834583520889282, -0.0007390677928924561, -0.0006946772336959839, -0.0006502866744995117, -0.0006058961153030396, -0.0005615055561065674, -0.0005171149969100952, -0.00047272443771362305, -0.0004283338785171509, -0.0003839433193206787, -0.00033955276012420654, -0.0002951622009277344, -0.0002507716417312622, -0.00020638108253479004, -0.00016199052333831787, -0.0001175999641418457, -7.320940494537354e-05, -2.8818845748901367e-05, 1.55717134475708e-05, 5.996227264404297e-05, 0.00010435283184051514, 0.0001487433910369873, 0.00019313395023345947, 0.00023752450942993164, 0.0002819150686264038, 0.000326305627822876, 0.00037069618701934814, 0.0004150867462158203, 0.0004594773054122925, 0.0005038678646087646, 0.0005482584238052368, 0.000592648983001709, 0.0006370395421981812, 0.0006814301013946533, 0.0007258206605911255, 0.0007702112197875977, 0.0008146017789840698, 0.000858992338180542, 0.0009033828973770142, 0.0009477734565734863, 0.0009921640157699585, 0.0010365545749664307, 0.0010809451341629028, 0.001125335693359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 8.0, 10.0, 22.0, 15.0, 28.0, 44.0, 60.0, 92.0, 101.0, 177.0, 241.0, 350.0, 498.0, 722.0, 1015.0, 1541.0, 2387.0, 3918.0, 6454.0, 11719.0, 23106.0, 60631.0, 286645.0, 480826.0, 99958.0, 31947.0, 14716.0, 7893.0, 4803.0, 2985.0, 1824.0, 1163.0, 776.0, 541.0, 367.0, 259.0, 209.0, 130.0, 117.0, 72.0, 44.0, 41.0, 31.0, 23.0, 8.0, 13.0, 8.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.69921875, -4.561767578125, -4.42431640625, -4.286865234375, -4.1494140625, -4.011962890625, -3.87451171875, -3.737060546875, -3.599609375, -3.462158203125, -3.32470703125, -3.187255859375, -3.0498046875, -2.912353515625, -2.77490234375, -2.637451171875, -2.5, -2.362548828125, -2.22509765625, -2.087646484375, -1.9501953125, -1.812744140625, -1.67529296875, -1.537841796875, -1.400390625, -1.262939453125, -1.12548828125, -0.988037109375, -0.8505859375, -0.713134765625, -0.57568359375, -0.438232421875, -0.30078125, -0.163330078125, -0.02587890625, 0.111572265625, 0.2490234375, 0.386474609375, 0.52392578125, 0.661376953125, 0.798828125, 0.936279296875, 1.07373046875, 1.211181640625, 1.3486328125, 1.486083984375, 1.62353515625, 1.760986328125, 1.8984375, 2.035888671875, 2.17333984375, 2.310791015625, 2.4482421875, 2.585693359375, 2.72314453125, 2.860595703125, 2.998046875, 3.135498046875, 3.27294921875, 3.410400390625, 3.5478515625, 3.685302734375, 3.82275390625, 3.960205078125, 4.09765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 9.0, 10.0, 15.0, 25.0, 28.0, 36.0, 40.0, 80.0, 102.0, 120.0, 120.0, 100.0, 75.0, 52.0, 40.0, 17.0, 17.0, 17.0, 9.0, 12.0, 10.0, 5.0, 6.0, 7.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96435546875, -0.9271469116210938, -0.8899383544921875, -0.8527297973632812, -0.815521240234375, -0.7783126831054688, -0.7411041259765625, -0.7038955688476562, -0.66668701171875, -0.6294784545898438, -0.5922698974609375, -0.5550613403320312, -0.517852783203125, -0.48064422607421875, -0.4434356689453125, -0.40622711181640625, -0.3690185546875, -0.33180999755859375, -0.2946014404296875, -0.25739288330078125, -0.220184326171875, -0.18297576904296875, -0.1457672119140625, -0.10855865478515625, -0.07135009765625, -0.03414154052734375, 0.0030670166015625, 0.04027557373046875, 0.077484130859375, 0.11469268798828125, 0.1519012451171875, 0.18910980224609375, 0.226318359375, 0.26352691650390625, 0.3007354736328125, 0.33794403076171875, 0.375152587890625, 0.41236114501953125, 0.4495697021484375, 0.48677825927734375, 0.52398681640625, 0.5611953735351562, 0.5984039306640625, 0.6356124877929688, 0.672821044921875, 0.7100296020507812, 0.7472381591796875, 0.7844467163085938, 0.8216552734375, 0.8588638305664062, 0.8960723876953125, 0.9332809448242188, 0.970489501953125, 1.0076980590820312, 1.0449066162109375, 1.0821151733398438, 1.11932373046875, 1.1565322875976562, 1.1937408447265625, 1.2309494018554688, 1.268157958984375, 1.3053665161132812, 1.3425750732421875, 1.3797836303710938, 1.4169921875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 9.0, 4.0, 8.0, 7.0, 10.0, 15.0, 23.0, 11.0, 25.0, 26.0, 36.0, 26.0, 36.0, 30.0, 38.0, 39.0, 54.0, 46.0, 43.0, 37.0, 41.0, 41.0, 44.0, 47.0, 43.0, 39.0, 29.0, 32.0, 22.0, 32.0, 24.0, 18.0, 16.0, 13.0, 4.0, 10.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.351984977722168, -6.155124664306641, -5.958264350891113, -5.761403560638428, -5.5645432472229, -5.367682933807373, -5.1708221435546875, -4.97396183013916, -4.777101516723633, -4.5802412033081055, -4.383380889892578, -4.186520099639893, -3.9896597862243652, -3.792799472808838, -3.5959389209747314, -3.399078369140625, -3.2022180557250977, -3.0053577423095703, -2.808497190475464, -2.6116366386413574, -2.41477632522583, -2.2179160118103027, -2.0210554599761963, -1.8241950273513794, -1.6273345947265625, -1.4304741621017456, -1.2336137294769287, -1.0367532968521118, -0.8398928642272949, -0.643032431602478, -0.44617199897766113, -0.24931156635284424, -0.05245161056518555, 0.14440882205963135, 0.34126925468444824, 0.5381296873092651, 0.734990119934082, 0.9318505525588989, 1.1287109851837158, 1.3255714178085327, 1.5224318504333496, 1.7192922830581665, 1.9161527156829834, 2.11301326751709, 2.309873580932617, 2.5067338943481445, 2.703594446182251, 2.9004549980163574, 3.0973153114318848, 3.294175624847412, 3.4910361766815186, 3.687896728515625, 3.8847570419311523, 4.08161735534668, 4.278477668762207, 4.475338459014893, 4.67219877243042, 4.869059085845947, 5.065919876098633, 5.26278018951416, 5.4596405029296875, 5.656500816345215, 5.853361129760742, 6.050221920013428, 6.247082233428955]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 7.0, 7.0, 4.0, 5.0, 7.0, 7.0, 6.0, 6.0, 12.0, 13.0, 23.0, 12.0, 24.0, 25.0, 25.0, 27.0, 27.0, 35.0, 51.0, 24.0, 36.0, 36.0, 39.0, 36.0, 41.0, 28.0, 28.0, 34.0, 36.0, 37.0, 35.0, 26.0, 26.0, 14.0, 18.0, 27.0, 12.0, 24.0, 20.0, 20.0, 14.0, 12.0, 10.0, 12.0, 6.0, 4.0, 6.0, 5.0, 2.0, 1.0, 7.0, 3.0, 2.0, 6.0, 2.0], "bins": [-5.437624931335449, -5.276076793670654, -5.114528656005859, -4.9529805183410645, -4.7914323806762695, -4.629883766174316, -4.4683356285095215, -4.306787490844727, -4.145239353179932, -3.9836912155151367, -3.822143077850342, -3.6605947017669678, -3.499046564102173, -3.337498426437378, -3.175950050354004, -3.014401912689209, -2.852853775024414, -2.691305637359619, -2.529757499694824, -2.36820912361145, -2.2066609859466553, -2.0451128482818604, -1.8835645914077759, -1.7220163345336914, -1.5604681968688965, -1.3989200592041016, -1.237371802330017, -1.0758235454559326, -0.9142754077911377, -0.752727210521698, -0.5911790132522583, -0.42963075637817383, -0.2680821418762207, -0.106533944606781, 0.05501425266265869, 0.2165624499320984, 0.3781106472015381, 0.5396588444709778, 0.7012070417404175, 0.862755298614502, 1.0243034362792969, 1.1858515739440918, 1.3473998308181763, 1.5089480876922607, 1.6704962253570557, 1.8320443630218506, 1.993592619895935, 2.1551408767700195, 2.3166890144348145, 2.4782371520996094, 2.6397852897644043, 2.8013336658477783, 2.9628818035125732, 3.124429941177368, 3.285978317260742, 3.447526454925537, 3.609074592590332, 3.770622730255127, 3.932170867919922, 4.093719005584717, 4.255267143249512, 4.416815757751465, 4.57836389541626, 4.739912033081055, 4.90146017074585]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 1.0, 7.0, 6.0, 26.0, 31.0, 51.0, 86.0, 130.0, 198.0, 310.0, 548.0, 890.0, 1336.0, 2218.0, 3644.0, 6185.0, 10261.0, 16826.0, 28001.0, 44789.0, 68342.0, 97259.0, 124415.0, 140054.0, 137215.0, 117232.0, 88172.0, 60218.0, 38897.0, 24320.0, 14878.0, 8595.0, 5260.0, 3316.0, 1851.0, 1083.0, 737.0, 420.0, 295.0, 162.0, 98.0, 56.0, 42.0, 26.0, 26.0, 12.0, 13.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.0, -4.843017578125, -4.68603515625, -4.529052734375, -4.3720703125, -4.215087890625, -4.05810546875, -3.901123046875, -3.744140625, -3.587158203125, -3.43017578125, -3.273193359375, -3.1162109375, -2.959228515625, -2.80224609375, -2.645263671875, -2.48828125, -2.331298828125, -2.17431640625, -2.017333984375, -1.8603515625, -1.703369140625, -1.54638671875, -1.389404296875, -1.232421875, -1.075439453125, -0.91845703125, -0.761474609375, -0.6044921875, -0.447509765625, -0.29052734375, -0.133544921875, 0.0234375, 0.180419921875, 0.33740234375, 0.494384765625, 0.6513671875, 0.808349609375, 0.96533203125, 1.122314453125, 1.279296875, 1.436279296875, 1.59326171875, 1.750244140625, 1.9072265625, 2.064208984375, 2.22119140625, 2.378173828125, 2.53515625, 2.692138671875, 2.84912109375, 3.006103515625, 3.1630859375, 3.320068359375, 3.47705078125, 3.634033203125, 3.791015625, 3.947998046875, 4.10498046875, 4.261962890625, 4.4189453125, 4.575927734375, 4.73291015625, 4.889892578125, 5.046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 5.0, 6.0, 17.0, 10.0, 12.0, 18.0, 14.0, 28.0, 29.0, 18.0, 27.0, 25.0, 42.0, 38.0, 35.0, 39.0, 46.0, 37.0, 39.0, 31.0, 38.0, 47.0, 35.0, 31.0, 26.0, 28.0, 28.0, 26.0, 29.0, 17.0, 19.0, 23.0, 21.0, 15.0, 20.0, 7.0, 9.0, 9.0, 4.0, 10.0, 7.0, 5.0, 5.0, 4.0, 0.0, 4.0, 2.0, 2.0], "bins": [-6.0078125, -5.83563232421875, -5.6634521484375, -5.49127197265625, -5.319091796875, -5.14691162109375, -4.9747314453125, -4.80255126953125, -4.63037109375, -4.45819091796875, -4.2860107421875, -4.11383056640625, -3.941650390625, -3.76947021484375, -3.5972900390625, -3.42510986328125, -3.2529296875, -3.08074951171875, -2.9085693359375, -2.73638916015625, -2.564208984375, -2.39202880859375, -2.2198486328125, -2.04766845703125, -1.87548828125, -1.70330810546875, -1.5311279296875, -1.35894775390625, -1.186767578125, -1.01458740234375, -0.8424072265625, -0.67022705078125, -0.498046875, -0.32586669921875, -0.1536865234375, 0.01849365234375, 0.190673828125, 0.36285400390625, 0.5350341796875, 0.70721435546875, 0.87939453125, 1.05157470703125, 1.2237548828125, 1.39593505859375, 1.568115234375, 1.74029541015625, 1.9124755859375, 2.08465576171875, 2.2568359375, 2.42901611328125, 2.6011962890625, 2.77337646484375, 2.945556640625, 3.11773681640625, 3.2899169921875, 3.46209716796875, 3.63427734375, 3.80645751953125, 3.9786376953125, 4.15081787109375, 4.322998046875, 4.49517822265625, 4.6673583984375, 4.83953857421875, 5.01171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 10.0, 8.0, 23.0, 26.0, 43.0, 73.0, 96.0, 148.0, 268.0, 392.0, 660.0, 1060.0, 1868.0, 3069.0, 4908.0, 8300.0, 14625.0, 24618.0, 41550.0, 68412.0, 107117.0, 147342.0, 168029.0, 153805.0, 114628.0, 75096.0, 45625.0, 27239.0, 16192.0, 9416.0, 5586.0, 3256.0, 1963.0, 1172.0, 750.0, 429.0, 286.0, 182.0, 119.0, 75.0, 31.0, 30.0, 14.0, 5.0, 7.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-9.0625, -8.800537109375, -8.53857421875, -8.276611328125, -8.0146484375, -7.752685546875, -7.49072265625, -7.228759765625, -6.966796875, -6.704833984375, -6.44287109375, -6.180908203125, -5.9189453125, -5.656982421875, -5.39501953125, -5.133056640625, -4.87109375, -4.609130859375, -4.34716796875, -4.085205078125, -3.8232421875, -3.561279296875, -3.29931640625, -3.037353515625, -2.775390625, -2.513427734375, -2.25146484375, -1.989501953125, -1.7275390625, -1.465576171875, -1.20361328125, -0.941650390625, -0.6796875, -0.417724609375, -0.15576171875, 0.106201171875, 0.3681640625, 0.630126953125, 0.89208984375, 1.154052734375, 1.416015625, 1.677978515625, 1.93994140625, 2.201904296875, 2.4638671875, 2.725830078125, 2.98779296875, 3.249755859375, 3.51171875, 3.773681640625, 4.03564453125, 4.297607421875, 4.5595703125, 4.821533203125, 5.08349609375, 5.345458984375, 5.607421875, 5.869384765625, 6.13134765625, 6.393310546875, 6.6552734375, 6.917236328125, 7.17919921875, 7.441162109375, 7.703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 4.0, 8.0, 3.0, 9.0, 11.0, 15.0, 13.0, 17.0, 21.0, 18.0, 26.0, 29.0, 28.0, 40.0, 24.0, 51.0, 38.0, 54.0, 36.0, 36.0, 47.0, 42.0, 52.0, 44.0, 37.0, 39.0, 33.0, 42.0, 38.0, 26.0, 12.0, 18.0, 20.0, 16.0, 12.0, 9.0, 6.0, 8.0, 8.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03515625, -4.8785400390625, -4.721923828125, -4.5653076171875, -4.40869140625, -4.2520751953125, -4.095458984375, -3.9388427734375, -3.7822265625, -3.6256103515625, -3.468994140625, -3.3123779296875, -3.15576171875, -2.9991455078125, -2.842529296875, -2.6859130859375, -2.529296875, -2.3726806640625, -2.216064453125, -2.0594482421875, -1.90283203125, -1.7462158203125, -1.589599609375, -1.4329833984375, -1.2763671875, -1.1197509765625, -0.963134765625, -0.8065185546875, -0.64990234375, -0.4932861328125, -0.336669921875, -0.1800537109375, -0.0234375, 0.1331787109375, 0.289794921875, 0.4464111328125, 0.60302734375, 0.7596435546875, 0.916259765625, 1.0728759765625, 1.2294921875, 1.3861083984375, 1.542724609375, 1.6993408203125, 1.85595703125, 2.0125732421875, 2.169189453125, 2.3258056640625, 2.482421875, 2.6390380859375, 2.795654296875, 2.9522705078125, 3.10888671875, 3.2655029296875, 3.422119140625, 3.5787353515625, 3.7353515625, 3.8919677734375, 4.048583984375, 4.2052001953125, 4.36181640625, 4.5184326171875, 4.675048828125, 4.8316650390625, 4.98828125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 13.0, 12.0, 19.0, 27.0, 33.0, 50.0, 87.0, 87.0, 118.0, 177.0, 239.0, 379.0, 534.0, 814.0, 1162.0, 1789.0, 2818.0, 4463.0, 7472.0, 13345.0, 26568.0, 67902.0, 243261.0, 421898.0, 158119.0, 47976.0, 20820.0, 10784.0, 6338.0, 3910.0, 2440.0, 1547.0, 1006.0, 694.0, 498.0, 323.0, 215.0, 173.0, 124.0, 83.0, 62.0, 44.0, 31.0, 28.0, 14.0, 10.0, 14.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 4.0], "bins": [-8.7734375, -8.51025390625, -8.2470703125, -7.98388671875, -7.720703125, -7.45751953125, -7.1943359375, -6.93115234375, -6.66796875, -6.40478515625, -6.1416015625, -5.87841796875, -5.615234375, -5.35205078125, -5.0888671875, -4.82568359375, -4.5625, -4.29931640625, -4.0361328125, -3.77294921875, -3.509765625, -3.24658203125, -2.9833984375, -2.72021484375, -2.45703125, -2.19384765625, -1.9306640625, -1.66748046875, -1.404296875, -1.14111328125, -0.8779296875, -0.61474609375, -0.3515625, -0.08837890625, 0.1748046875, 0.43798828125, 0.701171875, 0.96435546875, 1.2275390625, 1.49072265625, 1.75390625, 2.01708984375, 2.2802734375, 2.54345703125, 2.806640625, 3.06982421875, 3.3330078125, 3.59619140625, 3.859375, 4.12255859375, 4.3857421875, 4.64892578125, 4.912109375, 5.17529296875, 5.4384765625, 5.70166015625, 5.96484375, 6.22802734375, 6.4912109375, 6.75439453125, 7.017578125, 7.28076171875, 7.5439453125, 7.80712890625, 8.0703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 4.0, 5.0, 10.0, 6.0, 19.0, 22.0, 36.0, 69.0, 91.0, 155.0, 174.0, 139.0, 91.0, 46.0, 33.0, 16.0, 16.0, 14.0, 11.0, 5.0, 7.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0011434555053710938, -0.0011129677295684814, -0.0010824799537658691, -0.0010519921779632568, -0.0010215044021606445, -0.0009910166263580322, -0.0009605288505554199, -0.0009300410747528076, -0.0008995532989501953, -0.000869065523147583, -0.0008385777473449707, -0.0008080899715423584, -0.0007776021957397461, -0.0007471144199371338, -0.0007166266441345215, -0.0006861388683319092, -0.0006556510925292969, -0.0006251633167266846, -0.0005946755409240723, -0.00056418776512146, -0.0005336999893188477, -0.0005032122135162354, -0.00047272443771362305, -0.00044223666191101074, -0.00041174888610839844, -0.00038126111030578613, -0.00035077333450317383, -0.0003202855587005615, -0.0002897977828979492, -0.0002593100070953369, -0.0002288222312927246, -0.0001983344554901123, -0.0001678466796875, -0.0001373589038848877, -0.00010687112808227539, -7.638335227966309e-05, -4.589557647705078e-05, -1.5407800674438477e-05, 1.5079975128173828e-05, 4.556775093078613e-05, 7.605552673339844e-05, 0.00010654330253601074, 0.00013703107833862305, 0.00016751885414123535, 0.00019800662994384766, 0.00022849440574645996, 0.00025898218154907227, 0.00028946995735168457, 0.0003199577331542969, 0.0003504455089569092, 0.0003809332847595215, 0.0004114210605621338, 0.0004419088363647461, 0.0004723966121673584, 0.0005028843879699707, 0.000533372163772583, 0.0005638599395751953, 0.0005943477153778076, 0.0006248354911804199, 0.0006553232669830322, 0.0006858110427856445, 0.0007162988185882568, 0.0007467865943908691, 0.0007772743701934814, 0.0008077621459960938]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 10.0, 13.0, 19.0, 22.0, 33.0, 50.0, 74.0, 88.0, 129.0, 164.0, 290.0, 390.0, 568.0, 844.0, 1322.0, 1949.0, 3215.0, 5364.0, 9273.0, 17912.0, 39638.0, 99359.0, 240752.0, 319533.0, 176982.0, 67929.0, 28999.0, 13993.0, 7404.0, 4371.0, 2766.0, 1644.0, 1076.0, 733.0, 474.0, 340.0, 256.0, 162.0, 120.0, 84.0, 61.0, 43.0, 30.0, 17.0, 12.0, 18.0, 6.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-5.38671875, -5.208984375, -5.03125, -4.853515625, -4.67578125, -4.498046875, -4.3203125, -4.142578125, -3.96484375, -3.787109375, -3.609375, -3.431640625, -3.25390625, -3.076171875, -2.8984375, -2.720703125, -2.54296875, -2.365234375, -2.1875, -2.009765625, -1.83203125, -1.654296875, -1.4765625, -1.298828125, -1.12109375, -0.943359375, -0.765625, -0.587890625, -0.41015625, -0.232421875, -0.0546875, 0.123046875, 0.30078125, 0.478515625, 0.65625, 0.833984375, 1.01171875, 1.189453125, 1.3671875, 1.544921875, 1.72265625, 1.900390625, 2.078125, 2.255859375, 2.43359375, 2.611328125, 2.7890625, 2.966796875, 3.14453125, 3.322265625, 3.5, 3.677734375, 3.85546875, 4.033203125, 4.2109375, 4.388671875, 4.56640625, 4.744140625, 4.921875, 5.099609375, 5.27734375, 5.455078125, 5.6328125, 5.810546875, 5.98828125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 7.0, 5.0, 13.0, 14.0, 23.0, 26.0, 36.0, 47.0, 62.0, 61.0, 66.0, 89.0, 84.0, 78.0, 58.0, 74.0, 55.0, 46.0, 33.0, 24.0, 22.0, 10.0, 13.0, 12.0, 8.0, 4.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.302734375, -2.2447967529296875, -2.186859130859375, -2.1289215087890625, -2.07098388671875, -2.0130462646484375, -1.955108642578125, -1.8971710205078125, -1.8392333984375, -1.7812957763671875, -1.723358154296875, -1.6654205322265625, -1.60748291015625, -1.5495452880859375, -1.491607666015625, -1.4336700439453125, -1.375732421875, -1.3177947998046875, -1.259857177734375, -1.2019195556640625, -1.14398193359375, -1.0860443115234375, -1.028106689453125, -0.9701690673828125, -0.9122314453125, -0.8542938232421875, -0.796356201171875, -0.7384185791015625, -0.68048095703125, -0.6225433349609375, -0.564605712890625, -0.5066680908203125, -0.44873046875, -0.3907928466796875, -0.332855224609375, -0.2749176025390625, -0.21697998046875, -0.1590423583984375, -0.101104736328125, -0.0431671142578125, 0.0147705078125, 0.0727081298828125, 0.130645751953125, 0.1885833740234375, 0.24652099609375, 0.3044586181640625, 0.362396240234375, 0.4203338623046875, 0.478271484375, 0.5362091064453125, 0.594146728515625, 0.6520843505859375, 0.71002197265625, 0.7679595947265625, 0.825897216796875, 0.8838348388671875, 0.9417724609375, 0.9997100830078125, 1.057647705078125, 1.1155853271484375, 1.17352294921875, 1.2314605712890625, 1.289398193359375, 1.3473358154296875, 1.4052734375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 8.0, 8.0, 14.0, 10.0, 19.0, 17.0, 21.0, 26.0, 28.0, 37.0, 33.0, 42.0, 45.0, 36.0, 42.0, 42.0, 58.0, 50.0, 43.0, 52.0, 52.0, 34.0, 41.0, 31.0, 36.0, 28.0, 31.0, 17.0, 11.0, 13.0, 15.0, 9.0, 12.0, 6.0, 9.0, 9.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.519323348999023, -6.3072052001953125, -6.095086574554443, -5.882968425750732, -5.6708502769470215, -5.458731651306152, -5.246613502502441, -5.0344953536987305, -4.8223772048950195, -4.610259056091309, -4.3981404304504395, -4.1860222816467285, -3.9739041328430176, -3.7617857456207275, -3.5496673583984375, -3.3375492095947266, -3.1254305839538574, -2.9133121967315674, -2.7011940479278564, -2.4890756607055664, -2.2769575119018555, -2.0648391246795654, -1.8527207374572754, -1.640602469444275, -1.4284842014312744, -1.216365933418274, -1.0042476654052734, -0.7921292781829834, -0.5800110101699829, -0.3678927421569824, -0.15577435493469238, 0.056343913078308105, 0.2684621810913086, 0.48058047890663147, 0.6926987767219543, 0.9048171043395996, 1.1169353723526, 1.3290536403656006, 1.5411720275878906, 1.7532902956008911, 1.9654085636138916, 2.1775269508361816, 2.3896450996398926, 2.6017634868621826, 2.8138818740844727, 3.0260000228881836, 3.2381184101104736, 3.4502367973327637, 3.6623549461364746, 3.8744733333587646, 4.086591720581055, 4.298709869384766, 4.510828018188477, 4.7229461669921875, 4.935064792633057, 5.147182941436768, 5.359301567077637, 5.571419715881348, 5.783538341522217, 5.995656490325928, 6.207774639129639, 6.419893264770508, 6.632011413574219, 6.84412956237793, 7.056247711181641]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 4.0, 9.0, 3.0, 13.0, 7.0, 8.0, 18.0, 12.0, 23.0, 16.0, 15.0, 32.0, 30.0, 27.0, 30.0, 41.0, 49.0, 32.0, 40.0, 33.0, 33.0, 42.0, 51.0, 48.0, 40.0, 35.0, 28.0, 41.0, 35.0, 19.0, 23.0, 31.0, 20.0, 19.0, 20.0, 6.0, 11.0, 6.0, 9.0, 6.0, 6.0, 7.0, 6.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4632439613342285, -5.275616645812988, -5.087989807128906, -4.900362491607666, -4.712735176086426, -4.525108337402344, -4.3374810218811035, -4.149853706359863, -3.962226629257202, -3.774599552154541, -3.586972236633301, -3.3993451595306396, -3.2117180824279785, -3.0240907669067383, -2.836463689804077, -2.648836612701416, -2.461209297180176, -2.2735822200775146, -2.0859549045562744, -1.8983278274536133, -1.7107006311416626, -1.523073434829712, -1.3354463577270508, -1.1478191614151, -0.9601919651031494, -0.7725647687911987, -0.5849376320838928, -0.3973104953765869, -0.20968329906463623, -0.022056102752685547, 0.16557097434997559, 0.35319817066192627, 0.5408258438110352, 0.7284530401229858, 0.9160801768302917, 1.1037073135375977, 1.2913345098495483, 1.478961706161499, 1.6665887832641602, 1.8542159795761108, 2.0418431758880615, 2.2294702529907227, 2.417097568511963, 2.604724645614624, 2.792351722717285, 2.9799790382385254, 3.1676061153411865, 3.3552331924438477, 3.542860507965088, 3.730487585067749, 3.9181149005889893, 4.10574197769165, 4.293369293212891, 4.480996131896973, 4.668623447418213, 4.856250762939453, 5.043877601623535, 5.231504917144775, 5.419131755828857, 5.606759071350098, 5.794386386871338, 5.982013702392578, 6.16964054107666, 6.3572678565979, 6.544895172119141]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 10.0, 23.0, 30.0, 47.0, 79.0, 131.0, 172.0, 364.0, 632.0, 1120.0, 1975.0, 3708.0, 7297.0, 15684.0, 35592.0, 86011.0, 211771.0, 484609.0, 878914.0, 1046745.0, 760591.0, 380820.0, 159380.0, 64558.0, 27436.0, 12655.0, 6211.0, 3208.0, 1793.0, 1032.0, 577.0, 382.0, 247.0, 162.0, 103.0, 63.0, 38.0, 36.0, 25.0, 17.0, 12.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.0078125, -6.76904296875, -6.5302734375, -6.29150390625, -6.052734375, -5.81396484375, -5.5751953125, -5.33642578125, -5.09765625, -4.85888671875, -4.6201171875, -4.38134765625, -4.142578125, -3.90380859375, -3.6650390625, -3.42626953125, -3.1875, -2.94873046875, -2.7099609375, -2.47119140625, -2.232421875, -1.99365234375, -1.7548828125, -1.51611328125, -1.27734375, -1.03857421875, -0.7998046875, -0.56103515625, -0.322265625, -0.08349609375, 0.1552734375, 0.39404296875, 0.6328125, 0.87158203125, 1.1103515625, 1.34912109375, 1.587890625, 1.82666015625, 2.0654296875, 2.30419921875, 2.54296875, 2.78173828125, 3.0205078125, 3.25927734375, 3.498046875, 3.73681640625, 3.9755859375, 4.21435546875, 4.453125, 4.69189453125, 4.9306640625, 5.16943359375, 5.408203125, 5.64697265625, 5.8857421875, 6.12451171875, 6.36328125, 6.60205078125, 6.8408203125, 7.07958984375, 7.318359375, 7.55712890625, 7.7958984375, 8.03466796875, 8.2734375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 6.0, 9.0, 7.0, 6.0, 8.0, 9.0, 18.0, 14.0, 16.0, 18.0, 23.0, 22.0, 30.0, 33.0, 36.0, 34.0, 38.0, 38.0, 40.0, 38.0, 51.0, 52.0, 44.0, 48.0, 35.0, 37.0, 38.0, 30.0, 26.0, 26.0, 24.0, 21.0, 12.0, 27.0, 14.0, 12.0, 11.0, 10.0, 7.0, 10.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.1015625, -4.93621826171875, -4.7708740234375, -4.60552978515625, -4.440185546875, -4.27484130859375, -4.1094970703125, -3.94415283203125, -3.77880859375, -3.61346435546875, -3.4481201171875, -3.28277587890625, -3.117431640625, -2.95208740234375, -2.7867431640625, -2.62139892578125, -2.4560546875, -2.29071044921875, -2.1253662109375, -1.96002197265625, -1.794677734375, -1.62933349609375, -1.4639892578125, -1.29864501953125, -1.13330078125, -0.96795654296875, -0.8026123046875, -0.63726806640625, -0.471923828125, -0.30657958984375, -0.1412353515625, 0.02410888671875, 0.189453125, 0.35479736328125, 0.5201416015625, 0.68548583984375, 0.850830078125, 1.01617431640625, 1.1815185546875, 1.34686279296875, 1.51220703125, 1.67755126953125, 1.8428955078125, 2.00823974609375, 2.173583984375, 2.33892822265625, 2.5042724609375, 2.66961669921875, 2.8349609375, 3.00030517578125, 3.1656494140625, 3.33099365234375, 3.496337890625, 3.66168212890625, 3.8270263671875, 3.99237060546875, 4.15771484375, 4.32305908203125, 4.4884033203125, 4.65374755859375, 4.819091796875, 4.98443603515625, 5.1497802734375, 5.31512451171875, 5.48046875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 12.0, 10.0, 15.0, 24.0, 51.0, 75.0, 101.0, 149.0, 217.0, 355.0, 553.0, 870.0, 1431.0, 2412.0, 4025.0, 7435.0, 13958.0, 27174.0, 54788.0, 112340.0, 233917.0, 455186.0, 754665.0, 912936.0, 734617.0, 437594.0, 222580.0, 107962.0, 52368.0, 25949.0, 13256.0, 7156.0, 3963.0, 2352.0, 1372.0, 863.0, 537.0, 341.0, 175.0, 150.0, 90.0, 72.0, 50.0, 34.0, 33.0, 19.0, 18.0, 5.0, 11.0, 4.0, 3.0, 5.0], "bins": [-8.75, -8.5032958984375, -8.256591796875, -8.0098876953125, -7.76318359375, -7.5164794921875, -7.269775390625, -7.0230712890625, -6.7763671875, -6.5296630859375, -6.282958984375, -6.0362548828125, -5.78955078125, -5.5428466796875, -5.296142578125, -5.0494384765625, -4.802734375, -4.5560302734375, -4.309326171875, -4.0626220703125, -3.81591796875, -3.5692138671875, -3.322509765625, -3.0758056640625, -2.8291015625, -2.5823974609375, -2.335693359375, -2.0889892578125, -1.84228515625, -1.5955810546875, -1.348876953125, -1.1021728515625, -0.85546875, -0.6087646484375, -0.362060546875, -0.1153564453125, 0.13134765625, 0.3780517578125, 0.624755859375, 0.8714599609375, 1.1181640625, 1.3648681640625, 1.611572265625, 1.8582763671875, 2.10498046875, 2.3516845703125, 2.598388671875, 2.8450927734375, 3.091796875, 3.3385009765625, 3.585205078125, 3.8319091796875, 4.07861328125, 4.3253173828125, 4.572021484375, 4.8187255859375, 5.0654296875, 5.3121337890625, 5.558837890625, 5.8055419921875, 6.05224609375, 6.2989501953125, 6.545654296875, 6.7923583984375, 7.0390625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 7.0, 11.0, 10.0, 16.0, 16.0, 23.0, 41.0, 52.0, 54.0, 66.0, 90.0, 95.0, 134.0, 132.0, 219.0, 218.0, 238.0, 231.0, 289.0, 281.0, 254.0, 230.0, 226.0, 191.0, 177.0, 156.0, 117.0, 101.0, 97.0, 73.0, 66.0, 33.0, 25.0, 20.0, 20.0, 19.0, 10.0, 6.0, 9.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.509765625, -2.42718505859375, -2.3446044921875, -2.26202392578125, -2.179443359375, -2.09686279296875, -2.0142822265625, -1.93170166015625, -1.84912109375, -1.76654052734375, -1.6839599609375, -1.60137939453125, -1.518798828125, -1.43621826171875, -1.3536376953125, -1.27105712890625, -1.1884765625, -1.10589599609375, -1.0233154296875, -0.94073486328125, -0.858154296875, -0.77557373046875, -0.6929931640625, -0.61041259765625, -0.52783203125, -0.44525146484375, -0.3626708984375, -0.28009033203125, -0.197509765625, -0.11492919921875, -0.0323486328125, 0.05023193359375, 0.1328125, 0.21539306640625, 0.2979736328125, 0.38055419921875, 0.463134765625, 0.54571533203125, 0.6282958984375, 0.71087646484375, 0.79345703125, 0.87603759765625, 0.9586181640625, 1.04119873046875, 1.123779296875, 1.20635986328125, 1.2889404296875, 1.37152099609375, 1.4541015625, 1.53668212890625, 1.6192626953125, 1.70184326171875, 1.784423828125, 1.86700439453125, 1.9495849609375, 2.03216552734375, 2.11474609375, 2.19732666015625, 2.2799072265625, 2.36248779296875, 2.445068359375, 2.52764892578125, 2.6102294921875, 2.69281005859375, 2.775390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 2.0, 10.0, 8.0, 14.0, 14.0, 10.0, 6.0, 17.0, 26.0, 24.0, 28.0, 27.0, 22.0, 52.0, 31.0, 39.0, 49.0, 41.0, 39.0, 42.0, 33.0, 44.0, 42.0, 40.0, 43.0, 32.0, 39.0, 38.0, 26.0, 27.0, 28.0, 15.0, 20.0, 15.0, 5.0, 8.0, 7.0, 9.0, 2.0, 4.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.964357852935791, -5.780377388000488, -5.596397399902344, -5.412416934967041, -5.2284369468688965, -5.044456481933594, -4.860476493835449, -4.6764960289001465, -4.492516040802002, -4.308535575866699, -4.124555587768555, -3.940575361251831, -3.7565951347351074, -3.572614908218384, -3.38863468170166, -3.2046542167663574, -3.020673990249634, -2.83669376373291, -2.6527135372161865, -2.468733310699463, -2.2847530841827393, -2.1007728576660156, -1.9167925119400024, -1.7328122854232788, -1.5488320589065552, -1.3648518323898315, -1.180871605873108, -0.9968913197517395, -0.8129110932350159, -0.6289308667182922, -0.44495058059692383, -0.2609703540802002, -0.07699012756347656, 0.10699011385440826, 0.2909703552722931, 0.4749506115913391, 0.6589308381080627, 0.8429110646247864, 1.0268913507461548, 1.2108715772628784, 1.394851803779602, 1.5788320302963257, 1.7628122568130493, 1.9467926025390625, 2.130772829055786, 2.3147530555725098, 2.4987332820892334, 2.682713508605957, 2.8666937351226807, 3.0506739616394043, 3.234654188156128, 3.4186344146728516, 3.602614641189575, 3.786594867706299, 3.9705753326416016, 4.154555320739746, 4.338535785675049, 4.522516250610352, 4.706496238708496, 4.890476703643799, 5.074456691741943, 5.258437156677246, 5.442417144775391, 5.626397609710693, 5.810377597808838]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 5.0, 8.0, 9.0, 13.0, 10.0, 19.0, 23.0, 17.0, 24.0, 24.0, 22.0, 24.0, 41.0, 40.0, 35.0, 42.0, 44.0, 46.0, 40.0, 37.0, 46.0, 35.0, 35.0, 36.0, 40.0, 36.0, 27.0, 24.0, 21.0, 21.0, 23.0, 21.0, 14.0, 12.0, 13.0, 7.0, 11.0, 8.0, 4.0, 7.0, 6.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.498565196990967, -5.316170692443848, -5.133776664733887, -4.951382160186768, -4.768988132476807, -4.5865936279296875, -4.404199600219727, -4.221805095672607, -4.039410591125488, -3.8570163249969482, -3.674622058868408, -3.492227554321289, -3.309833526611328, -3.127439022064209, -2.945044755935669, -2.762650489807129, -2.580256462097168, -2.397862195968628, -2.215467929840088, -2.0330734252929688, -1.8506792783737183, -1.6682850122451782, -1.4858906269073486, -1.3034963607788086, -1.1211020946502686, -0.9387078285217285, -0.7563135027885437, -0.5739191770553589, -0.39152491092681885, -0.2091306447982788, -0.02673625946044922, 0.15565800666809082, 0.33805179595947266, 0.5204460620880127, 0.7028403878211975, 0.8852347135543823, 1.0676289796829224, 1.2500232458114624, 1.432417631149292, 1.614811897277832, 1.797206163406372, 1.979600429534912, 2.161994695663452, 2.344388961791992, 2.5267834663391113, 2.7091774940490723, 2.8915719985961914, 3.0739662647247314, 3.2563605308532715, 3.4387547969818115, 3.6211490631103516, 3.8035435676574707, 3.9859375953674316, 4.168332099914551, 4.350726127624512, 4.533120632171631, 4.71551513671875, 4.897909641265869, 5.08030366897583, 5.262698173522949, 5.44509220123291, 5.627486705780029, 5.809881210327148, 5.992275238037109, 6.17466926574707]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 17.0, 22.0, 34.0, 41.0, 67.0, 108.0, 211.0, 299.0, 532.0, 844.0, 1254.0, 2070.0, 3353.0, 5260.0, 8268.0, 12754.0, 18828.0, 27663.0, 38879.0, 53296.0, 69065.0, 84289.0, 97228.0, 104195.0, 104053.0, 96193.0, 83286.0, 67638.0, 52147.0, 37929.0, 26686.0, 18492.0, 11955.0, 8047.0, 5023.0, 3223.0, 1949.0, 1289.0, 750.0, 507.0, 291.0, 192.0, 131.0, 71.0, 52.0, 27.0, 23.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.521484375, -2.440032958984375, -2.35858154296875, -2.277130126953125, -2.1956787109375, -2.114227294921875, -2.03277587890625, -1.951324462890625, -1.869873046875, -1.788421630859375, -1.70697021484375, -1.625518798828125, -1.5440673828125, -1.462615966796875, -1.38116455078125, -1.299713134765625, -1.21826171875, -1.136810302734375, -1.05535888671875, -0.973907470703125, -0.8924560546875, -0.811004638671875, -0.72955322265625, -0.648101806640625, -0.566650390625, -0.485198974609375, -0.40374755859375, -0.322296142578125, -0.2408447265625, -0.159393310546875, -0.07794189453125, 0.003509521484375, 0.0849609375, 0.166412353515625, 0.24786376953125, 0.329315185546875, 0.4107666015625, 0.492218017578125, 0.57366943359375, 0.655120849609375, 0.736572265625, 0.818023681640625, 0.89947509765625, 0.980926513671875, 1.0623779296875, 1.143829345703125, 1.22528076171875, 1.306732177734375, 1.38818359375, 1.469635009765625, 1.55108642578125, 1.632537841796875, 1.7139892578125, 1.795440673828125, 1.87689208984375, 1.958343505859375, 2.039794921875, 2.121246337890625, 2.20269775390625, 2.284149169921875, 2.3656005859375, 2.447052001953125, 2.52850341796875, 2.609954833984375, 2.69140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 9.0, 6.0, 7.0, 8.0, 14.0, 10.0, 14.0, 11.0, 20.0, 20.0, 19.0, 19.0, 25.0, 30.0, 27.0, 41.0, 44.0, 41.0, 34.0, 35.0, 40.0, 34.0, 48.0, 60.0, 44.0, 35.0, 29.0, 29.0, 33.0, 27.0, 21.0, 21.0, 18.0, 18.0, 18.0, 14.0, 16.0, 13.0, 8.0, 3.0, 5.0, 1.0, 8.0, 7.0, 2.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.765625, -4.597412109375, -4.42919921875, -4.260986328125, -4.0927734375, -3.924560546875, -3.75634765625, -3.588134765625, -3.419921875, -3.251708984375, -3.08349609375, -2.915283203125, -2.7470703125, -2.578857421875, -2.41064453125, -2.242431640625, -2.07421875, -1.906005859375, -1.73779296875, -1.569580078125, -1.4013671875, -1.233154296875, -1.06494140625, -0.896728515625, -0.728515625, -0.560302734375, -0.39208984375, -0.223876953125, -0.0556640625, 0.112548828125, 0.28076171875, 0.448974609375, 0.6171875, 0.785400390625, 0.95361328125, 1.121826171875, 1.2900390625, 1.458251953125, 1.62646484375, 1.794677734375, 1.962890625, 2.131103515625, 2.29931640625, 2.467529296875, 2.6357421875, 2.803955078125, 2.97216796875, 3.140380859375, 3.30859375, 3.476806640625, 3.64501953125, 3.813232421875, 3.9814453125, 4.149658203125, 4.31787109375, 4.486083984375, 4.654296875, 4.822509765625, 4.99072265625, 5.158935546875, 5.3271484375, 5.495361328125, 5.66357421875, 5.831787109375, 6.0]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 5.0, 14.0, 6.0, 21.0, 35.0, 50.0, 61.0, 90.0, 160.0, 204.0, 383.0, 618.0, 981.0, 1642.0, 2846.0, 4768.0, 8086.0, 13596.0, 23491.0, 59603.0, 729813.0, 134632.0, 27816.0, 16103.0, 9545.0, 5570.0, 3318.0, 2033.0, 1182.0, 747.0, 391.0, 268.0, 162.0, 97.0, 69.0, 38.0, 35.0, 22.0, 16.0, 9.0, 9.0, 7.0, 1.0, 6.0, 0.0, 3.0, 3.0, 2.0], "bins": [-10.671875, -10.38067626953125, -10.0894775390625, -9.79827880859375, -9.507080078125, -9.21588134765625, -8.9246826171875, -8.63348388671875, -8.34228515625, -8.05108642578125, -7.7598876953125, -7.46868896484375, -7.177490234375, -6.88629150390625, -6.5950927734375, -6.30389404296875, -6.0126953125, -5.72149658203125, -5.4302978515625, -5.13909912109375, -4.847900390625, -4.55670166015625, -4.2655029296875, -3.97430419921875, -3.68310546875, -3.39190673828125, -3.1007080078125, -2.80950927734375, -2.518310546875, -2.22711181640625, -1.9359130859375, -1.64471435546875, -1.353515625, -1.06231689453125, -0.7711181640625, -0.47991943359375, -0.188720703125, 0.10247802734375, 0.3936767578125, 0.68487548828125, 0.97607421875, 1.26727294921875, 1.5584716796875, 1.84967041015625, 2.140869140625, 2.43206787109375, 2.7232666015625, 3.01446533203125, 3.3056640625, 3.59686279296875, 3.8880615234375, 4.17926025390625, 4.470458984375, 4.76165771484375, 5.0528564453125, 5.34405517578125, 5.63525390625, 5.92645263671875, 6.2176513671875, 6.50885009765625, 6.800048828125, 7.09124755859375, 7.3824462890625, 7.67364501953125, 7.96484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 8.0, 7.0, 8.0, 8.0, 15.0, 6.0, 23.0, 16.0, 22.0, 30.0, 34.0, 34.0, 35.0, 33.0, 43.0, 34.0, 43.0, 42.0, 47.0, 45.0, 37.0, 35.0, 39.0, 38.0, 28.0, 37.0, 38.0, 25.0, 27.0, 20.0, 19.0, 18.0, 18.0, 22.0, 9.0, 12.0, 13.0, 5.0, 7.0, 2.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.41015625, -7.18218994140625, -6.9542236328125, -6.72625732421875, -6.498291015625, -6.27032470703125, -6.0423583984375, -5.81439208984375, -5.58642578125, -5.35845947265625, -5.1304931640625, -4.90252685546875, -4.674560546875, -4.44659423828125, -4.2186279296875, -3.99066162109375, -3.7626953125, -3.53472900390625, -3.3067626953125, -3.07879638671875, -2.850830078125, -2.62286376953125, -2.3948974609375, -2.16693115234375, -1.93896484375, -1.71099853515625, -1.4830322265625, -1.25506591796875, -1.027099609375, -0.79913330078125, -0.5711669921875, -0.34320068359375, -0.115234375, 0.11273193359375, 0.3406982421875, 0.56866455078125, 0.796630859375, 1.02459716796875, 1.2525634765625, 1.48052978515625, 1.70849609375, 1.93646240234375, 2.1644287109375, 2.39239501953125, 2.620361328125, 2.84832763671875, 3.0762939453125, 3.30426025390625, 3.5322265625, 3.76019287109375, 3.9881591796875, 4.21612548828125, 4.444091796875, 4.67205810546875, 4.9000244140625, 5.12799072265625, 5.35595703125, 5.58392333984375, 5.8118896484375, 6.03985595703125, 6.267822265625, 6.49578857421875, 6.7237548828125, 6.95172119140625, 7.1796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 12.0, 9.0, 18.0, 28.0, 37.0, 67.0, 70.0, 120.0, 137.0, 225.0, 363.0, 534.0, 863.0, 1447.0, 2445.0, 4582.0, 9016.0, 18886.0, 59556.0, 763574.0, 136640.0, 25406.0, 11312.0, 5578.0, 3019.0, 1676.0, 1058.0, 630.0, 397.0, 259.0, 188.0, 125.0, 79.0, 54.0, 50.0, 18.0, 19.0, 14.0, 14.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.28125, -3.180816650390625, -3.08038330078125, -2.979949951171875, -2.8795166015625, -2.779083251953125, -2.67864990234375, -2.578216552734375, -2.477783203125, -2.377349853515625, -2.27691650390625, -2.176483154296875, -2.0760498046875, -1.975616455078125, -1.87518310546875, -1.774749755859375, -1.67431640625, -1.573883056640625, -1.47344970703125, -1.373016357421875, -1.2725830078125, -1.172149658203125, -1.07171630859375, -0.971282958984375, -0.870849609375, -0.770416259765625, -0.66998291015625, -0.569549560546875, -0.4691162109375, -0.368682861328125, -0.26824951171875, -0.167816162109375, -0.0673828125, 0.033050537109375, 0.13348388671875, 0.233917236328125, 0.3343505859375, 0.434783935546875, 0.53521728515625, 0.635650634765625, 0.736083984375, 0.836517333984375, 0.93695068359375, 1.037384033203125, 1.1378173828125, 1.238250732421875, 1.33868408203125, 1.439117431640625, 1.53955078125, 1.639984130859375, 1.74041748046875, 1.840850830078125, 1.9412841796875, 2.041717529296875, 2.14215087890625, 2.242584228515625, 2.343017578125, 2.443450927734375, 2.54388427734375, 2.644317626953125, 2.7447509765625, 2.845184326171875, 2.94561767578125, 3.046051025390625, 3.146484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 6.0, 8.0, 4.0, 6.0, 14.0, 9.0, 17.0, 17.0, 27.0, 40.0, 39.0, 59.0, 62.0, 78.0, 88.0, 85.0, 59.0, 72.0, 64.0, 41.0, 48.0, 29.0, 21.0, 34.0, 16.0, 13.0, 11.0, 11.0, 4.0, 6.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008087158203125, -0.0007844269275665283, -0.0007601380348205566, -0.000735849142074585, -0.0007115602493286133, -0.0006872713565826416, -0.0006629824638366699, -0.0006386935710906982, -0.0006144046783447266, -0.0005901157855987549, -0.0005658268928527832, -0.0005415380001068115, -0.0005172491073608398, -0.0004929602146148682, -0.0004686713218688965, -0.0004443824291229248, -0.0004200935363769531, -0.00039580464363098145, -0.00037151575088500977, -0.0003472268581390381, -0.0003229379653930664, -0.0002986490726470947, -0.00027436017990112305, -0.00025007128715515137, -0.0002257823944091797, -0.000201493501663208, -0.00017720460891723633, -0.00015291571617126465, -0.00012862682342529297, -0.00010433793067932129, -8.004903793334961e-05, -5.576014518737793e-05, -3.147125244140625e-05, -7.18235969543457e-06, 1.710653305053711e-05, 4.139542579650879e-05, 6.568431854248047e-05, 8.997321128845215e-05, 0.00011426210403442383, 0.0001385509967803955, 0.0001628398895263672, 0.00018712878227233887, 0.00021141767501831055, 0.00023570656776428223, 0.0002599954605102539, 0.0002842843532562256, 0.00030857324600219727, 0.00033286213874816895, 0.0003571510314941406, 0.0003814399242401123, 0.000405728816986084, 0.00043001770973205566, 0.00045430660247802734, 0.000478595495223999, 0.0005028843879699707, 0.0005271732807159424, 0.0005514621734619141, 0.0005757510662078857, 0.0006000399589538574, 0.0006243288516998291, 0.0006486177444458008, 0.0006729066371917725, 0.0006971955299377441, 0.0007214844226837158, 0.0007457733154296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 7.0, 8.0, 11.0, 9.0, 8.0, 20.0, 25.0, 47.0, 62.0, 86.0, 130.0, 190.0, 248.0, 343.0, 569.0, 835.0, 1229.0, 1835.0, 2731.0, 4193.0, 6429.0, 9987.0, 15807.0, 25118.0, 41800.0, 70841.0, 123344.0, 191652.0, 203288.0, 140678.0, 81529.0, 46913.0, 28450.0, 17889.0, 11005.0, 7216.0, 4739.0, 3050.0, 1990.0, 1415.0, 878.0, 601.0, 451.0, 286.0, 193.0, 134.0, 99.0, 74.0, 35.0, 24.0, 23.0, 16.0, 9.0, 5.0, 3.0, 4.0, 0.0, 4.0], "bins": [-1.1611328125, -1.127105712890625, -1.09307861328125, -1.059051513671875, -1.0250244140625, -0.990997314453125, -0.95697021484375, -0.922943115234375, -0.888916015625, -0.854888916015625, -0.82086181640625, -0.786834716796875, -0.7528076171875, -0.718780517578125, -0.68475341796875, -0.650726318359375, -0.61669921875, -0.582672119140625, -0.54864501953125, -0.514617919921875, -0.4805908203125, -0.446563720703125, -0.41253662109375, -0.378509521484375, -0.344482421875, -0.310455322265625, -0.27642822265625, -0.242401123046875, -0.2083740234375, -0.174346923828125, -0.14031982421875, -0.106292724609375, -0.072265625, -0.038238525390625, -0.00421142578125, 0.029815673828125, 0.0638427734375, 0.097869873046875, 0.13189697265625, 0.165924072265625, 0.199951171875, 0.233978271484375, 0.26800537109375, 0.302032470703125, 0.3360595703125, 0.370086669921875, 0.40411376953125, 0.438140869140625, 0.47216796875, 0.506195068359375, 0.54022216796875, 0.574249267578125, 0.6082763671875, 0.642303466796875, 0.67633056640625, 0.710357666015625, 0.744384765625, 0.778411865234375, 0.81243896484375, 0.846466064453125, 0.8804931640625, 0.914520263671875, 0.94854736328125, 0.982574462890625, 1.0166015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 6.0, 9.0, 4.0, 8.0, 7.0, 12.0, 22.0, 19.0, 26.0, 24.0, 27.0, 32.0, 44.0, 32.0, 56.0, 39.0, 51.0, 39.0, 43.0, 51.0, 60.0, 44.0, 40.0, 41.0, 37.0, 37.0, 16.0, 25.0, 20.0, 15.0, 24.0, 13.0, 15.0, 5.0, 9.0, 7.0, 7.0, 7.0, 4.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.327880859375, -0.3172760009765625, -0.306671142578125, -0.2960662841796875, -0.28546142578125, -0.2748565673828125, -0.264251708984375, -0.2536468505859375, -0.2430419921875, -0.2324371337890625, -0.221832275390625, -0.2112274169921875, -0.20062255859375, -0.1900177001953125, -0.179412841796875, -0.1688079833984375, -0.158203125, -0.1475982666015625, -0.136993408203125, -0.1263885498046875, -0.11578369140625, -0.1051788330078125, -0.094573974609375, -0.0839691162109375, -0.0733642578125, -0.0627593994140625, -0.052154541015625, -0.0415496826171875, -0.03094482421875, -0.0203399658203125, -0.009735107421875, 0.0008697509765625, 0.011474609375, 0.0220794677734375, 0.032684326171875, 0.0432891845703125, 0.05389404296875, 0.0644989013671875, 0.075103759765625, 0.0857086181640625, 0.0963134765625, 0.1069183349609375, 0.117523193359375, 0.1281280517578125, 0.13873291015625, 0.1493377685546875, 0.159942626953125, 0.1705474853515625, 0.18115234375, 0.1917572021484375, 0.202362060546875, 0.2129669189453125, 0.22357177734375, 0.2341766357421875, 0.244781494140625, 0.2553863525390625, 0.2659912109375, 0.2765960693359375, 0.287200927734375, 0.2978057861328125, 0.30841064453125, 0.3190155029296875, 0.329620361328125, 0.3402252197265625, 0.350830078125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 8.0, 6.0, 6.0, 9.0, 5.0, 11.0, 16.0, 15.0, 18.0, 21.0, 31.0, 28.0, 40.0, 42.0, 31.0, 40.0, 50.0, 53.0, 52.0, 44.0, 58.0, 39.0, 57.0, 45.0, 33.0, 31.0, 28.0, 33.0, 30.0, 30.0, 17.0, 17.0, 12.0, 6.0, 10.0, 14.0, 4.0, 1.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.026797294616699, -6.820054054260254, -6.61331033706665, -6.406567096710205, -6.19982385635376, -5.993080139160156, -5.786336898803711, -5.579593658447266, -5.372849941253662, -5.166106700897217, -4.959362983703613, -4.752619743347168, -4.545876502990723, -4.339132785797119, -4.132389545440674, -3.9256460666656494, -3.718902826309204, -3.5121593475341797, -3.3054161071777344, -3.09867262840271, -2.8919291496276855, -2.6851859092712402, -2.478442430496216, -2.2716989517211914, -2.064955711364746, -1.8582123517990112, -1.6514688730239868, -1.444725513458252, -1.2379820346832275, -1.0312386751174927, -0.8244953155517578, -0.6177518367767334, -0.411008358001709, -0.20426495373249054, 0.0024784505367279053, 0.20922183990478516, 0.4159652590751648, 0.6227086782455444, 0.8294520378112793, 1.0361955165863037, 1.2429388761520386, 1.4496822357177734, 1.6564257144927979, 1.8631690740585327, 2.0699124336242676, 2.276655912399292, 2.4833993911743164, 2.6901426315307617, 2.896886110305786, 3.1036295890808105, 3.310372829437256, 3.5171163082122803, 3.7238597869873047, 3.93060302734375, 4.137346267700195, 4.344089984893799, 4.550833225250244, 4.7575764656066895, 4.964320182800293, 5.171063423156738, 5.377806663513184, 5.584550380706787, 5.791293621063232, 5.998037338256836, 6.204780578613281]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 5.0, 7.0, 6.0, 7.0, 14.0, 13.0, 17.0, 25.0, 17.0, 28.0, 19.0, 26.0, 30.0, 28.0, 38.0, 46.0, 45.0, 43.0, 48.0, 38.0, 38.0, 40.0, 41.0, 43.0, 26.0, 30.0, 37.0, 32.0, 25.0, 24.0, 20.0, 25.0, 16.0, 12.0, 15.0, 10.0, 8.0, 10.0, 6.0, 15.0, 4.0, 8.0, 1.0, 5.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265275001525879, -5.089991092681885, -4.914707660675049, -4.739423751831055, -4.564140319824219, -4.388856410980225, -4.2135725021362305, -4.0382890701293945, -3.8630053997039795, -3.6877217292785645, -3.5124380588531494, -3.3371543884277344, -3.1618704795837402, -2.9865870475769043, -2.81130313873291, -2.636019468307495, -2.46073579788208, -2.285452127456665, -2.11016845703125, -1.9348846673965454, -1.7596009969711304, -1.5843173265457153, -1.4090335369110107, -1.2337498664855957, -1.0584661960601807, -0.8831825256347656, -0.7078987956047058, -0.532615065574646, -0.35733139514923096, -0.18204772472381592, -0.006763935089111328, 0.1685197353363037, 0.34380388259887695, 0.519087553024292, 0.6943712830543518, 0.8696550130844116, 1.0449386835098267, 1.2202223539352417, 1.3955061435699463, 1.5707898139953613, 1.7460734844207764, 1.9213571548461914, 2.0966408252716064, 2.2719244956970215, 2.4472084045410156, 2.6224918365478516, 2.7977757453918457, 2.9730594158172607, 3.148343086242676, 3.323626756668091, 3.498910427093506, 3.6741943359375, 3.849477767944336, 4.02476167678833, 4.200045585632324, 4.37532901763916, 4.550612449645996, 4.72589635848999, 4.901179790496826, 5.07646369934082, 5.251747131347656, 5.42703104019165, 5.6023149490356445, 5.7775983810424805, 5.952882289886475]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 3.0, 10.0, 12.0, 14.0, 21.0, 42.0, 53.0, 64.0, 92.0, 156.0, 241.0, 408.0, 661.0, 1156.0, 2053.0, 4096.0, 8190.0, 17027.0, 35615.0, 73583.0, 136986.0, 205868.0, 218747.0, 161707.0, 92024.0, 46204.0, 21906.0, 10336.0, 5032.0, 2701.0, 1411.0, 828.0, 433.0, 297.0, 210.0, 113.0, 79.0, 52.0, 42.0, 26.0, 11.0, 16.0, 7.0, 4.0, 4.0, 8.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.546875, -7.3193359375, -7.091796875, -6.8642578125, -6.63671875, -6.4091796875, -6.181640625, -5.9541015625, -5.7265625, -5.4990234375, -5.271484375, -5.0439453125, -4.81640625, -4.5888671875, -4.361328125, -4.1337890625, -3.90625, -3.6787109375, -3.451171875, -3.2236328125, -2.99609375, -2.7685546875, -2.541015625, -2.3134765625, -2.0859375, -1.8583984375, -1.630859375, -1.4033203125, -1.17578125, -0.9482421875, -0.720703125, -0.4931640625, -0.265625, -0.0380859375, 0.189453125, 0.4169921875, 0.64453125, 0.8720703125, 1.099609375, 1.3271484375, 1.5546875, 1.7822265625, 2.009765625, 2.2373046875, 2.46484375, 2.6923828125, 2.919921875, 3.1474609375, 3.375, 3.6025390625, 3.830078125, 4.0576171875, 4.28515625, 4.5126953125, 4.740234375, 4.9677734375, 5.1953125, 5.4228515625, 5.650390625, 5.8779296875, 6.10546875, 6.3330078125, 6.560546875, 6.7880859375, 7.015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 9.0, 11.0, 6.0, 10.0, 7.0, 8.0, 12.0, 19.0, 21.0, 18.0, 25.0, 21.0, 20.0, 36.0, 35.0, 39.0, 44.0, 54.0, 30.0, 38.0, 39.0, 49.0, 39.0, 30.0, 32.0, 35.0, 42.0, 30.0, 26.0, 27.0, 24.0, 23.0, 22.0, 15.0, 12.0, 14.0, 15.0, 7.0, 9.0, 9.0, 7.0, 8.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.3828125, -5.218994140625, -5.05517578125, -4.891357421875, -4.7275390625, -4.563720703125, -4.39990234375, -4.236083984375, -4.072265625, -3.908447265625, -3.74462890625, -3.580810546875, -3.4169921875, -3.253173828125, -3.08935546875, -2.925537109375, -2.76171875, -2.597900390625, -2.43408203125, -2.270263671875, -2.1064453125, -1.942626953125, -1.77880859375, -1.614990234375, -1.451171875, -1.287353515625, -1.12353515625, -0.959716796875, -0.7958984375, -0.632080078125, -0.46826171875, -0.304443359375, -0.140625, 0.023193359375, 0.18701171875, 0.350830078125, 0.5146484375, 0.678466796875, 0.84228515625, 1.006103515625, 1.169921875, 1.333740234375, 1.49755859375, 1.661376953125, 1.8251953125, 1.989013671875, 2.15283203125, 2.316650390625, 2.48046875, 2.644287109375, 2.80810546875, 2.971923828125, 3.1357421875, 3.299560546875, 3.46337890625, 3.627197265625, 3.791015625, 3.954833984375, 4.11865234375, 4.282470703125, 4.4462890625, 4.610107421875, 4.77392578125, 4.937744140625, 5.1015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 11.0, 7.0, 6.0, 14.0, 22.0, 26.0, 49.0, 37.0, 84.0, 101.0, 143.0, 229.0, 382.0, 623.0, 1066.0, 1984.0, 3621.0, 6794.0, 13252.0, 27382.0, 56807.0, 111526.0, 190241.0, 232725.0, 186046.0, 107434.0, 54135.0, 26269.0, 12835.0, 6573.0, 3498.0, 1844.0, 1063.0, 643.0, 363.0, 224.0, 176.0, 90.0, 53.0, 50.0, 35.0, 26.0, 21.0, 19.0, 9.0, 5.0, 7.0, 0.0, 7.0, 0.0, 1.0, 5.0, 0.0, 1.0], "bins": [-9.6875, -9.3980712890625, -9.108642578125, -8.8192138671875, -8.52978515625, -8.2403564453125, -7.950927734375, -7.6614990234375, -7.3720703125, -7.0826416015625, -6.793212890625, -6.5037841796875, -6.21435546875, -5.9249267578125, -5.635498046875, -5.3460693359375, -5.056640625, -4.7672119140625, -4.477783203125, -4.1883544921875, -3.89892578125, -3.6094970703125, -3.320068359375, -3.0306396484375, -2.7412109375, -2.4517822265625, -2.162353515625, -1.8729248046875, -1.58349609375, -1.2940673828125, -1.004638671875, -0.7152099609375, -0.42578125, -0.1363525390625, 0.153076171875, 0.4425048828125, 0.73193359375, 1.0213623046875, 1.310791015625, 1.6002197265625, 1.8896484375, 2.1790771484375, 2.468505859375, 2.7579345703125, 3.04736328125, 3.3367919921875, 3.626220703125, 3.9156494140625, 4.205078125, 4.4945068359375, 4.783935546875, 5.0733642578125, 5.36279296875, 5.6522216796875, 5.941650390625, 6.2310791015625, 6.5205078125, 6.8099365234375, 7.099365234375, 7.3887939453125, 7.67822265625, 7.9676513671875, 8.257080078125, 8.5465087890625, 8.8359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 7.0, 10.0, 13.0, 10.0, 14.0, 17.0, 23.0, 19.0, 25.0, 35.0, 31.0, 34.0, 31.0, 26.0, 37.0, 34.0, 34.0, 39.0, 43.0, 53.0, 37.0, 35.0, 36.0, 36.0, 19.0, 25.0, 28.0, 32.0, 26.0, 27.0, 21.0, 19.0, 13.0, 15.0, 12.0, 13.0, 13.0, 9.0, 9.0, 9.0, 9.0, 2.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.4375, -3.324249267578125, -3.21099853515625, -3.097747802734375, -2.9844970703125, -2.871246337890625, -2.75799560546875, -2.644744873046875, -2.531494140625, -2.418243408203125, -2.30499267578125, -2.191741943359375, -2.0784912109375, -1.965240478515625, -1.85198974609375, -1.738739013671875, -1.62548828125, -1.512237548828125, -1.39898681640625, -1.285736083984375, -1.1724853515625, -1.059234619140625, -0.94598388671875, -0.832733154296875, -0.719482421875, -0.606231689453125, -0.49298095703125, -0.379730224609375, -0.2664794921875, -0.153228759765625, -0.03997802734375, 0.073272705078125, 0.1865234375, 0.299774169921875, 0.41302490234375, 0.526275634765625, 0.6395263671875, 0.752777099609375, 0.86602783203125, 0.979278564453125, 1.092529296875, 1.205780029296875, 1.31903076171875, 1.432281494140625, 1.5455322265625, 1.658782958984375, 1.77203369140625, 1.885284423828125, 1.99853515625, 2.111785888671875, 2.22503662109375, 2.338287353515625, 2.4515380859375, 2.564788818359375, 2.67803955078125, 2.791290283203125, 2.904541015625, 3.017791748046875, 3.13104248046875, 3.244293212890625, 3.3575439453125, 3.470794677734375, 3.58404541015625, 3.697296142578125, 3.810546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 8.0, 17.0, 17.0, 34.0, 34.0, 63.0, 84.0, 104.0, 141.0, 212.0, 308.0, 489.0, 613.0, 915.0, 1321.0, 2001.0, 2856.0, 4440.0, 7071.0, 12332.0, 22725.0, 45785.0, 102558.0, 228764.0, 297519.0, 167078.0, 72538.0, 33831.0, 17532.0, 9870.0, 5781.0, 3715.0, 2413.0, 1612.0, 1172.0, 785.0, 515.0, 390.0, 280.0, 183.0, 136.0, 100.0, 67.0, 43.0, 40.0, 15.0, 23.0, 10.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.2578125, -6.06402587890625, -5.8702392578125, -5.67645263671875, -5.482666015625, -5.28887939453125, -5.0950927734375, -4.90130615234375, -4.70751953125, -4.51373291015625, -4.3199462890625, -4.12615966796875, -3.932373046875, -3.73858642578125, -3.5447998046875, -3.35101318359375, -3.1572265625, -2.96343994140625, -2.7696533203125, -2.57586669921875, -2.382080078125, -2.18829345703125, -1.9945068359375, -1.80072021484375, -1.60693359375, -1.41314697265625, -1.2193603515625, -1.02557373046875, -0.831787109375, -0.63800048828125, -0.4442138671875, -0.25042724609375, -0.056640625, 0.13714599609375, 0.3309326171875, 0.52471923828125, 0.718505859375, 0.91229248046875, 1.1060791015625, 1.29986572265625, 1.49365234375, 1.68743896484375, 1.8812255859375, 2.07501220703125, 2.268798828125, 2.46258544921875, 2.6563720703125, 2.85015869140625, 3.0439453125, 3.23773193359375, 3.4315185546875, 3.62530517578125, 3.819091796875, 4.01287841796875, 4.2066650390625, 4.40045166015625, 4.59423828125, 4.78802490234375, 4.9818115234375, 5.17559814453125, 5.369384765625, 5.56317138671875, 5.7569580078125, 5.95074462890625, 6.14453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 5.0, 1.0, 2.0, 8.0, 17.0, 20.0, 22.0, 29.0, 48.0, 54.0, 99.0, 125.0, 147.0, 127.0, 85.0, 48.0, 40.0, 41.0, 24.0, 15.0, 16.0, 6.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005950927734375, -0.0005706474184989929, -0.0005462020635604858, -0.0005217567086219788, -0.0004973113536834717, -0.0004728659987449646, -0.0004484206438064575, -0.00042397528886795044, -0.00039952993392944336, -0.0003750845789909363, -0.0003506392240524292, -0.0003261938691139221, -0.00030174851417541504, -0.00027730315923690796, -0.0002528578042984009, -0.0002284124493598938, -0.00020396709442138672, -0.00017952173948287964, -0.00015507638454437256, -0.00013063102960586548, -0.0001061856746673584, -8.174031972885132e-05, -5.729496479034424e-05, -3.284960985183716e-05, -8.404254913330078e-06, 1.6041100025177002e-05, 4.048645496368408e-05, 6.493180990219116e-05, 8.937716484069824e-05, 0.00011382251977920532, 0.0001382678747177124, 0.00016271322965621948, 0.00018715858459472656, 0.00021160393953323364, 0.00023604929447174072, 0.0002604946494102478, 0.0002849400043487549, 0.00030938535928726196, 0.00033383071422576904, 0.0003582760691642761, 0.0003827214241027832, 0.0004071667790412903, 0.00043161213397979736, 0.00045605748891830444, 0.0004805028438568115, 0.0005049481987953186, 0.0005293935537338257, 0.0005538389086723328, 0.0005782842636108398, 0.0006027296185493469, 0.000627174973487854, 0.0006516203284263611, 0.0006760656833648682, 0.0007005110383033752, 0.0007249563932418823, 0.0007494017481803894, 0.0007738471031188965, 0.0007982924580574036, 0.0008227378129959106, 0.0008471831679344177, 0.0008716285228729248, 0.0008960738778114319, 0.000920519232749939, 0.000944964587688446, 0.0009694099426269531]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 9.0, 17.0, 19.0, 34.0, 51.0, 69.0, 95.0, 129.0, 224.0, 311.0, 402.0, 636.0, 1036.0, 1495.0, 2266.0, 3387.0, 5548.0, 9006.0, 14663.0, 25975.0, 48964.0, 96986.0, 186678.0, 255946.0, 185629.0, 95640.0, 48658.0, 25634.0, 14673.0, 8755.0, 5371.0, 3557.0, 2204.0, 1479.0, 983.0, 657.0, 441.0, 295.0, 189.0, 162.0, 79.0, 66.0, 44.0, 26.0, 17.0, 15.0, 11.0, 5.0, 8.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.171875, -5.00225830078125, -4.8326416015625, -4.66302490234375, -4.493408203125, -4.32379150390625, -4.1541748046875, -3.98455810546875, -3.81494140625, -3.64532470703125, -3.4757080078125, -3.30609130859375, -3.136474609375, -2.96685791015625, -2.7972412109375, -2.62762451171875, -2.4580078125, -2.28839111328125, -2.1187744140625, -1.94915771484375, -1.779541015625, -1.60992431640625, -1.4403076171875, -1.27069091796875, -1.10107421875, -0.93145751953125, -0.7618408203125, -0.59222412109375, -0.422607421875, -0.25299072265625, -0.0833740234375, 0.08624267578125, 0.255859375, 0.42547607421875, 0.5950927734375, 0.76470947265625, 0.934326171875, 1.10394287109375, 1.2735595703125, 1.44317626953125, 1.61279296875, 1.78240966796875, 1.9520263671875, 2.12164306640625, 2.291259765625, 2.46087646484375, 2.6304931640625, 2.80010986328125, 2.9697265625, 3.13934326171875, 3.3089599609375, 3.47857666015625, 3.648193359375, 3.81781005859375, 3.9874267578125, 4.15704345703125, 4.32666015625, 4.49627685546875, 4.6658935546875, 4.83551025390625, 5.005126953125, 5.17474365234375, 5.3443603515625, 5.51397705078125, 5.68359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 0.0, 8.0, 9.0, 10.0, 6.0, 12.0, 9.0, 15.0, 12.0, 22.0, 24.0, 23.0, 38.0, 24.0, 46.0, 53.0, 56.0, 71.0, 65.0, 78.0, 52.0, 57.0, 57.0, 45.0, 37.0, 30.0, 29.0, 25.0, 9.0, 11.0, 9.0, 7.0, 8.0, 8.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5400390625, -1.4908905029296875, -1.441741943359375, -1.3925933837890625, -1.34344482421875, -1.2942962646484375, -1.245147705078125, -1.1959991455078125, -1.1468505859375, -1.0977020263671875, -1.048553466796875, -0.9994049072265625, -0.95025634765625, -0.9011077880859375, -0.851959228515625, -0.8028106689453125, -0.753662109375, -0.7045135498046875, -0.655364990234375, -0.6062164306640625, -0.55706787109375, -0.5079193115234375, -0.458770751953125, -0.4096221923828125, -0.3604736328125, -0.3113250732421875, -0.262176513671875, -0.2130279541015625, -0.16387939453125, -0.1147308349609375, -0.065582275390625, -0.0164337158203125, 0.03271484375, 0.0818634033203125, 0.131011962890625, 0.1801605224609375, 0.22930908203125, 0.2784576416015625, 0.327606201171875, 0.3767547607421875, 0.4259033203125, 0.4750518798828125, 0.524200439453125, 0.5733489990234375, 0.62249755859375, 0.6716461181640625, 0.720794677734375, 0.7699432373046875, 0.819091796875, 0.8682403564453125, 0.917388916015625, 0.9665374755859375, 1.01568603515625, 1.0648345947265625, 1.113983154296875, 1.1631317138671875, 1.2122802734375, 1.2614288330078125, 1.310577392578125, 1.3597259521484375, 1.40887451171875, 1.4580230712890625, 1.507171630859375, 1.5563201904296875, 1.60546875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 5.0, 2.0, 12.0, 12.0, 15.0, 19.0, 23.0, 25.0, 17.0, 22.0, 31.0, 34.0, 43.0, 50.0, 40.0, 37.0, 50.0, 45.0, 47.0, 56.0, 48.0, 47.0, 38.0, 47.0, 33.0, 35.0, 22.0, 23.0, 18.0, 20.0, 14.0, 6.0, 9.0, 7.0, 9.0, 9.0, 7.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.751357555389404, -6.550340175628662, -6.349322319030762, -6.1483049392700195, -5.947287559509277, -5.746270179748535, -5.545252799987793, -5.344234943389893, -5.14321756362915, -4.942200183868408, -4.741182327270508, -4.540164947509766, -4.339147567749023, -4.138130187988281, -3.93711256980896, -3.7360949516296387, -3.5350775718688965, -3.3340601921081543, -3.133042573928833, -2.9320249557495117, -2.7310075759887695, -2.5299901962280273, -2.328972578048706, -2.1279549598693848, -1.9269375801086426, -1.7259200811386108, -1.524902582168579, -1.3238850831985474, -1.1228675842285156, -0.9218500852584839, -0.7208325862884521, -0.5198150873184204, -0.31879711151123047, -0.11777961254119873, 0.08323788642883301, 0.28425538539886475, 0.4852728843688965, 0.6862903833389282, 0.88730788230896, 1.0883253812789917, 1.2893428802490234, 1.4903603792190552, 1.691377878189087, 1.8923953771591187, 2.0934128761291504, 2.2944302558898926, 2.495447874069214, 2.696465492248535, 2.8974828720092773, 3.0985002517700195, 3.299517869949341, 3.500535488128662, 3.7015528678894043, 3.9025702476501465, 4.103588104248047, 4.304605484008789, 4.505622863769531, 4.706640243530273, 4.907657623291016, 5.108675479888916, 5.309692859649658, 5.5107102394104, 5.711728096008301, 5.912745475769043, 6.113762855529785]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 9.0, 6.0, 7.0, 12.0, 14.0, 15.0, 13.0, 13.0, 16.0, 12.0, 20.0, 19.0, 34.0, 36.0, 38.0, 24.0, 39.0, 43.0, 47.0, 43.0, 39.0, 50.0, 29.0, 31.0, 46.0, 33.0, 29.0, 29.0, 24.0, 29.0, 28.0, 19.0, 20.0, 23.0, 15.0, 11.0, 15.0, 15.0, 9.0, 11.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.359649658203125, -5.188055992126465, -5.016462326049805, -4.8448686599731445, -4.673274993896484, -4.501681327819824, -4.330087661743164, -4.158493995666504, -3.9869003295898438, -3.8153066635131836, -3.6437129974365234, -3.4721193313598633, -3.300525665283203, -3.128931999206543, -2.957338333129883, -2.7857446670532227, -2.6141512393951416, -2.4425575733184814, -2.2709639072418213, -2.099370241165161, -1.927776575088501, -1.7561829090118408, -1.5845893621444702, -1.41299569606781, -1.24140202999115, -1.0698083639144897, -0.8982146978378296, -0.7266210913658142, -0.555027425289154, -0.3834337592124939, -0.21184015274047852, -0.04024648666381836, 0.1313471794128418, 0.30294084548950195, 0.4745344817638397, 0.6461281180381775, 0.8177217841148376, 0.9893154501914978, 1.1609090566635132, 1.3325027227401733, 1.5040963888168335, 1.6756900548934937, 1.8472837209701538, 2.0188772678375244, 2.1904709339141846, 2.3620645999908447, 2.533658266067505, 2.705251932144165, 2.876845598220825, 3.0484392642974854, 3.2200329303741455, 3.3916265964508057, 3.563220262527466, 3.734813928604126, 3.906407356262207, 4.078001022338867, 4.249594688415527, 4.4211883544921875, 4.592782020568848, 4.764375686645508, 4.935969352722168, 5.107563018798828, 5.279156684875488, 5.450750350952148, 5.622344017028809]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 23.0, 28.0, 37.0, 38.0, 73.0, 113.0, 155.0, 191.0, 284.0, 482.0, 695.0, 1061.0, 1667.0, 2837.0, 4741.0, 8248.0, 15437.0, 30967.0, 68214.0, 164025.0, 384963.0, 752434.0, 1019170.0, 860038.0, 485062.0, 218662.0, 91318.0, 40006.0, 19277.0, 9866.0, 5401.0, 3205.0, 1989.0, 1219.0, 808.0, 522.0, 345.0, 200.0, 144.0, 94.0, 78.0, 50.0, 35.0, 17.0, 18.0, 15.0, 6.0, 5.0, 1.0, 1.0, 3.0], "bins": [-7.578125, -7.3656005859375, -7.153076171875, -6.9405517578125, -6.72802734375, -6.5155029296875, -6.302978515625, -6.0904541015625, -5.8779296875, -5.6654052734375, -5.452880859375, -5.2403564453125, -5.02783203125, -4.8153076171875, -4.602783203125, -4.3902587890625, -4.177734375, -3.9652099609375, -3.752685546875, -3.5401611328125, -3.32763671875, -3.1151123046875, -2.902587890625, -2.6900634765625, -2.4775390625, -2.2650146484375, -2.052490234375, -1.8399658203125, -1.62744140625, -1.4149169921875, -1.202392578125, -0.9898681640625, -0.77734375, -0.5648193359375, -0.352294921875, -0.1397705078125, 0.07275390625, 0.2852783203125, 0.497802734375, 0.7103271484375, 0.9228515625, 1.1353759765625, 1.347900390625, 1.5604248046875, 1.77294921875, 1.9854736328125, 2.197998046875, 2.4105224609375, 2.623046875, 2.8355712890625, 3.048095703125, 3.2606201171875, 3.47314453125, 3.6856689453125, 3.898193359375, 4.1107177734375, 4.3232421875, 4.5357666015625, 4.748291015625, 4.9608154296875, 5.17333984375, 5.3858642578125, 5.598388671875, 5.8109130859375, 6.0234375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 6.0, 3.0, 9.0, 3.0, 4.0, 9.0, 12.0, 12.0, 16.0, 16.0, 11.0, 19.0, 10.0, 29.0, 29.0, 34.0, 44.0, 27.0, 37.0, 37.0, 51.0, 56.0, 52.0, 46.0, 33.0, 43.0, 34.0, 29.0, 27.0, 31.0, 23.0, 24.0, 30.0, 20.0, 23.0, 21.0, 10.0, 11.0, 14.0, 12.0, 13.0, 7.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.25390625, -5.09735107421875, -4.9407958984375, -4.78424072265625, -4.627685546875, -4.47113037109375, -4.3145751953125, -4.15802001953125, -4.00146484375, -3.84490966796875, -3.6883544921875, -3.53179931640625, -3.375244140625, -3.21868896484375, -3.0621337890625, -2.90557861328125, -2.7490234375, -2.59246826171875, -2.4359130859375, -2.27935791015625, -2.122802734375, -1.96624755859375, -1.8096923828125, -1.65313720703125, -1.49658203125, -1.34002685546875, -1.1834716796875, -1.02691650390625, -0.870361328125, -0.71380615234375, -0.5572509765625, -0.40069580078125, -0.244140625, -0.08758544921875, 0.0689697265625, 0.22552490234375, 0.382080078125, 0.53863525390625, 0.6951904296875, 0.85174560546875, 1.00830078125, 1.16485595703125, 1.3214111328125, 1.47796630859375, 1.634521484375, 1.79107666015625, 1.9476318359375, 2.10418701171875, 2.2607421875, 2.41729736328125, 2.5738525390625, 2.73040771484375, 2.886962890625, 3.04351806640625, 3.2000732421875, 3.35662841796875, 3.51318359375, 3.66973876953125, 3.8262939453125, 3.98284912109375, 4.139404296875, 4.29595947265625, 4.4525146484375, 4.60906982421875, 4.765625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 3.0, 7.0, 11.0, 10.0, 18.0, 16.0, 27.0, 42.0, 55.0, 89.0, 133.0, 209.0, 305.0, 416.0, 644.0, 1040.0, 1543.0, 2700.0, 4520.0, 8078.0, 15076.0, 30470.0, 65186.0, 149510.0, 349975.0, 746921.0, 1107254.0, 893125.0, 455325.0, 195980.0, 84301.0, 38566.0, 19013.0, 10026.0, 5327.0, 3156.0, 1823.0, 1133.0, 774.0, 489.0, 311.0, 214.0, 142.0, 114.0, 66.0, 45.0, 28.0, 25.0, 14.0, 12.0, 6.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0], "bins": [-9.828125, -9.5361328125, -9.244140625, -8.9521484375, -8.66015625, -8.3681640625, -8.076171875, -7.7841796875, -7.4921875, -7.2001953125, -6.908203125, -6.6162109375, -6.32421875, -6.0322265625, -5.740234375, -5.4482421875, -5.15625, -4.8642578125, -4.572265625, -4.2802734375, -3.98828125, -3.6962890625, -3.404296875, -3.1123046875, -2.8203125, -2.5283203125, -2.236328125, -1.9443359375, -1.65234375, -1.3603515625, -1.068359375, -0.7763671875, -0.484375, -0.1923828125, 0.099609375, 0.3916015625, 0.68359375, 0.9755859375, 1.267578125, 1.5595703125, 1.8515625, 2.1435546875, 2.435546875, 2.7275390625, 3.01953125, 3.3115234375, 3.603515625, 3.8955078125, 4.1875, 4.4794921875, 4.771484375, 5.0634765625, 5.35546875, 5.6474609375, 5.939453125, 6.2314453125, 6.5234375, 6.8154296875, 7.107421875, 7.3994140625, 7.69140625, 7.9833984375, 8.275390625, 8.5673828125, 8.859375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 7.0, 8.0, 17.0, 18.0, 19.0, 21.0, 34.0, 57.0, 65.0, 76.0, 130.0, 157.0, 185.0, 235.0, 267.0, 296.0, 286.0, 300.0, 302.0, 306.0, 243.0, 226.0, 196.0, 122.0, 120.0, 86.0, 68.0, 59.0, 47.0, 27.0, 28.0, 18.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.96484375, -2.869964599609375, -2.77508544921875, -2.680206298828125, -2.5853271484375, -2.490447998046875, -2.39556884765625, -2.300689697265625, -2.205810546875, -2.110931396484375, -2.01605224609375, -1.921173095703125, -1.8262939453125, -1.731414794921875, -1.63653564453125, -1.541656494140625, -1.44677734375, -1.351898193359375, -1.25701904296875, -1.162139892578125, -1.0672607421875, -0.972381591796875, -0.87750244140625, -0.782623291015625, -0.687744140625, -0.592864990234375, -0.49798583984375, -0.403106689453125, -0.3082275390625, -0.213348388671875, -0.11846923828125, -0.023590087890625, 0.0712890625, 0.166168212890625, 0.26104736328125, 0.355926513671875, 0.4508056640625, 0.545684814453125, 0.64056396484375, 0.735443115234375, 0.830322265625, 0.925201416015625, 1.02008056640625, 1.114959716796875, 1.2098388671875, 1.304718017578125, 1.39959716796875, 1.494476318359375, 1.58935546875, 1.684234619140625, 1.77911376953125, 1.873992919921875, 1.9688720703125, 2.063751220703125, 2.15863037109375, 2.253509521484375, 2.348388671875, 2.443267822265625, 2.53814697265625, 2.633026123046875, 2.7279052734375, 2.822784423828125, 2.91766357421875, 3.012542724609375, 3.107421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 8.0, 4.0, 7.0, 11.0, 13.0, 13.0, 12.0, 8.0, 25.0, 20.0, 22.0, 23.0, 21.0, 33.0, 26.0, 37.0, 43.0, 33.0, 51.0, 54.0, 37.0, 53.0, 43.0, 43.0, 48.0, 41.0, 39.0, 28.0, 29.0, 22.0, 22.0, 26.0, 18.0, 16.0, 12.0, 14.0, 10.0, 6.0, 5.0, 8.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0], "bins": [-6.423177242279053, -6.237593173980713, -6.052008628845215, -5.866424560546875, -5.680840492248535, -5.495256423950195, -5.309671878814697, -5.124087810516357, -4.938503742218018, -4.752919673919678, -4.56733512878418, -4.38175106048584, -4.1961669921875, -4.01058292388916, -3.824998378753662, -3.6394143104553223, -3.4538300037384033, -3.2682456970214844, -3.0826616287231445, -2.8970773220062256, -2.7114932537078857, -2.525908946990967, -2.340324878692627, -2.154740571975708, -1.9691563844680786, -1.7835721969604492, -1.5979880094528198, -1.4124038219451904, -1.2268195152282715, -1.0412354469299316, -0.8556511402130127, -0.6700669527053833, -0.4844827651977539, -0.2988985776901245, -0.11331436038017273, 0.07226985692977905, 0.25785404443740845, 0.44343823194503784, 0.629022479057312, 0.8146066665649414, 1.0001908540725708, 1.1857750415802002, 1.3713592290878296, 1.556943416595459, 1.742527723312378, 1.9281117916107178, 2.1136960983276367, 2.2992801666259766, 2.4848644733428955, 2.6704487800598145, 2.8560328483581543, 3.0416171550750732, 3.227201223373413, 3.412785530090332, 3.598369598388672, 3.783953905105591, 3.9695382118225098, 4.15512228012085, 4.340706825256348, 4.5262908935546875, 4.711874961853027, 4.897459030151367, 5.083043575286865, 5.268627643585205, 5.454211711883545]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 2.0, 6.0, 10.0, 14.0, 8.0, 13.0, 15.0, 17.0, 17.0, 23.0, 23.0, 17.0, 29.0, 29.0, 42.0, 37.0, 41.0, 32.0, 47.0, 38.0, 38.0, 43.0, 49.0, 39.0, 37.0, 33.0, 28.0, 31.0, 35.0, 30.0, 26.0, 15.0, 17.0, 17.0, 13.0, 18.0, 11.0, 7.0, 13.0, 2.0, 9.0, 7.0, 4.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.577944278717041, -5.405832290649414, -5.233720779418945, -5.061608791351318, -4.889496803283691, -4.7173848152160645, -4.5452728271484375, -4.373161315917969, -4.201049327850342, -4.028937339782715, -3.856825590133667, -3.684713840484619, -3.512601852416992, -3.3404898643493652, -3.1683781147003174, -2.9962663650512695, -2.8241543769836426, -2.6520423889160156, -2.4799306392669678, -2.30781888961792, -2.135706901550293, -1.9635950326919556, -1.7914831638336182, -1.6193712949752808, -1.4472594261169434, -1.275147557258606, -1.1030356884002686, -0.9309238195419312, -0.7588119506835938, -0.5867000818252563, -0.41458821296691895, -0.24247634410858154, -0.07036495208740234, 0.10174691677093506, 0.27385878562927246, 0.44597065448760986, 0.6180825233459473, 0.7901943922042847, 0.9623062610626221, 1.1344181299209595, 1.3065299987792969, 1.4786418676376343, 1.6507537364959717, 1.822865605354309, 1.9949774742126465, 2.1670894622802734, 2.3392012119293213, 2.511312961578369, 2.683424949645996, 2.855536937713623, 3.027648687362671, 3.1997604370117188, 3.3718724250793457, 3.5439844131469727, 3.7160961627960205, 3.8882079124450684, 4.060319900512695, 4.232431888580322, 4.404543876647949, 4.576655387878418, 4.748767375946045, 4.920879364013672, 5.092990875244141, 5.265102863311768, 5.4372148513793945]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 8.0, 16.0, 16.0, 24.0, 29.0, 61.0, 70.0, 109.0, 191.0, 253.0, 405.0, 603.0, 909.0, 1316.0, 1916.0, 2853.0, 4221.0, 6374.0, 9305.0, 13761.0, 20525.0, 29125.0, 42706.0, 59439.0, 80117.0, 100298.0, 115028.0, 119466.0, 109862.0, 91851.0, 71092.0, 51645.0, 36856.0, 25018.0, 17044.0, 11717.0, 7830.0, 5432.0, 3616.0, 2412.0, 1671.0, 1092.0, 747.0, 477.0, 366.0, 247.0, 159.0, 92.0, 57.0, 43.0, 34.0, 26.0, 11.0, 8.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0], "bins": [-2.830078125, -2.7396240234375, -2.649169921875, -2.5587158203125, -2.46826171875, -2.3778076171875, -2.287353515625, -2.1968994140625, -2.1064453125, -2.0159912109375, -1.925537109375, -1.8350830078125, -1.74462890625, -1.6541748046875, -1.563720703125, -1.4732666015625, -1.3828125, -1.2923583984375, -1.201904296875, -1.1114501953125, -1.02099609375, -0.9305419921875, -0.840087890625, -0.7496337890625, -0.6591796875, -0.5687255859375, -0.478271484375, -0.3878173828125, -0.29736328125, -0.2069091796875, -0.116455078125, -0.0260009765625, 0.064453125, 0.1549072265625, 0.245361328125, 0.3358154296875, 0.42626953125, 0.5167236328125, 0.607177734375, 0.6976318359375, 0.7880859375, 0.8785400390625, 0.968994140625, 1.0594482421875, 1.14990234375, 1.2403564453125, 1.330810546875, 1.4212646484375, 1.51171875, 1.6021728515625, 1.692626953125, 1.7830810546875, 1.87353515625, 1.9639892578125, 2.054443359375, 2.1448974609375, 2.2353515625, 2.3258056640625, 2.416259765625, 2.5067138671875, 2.59716796875, 2.6876220703125, 2.778076171875, 2.8685302734375, 2.958984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 8.0, 6.0, 9.0, 11.0, 11.0, 8.0, 13.0, 19.0, 21.0, 26.0, 28.0, 35.0, 21.0, 36.0, 47.0, 44.0, 41.0, 36.0, 48.0, 41.0, 42.0, 54.0, 41.0, 43.0, 47.0, 26.0, 32.0, 27.0, 29.0, 21.0, 23.0, 16.0, 13.0, 7.0, 18.0, 11.0, 5.0, 3.0, 8.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.76171875, -6.57098388671875, -6.3802490234375, -6.18951416015625, -5.998779296875, -5.80804443359375, -5.6173095703125, -5.42657470703125, -5.23583984375, -5.04510498046875, -4.8543701171875, -4.66363525390625, -4.472900390625, -4.28216552734375, -4.0914306640625, -3.90069580078125, -3.7099609375, -3.51922607421875, -3.3284912109375, -3.13775634765625, -2.947021484375, -2.75628662109375, -2.5655517578125, -2.37481689453125, -2.18408203125, -1.99334716796875, -1.8026123046875, -1.61187744140625, -1.421142578125, -1.23040771484375, -1.0396728515625, -0.84893798828125, -0.658203125, -0.46746826171875, -0.2767333984375, -0.08599853515625, 0.104736328125, 0.29547119140625, 0.4862060546875, 0.67694091796875, 0.86767578125, 1.05841064453125, 1.2491455078125, 1.43988037109375, 1.630615234375, 1.82135009765625, 2.0120849609375, 2.20281982421875, 2.3935546875, 2.58428955078125, 2.7750244140625, 2.96575927734375, 3.156494140625, 3.34722900390625, 3.5379638671875, 3.72869873046875, 3.91943359375, 4.11016845703125, 4.3009033203125, 4.49163818359375, 4.682373046875, 4.87310791015625, 5.0638427734375, 5.25457763671875, 5.4453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 7.0, 5.0, 11.0, 10.0, 28.0, 27.0, 56.0, 81.0, 140.0, 195.0, 311.0, 471.0, 739.0, 1072.0, 1776.0, 2644.0, 4358.0, 6641.0, 10718.0, 16914.0, 29851.0, 166190.0, 676791.0, 67381.0, 23516.0, 14388.0, 8974.0, 5585.0, 3445.0, 2275.0, 1457.0, 839.0, 599.0, 365.0, 231.0, 156.0, 96.0, 73.0, 52.0, 32.0, 16.0, 16.0, 14.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.98046875, -6.77099609375, -6.5615234375, -6.35205078125, -6.142578125, -5.93310546875, -5.7236328125, -5.51416015625, -5.3046875, -5.09521484375, -4.8857421875, -4.67626953125, -4.466796875, -4.25732421875, -4.0478515625, -3.83837890625, -3.62890625, -3.41943359375, -3.2099609375, -3.00048828125, -2.791015625, -2.58154296875, -2.3720703125, -2.16259765625, -1.953125, -1.74365234375, -1.5341796875, -1.32470703125, -1.115234375, -0.90576171875, -0.6962890625, -0.48681640625, -0.27734375, -0.06787109375, 0.1416015625, 0.35107421875, 0.560546875, 0.77001953125, 0.9794921875, 1.18896484375, 1.3984375, 1.60791015625, 1.8173828125, 2.02685546875, 2.236328125, 2.44580078125, 2.6552734375, 2.86474609375, 3.07421875, 3.28369140625, 3.4931640625, 3.70263671875, 3.912109375, 4.12158203125, 4.3310546875, 4.54052734375, 4.75, 4.95947265625, 5.1689453125, 5.37841796875, 5.587890625, 5.79736328125, 6.0068359375, 6.21630859375, 6.42578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 9.0, 8.0, 12.0, 8.0, 14.0, 14.0, 13.0, 15.0, 19.0, 23.0, 26.0, 31.0, 44.0, 29.0, 30.0, 29.0, 47.0, 39.0, 29.0, 44.0, 43.0, 45.0, 42.0, 37.0, 31.0, 33.0, 31.0, 32.0, 22.0, 27.0, 24.0, 14.0, 13.0, 9.0, 23.0, 8.0, 16.0, 13.0, 14.0, 6.0, 11.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.92578125, -4.76007080078125, -4.5943603515625, -4.42864990234375, -4.262939453125, -4.09722900390625, -3.9315185546875, -3.76580810546875, -3.60009765625, -3.43438720703125, -3.2686767578125, -3.10296630859375, -2.937255859375, -2.77154541015625, -2.6058349609375, -2.44012451171875, -2.2744140625, -2.10870361328125, -1.9429931640625, -1.77728271484375, -1.611572265625, -1.44586181640625, -1.2801513671875, -1.11444091796875, -0.94873046875, -0.78302001953125, -0.6173095703125, -0.45159912109375, -0.285888671875, -0.12017822265625, 0.0455322265625, 0.21124267578125, 0.376953125, 0.54266357421875, 0.7083740234375, 0.87408447265625, 1.039794921875, 1.20550537109375, 1.3712158203125, 1.53692626953125, 1.70263671875, 1.86834716796875, 2.0340576171875, 2.19976806640625, 2.365478515625, 2.53118896484375, 2.6968994140625, 2.86260986328125, 3.0283203125, 3.19403076171875, 3.3597412109375, 3.52545166015625, 3.691162109375, 3.85687255859375, 4.0225830078125, 4.18829345703125, 4.35400390625, 4.51971435546875, 4.6854248046875, 4.85113525390625, 5.016845703125, 5.18255615234375, 5.3482666015625, 5.51397705078125, 5.6796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 6.0, 11.0, 8.0, 9.0, 15.0, 28.0, 36.0, 50.0, 70.0, 104.0, 163.0, 291.0, 478.0, 791.0, 1288.0, 2415.0, 4648.0, 10084.0, 27660.0, 270377.0, 668699.0, 37070.0, 12258.0, 5452.0, 2729.0, 1509.0, 869.0, 495.0, 338.0, 202.0, 128.0, 96.0, 54.0, 37.0, 29.0, 19.0, 8.0, 6.0, 9.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.912109375, -2.82916259765625, -2.7462158203125, -2.66326904296875, -2.580322265625, -2.49737548828125, -2.4144287109375, -2.33148193359375, -2.24853515625, -2.16558837890625, -2.0826416015625, -1.99969482421875, -1.916748046875, -1.83380126953125, -1.7508544921875, -1.66790771484375, -1.5849609375, -1.50201416015625, -1.4190673828125, -1.33612060546875, -1.253173828125, -1.17022705078125, -1.0872802734375, -1.00433349609375, -0.92138671875, -0.83843994140625, -0.7554931640625, -0.67254638671875, -0.589599609375, -0.50665283203125, -0.4237060546875, -0.34075927734375, -0.2578125, -0.17486572265625, -0.0919189453125, -0.00897216796875, 0.073974609375, 0.15692138671875, 0.2398681640625, 0.32281494140625, 0.40576171875, 0.48870849609375, 0.5716552734375, 0.65460205078125, 0.737548828125, 0.82049560546875, 0.9034423828125, 0.98638916015625, 1.0693359375, 1.15228271484375, 1.2352294921875, 1.31817626953125, 1.401123046875, 1.48406982421875, 1.5670166015625, 1.64996337890625, 1.73291015625, 1.81585693359375, 1.8988037109375, 1.98175048828125, 2.064697265625, 2.14764404296875, 2.2305908203125, 2.31353759765625, 2.396484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 6.0, 2.0, 3.0, 2.0, 5.0, 9.0, 10.0, 11.0, 10.0, 11.0, 16.0, 13.0, 28.0, 19.0, 51.0, 44.0, 50.0, 67.0, 58.0, 60.0, 87.0, 65.0, 74.0, 60.0, 53.0, 43.0, 31.0, 22.0, 19.0, 12.0, 10.0, 10.0, 11.0, 8.0, 7.0, 3.0, 4.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037479400634765625, -0.00036147981882095337, -0.0003481656312942505, -0.0003348514437675476, -0.0003215372562408447, -0.00030822306871414185, -0.00029490888118743896, -0.0002815946936607361, -0.0002682805061340332, -0.0002549663186073303, -0.00024165213108062744, -0.00022833794355392456, -0.00021502375602722168, -0.0002017095685005188, -0.00018839538097381592, -0.00017508119344711304, -0.00016176700592041016, -0.00014845281839370728, -0.0001351386308670044, -0.00012182444334030151, -0.00010851025581359863, -9.519606828689575e-05, -8.188188076019287e-05, -6.856769323348999e-05, -5.525350570678711e-05, -4.193931818008423e-05, -2.8625130653381348e-05, -1.5310943126678467e-05, -1.996755599975586e-06, 1.1317431926727295e-05, 2.4631619453430176e-05, 3.794580698013306e-05, 5.125999450683594e-05, 6.457418203353882e-05, 7.78883695602417e-05, 9.120255708694458e-05, 0.00010451674461364746, 0.00011783093214035034, 0.00013114511966705322, 0.0001444593071937561, 0.00015777349472045898, 0.00017108768224716187, 0.00018440186977386475, 0.00019771605730056763, 0.0002110302448272705, 0.0002243444323539734, 0.00023765861988067627, 0.00025097280740737915, 0.00026428699493408203, 0.0002776011824607849, 0.0002909153699874878, 0.0003042295575141907, 0.00031754374504089355, 0.00033085793256759644, 0.0003441721200942993, 0.0003574863076210022, 0.0003708004951477051, 0.00038411468267440796, 0.00039742887020111084, 0.0004107430577278137, 0.0004240572452545166, 0.0004373714327812195, 0.00045068562030792236, 0.00046399980783462524, 0.0004773139953613281]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 6.0, 7.0, 14.0, 29.0, 29.0, 43.0, 68.0, 97.0, 147.0, 163.0, 265.0, 415.0, 619.0, 1041.0, 1490.0, 2397.0, 3825.0, 6498.0, 10887.0, 19807.0, 37453.0, 77798.0, 183408.0, 332552.0, 197443.0, 82558.0, 39546.0, 20644.0, 11421.0, 6786.0, 4011.0, 2532.0, 1572.0, 1044.0, 655.0, 430.0, 275.0, 173.0, 121.0, 81.0, 73.0, 41.0, 27.0, 16.0, 12.0, 9.0, 6.0, 8.0, 4.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.2353515625, -1.1949005126953125, -1.154449462890625, -1.1139984130859375, -1.07354736328125, -1.0330963134765625, -0.992645263671875, -0.9521942138671875, -0.9117431640625, -0.8712921142578125, -0.830841064453125, -0.7903900146484375, -0.74993896484375, -0.7094879150390625, -0.669036865234375, -0.6285858154296875, -0.588134765625, -0.5476837158203125, -0.507232666015625, -0.4667816162109375, -0.42633056640625, -0.3858795166015625, -0.345428466796875, -0.3049774169921875, -0.2645263671875, -0.2240753173828125, -0.183624267578125, -0.1431732177734375, -0.10272216796875, -0.0622711181640625, -0.021820068359375, 0.0186309814453125, 0.05908203125, 0.0995330810546875, 0.139984130859375, 0.1804351806640625, 0.22088623046875, 0.2613372802734375, 0.301788330078125, 0.3422393798828125, 0.3826904296875, 0.4231414794921875, 0.463592529296875, 0.5040435791015625, 0.54449462890625, 0.5849456787109375, 0.625396728515625, 0.6658477783203125, 0.706298828125, 0.7467498779296875, 0.787200927734375, 0.8276519775390625, 0.86810302734375, 0.9085540771484375, 0.949005126953125, 0.9894561767578125, 1.0299072265625, 1.0703582763671875, 1.110809326171875, 1.1512603759765625, 1.19171142578125, 1.2321624755859375, 1.272613525390625, 1.3130645751953125, 1.353515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 3.0, 9.0, 12.0, 4.0, 8.0, 16.0, 18.0, 27.0, 23.0, 28.0, 39.0, 39.0, 57.0, 64.0, 63.0, 64.0, 70.0, 66.0, 61.0, 41.0, 48.0, 44.0, 44.0, 25.0, 19.0, 20.0, 14.0, 15.0, 7.0, 14.0, 3.0, 8.0, 3.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.41943359375, -0.4078102111816406, -0.39618682861328125, -0.3845634460449219, -0.3729400634765625, -0.3613166809082031, -0.34969329833984375, -0.3380699157714844, -0.326446533203125, -0.3148231506347656, -0.30319976806640625, -0.2915763854980469, -0.2799530029296875, -0.2683296203613281, -0.25670623779296875, -0.24508285522460938, -0.23345947265625, -0.22183609008789062, -0.21021270751953125, -0.19858932495117188, -0.1869659423828125, -0.17534255981445312, -0.16371917724609375, -0.15209579467773438, -0.140472412109375, -0.12884902954101562, -0.11722564697265625, -0.10560226440429688, -0.0939788818359375, -0.08235549926757812, -0.07073211669921875, -0.059108734130859375, -0.0474853515625, -0.035861968994140625, -0.02423858642578125, -0.012615203857421875, -0.0009918212890625, 0.010631561279296875, 0.02225494384765625, 0.033878326416015625, 0.045501708984375, 0.057125091552734375, 0.06874847412109375, 0.08037185668945312, 0.0919952392578125, 0.10361862182617188, 0.11524200439453125, 0.12686538696289062, 0.13848876953125, 0.15011215209960938, 0.16173553466796875, 0.17335891723632812, 0.1849822998046875, 0.19660568237304688, 0.20822906494140625, 0.21985244750976562, 0.231475830078125, 0.24309921264648438, 0.25472259521484375, 0.2663459777832031, 0.2779693603515625, 0.2895927429199219, 0.30121612548828125, 0.3128395080566406, 0.324462890625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 6.0, 7.0, 14.0, 7.0, 12.0, 10.0, 20.0, 17.0, 17.0, 21.0, 19.0, 31.0, 33.0, 35.0, 51.0, 49.0, 49.0, 42.0, 45.0, 64.0, 49.0, 40.0, 48.0, 40.0, 41.0, 28.0, 35.0, 26.0, 15.0, 26.0, 19.0, 12.0, 11.0, 9.0, 5.0, 12.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.1788740158081055, -5.980663776397705, -5.782453536987305, -5.584243297576904, -5.386033058166504, -5.187822341918945, -4.989612102508545, -4.7914018630981445, -4.593191623687744, -4.394981384277344, -4.196771144866943, -3.998560667037964, -3.8003504276275635, -3.602140188217163, -3.4039297103881836, -3.205719470977783, -3.007509231567383, -2.8092989921569824, -2.611088752746582, -2.4128782749176025, -2.214668035507202, -2.0164577960968018, -1.8182474374771118, -1.6200370788574219, -1.4218268394470215, -1.223616600036621, -1.0254062414169312, -0.827195942401886, -0.6289856433868408, -0.43077534437179565, -0.2325650453567505, -0.03435468673706055, 0.16385602951049805, 0.3620663285255432, 0.5602766275405884, 0.7584869265556335, 0.9566972255706787, 1.154907464981079, 1.353117823600769, 1.551328182220459, 1.7495384216308594, 1.9477486610412598, 2.14595890045166, 2.3441693782806396, 2.54237961769104, 2.7405898571014404, 2.93880033493042, 3.1370105743408203, 3.3352208137512207, 3.533431053161621, 3.7316412925720215, 3.929851770401001, 4.1280622482299805, 4.326272487640381, 4.524482727050781, 4.722692966461182, 4.920903205871582, 5.119113445281982, 5.317323684692383, 5.515533924102783, 5.713744163513184, 5.911954879760742, 6.110165119171143, 6.308375358581543, 6.506585597991943]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 2.0, 2.0, 5.0, 7.0, 7.0, 10.0, 11.0, 9.0, 13.0, 12.0, 25.0, 20.0, 16.0, 26.0, 20.0, 33.0, 39.0, 24.0, 41.0, 33.0, 34.0, 43.0, 49.0, 32.0, 35.0, 33.0, 40.0, 43.0, 31.0, 39.0, 37.0, 24.0, 19.0, 29.0, 19.0, 12.0, 16.0, 20.0, 20.0, 14.0, 6.0, 5.0, 6.0, 6.0, 8.0, 7.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.49501895904541, -5.3253631591796875, -5.155707359313965, -4.986051559448242, -4.8163957595825195, -4.646739959716797, -4.477084159851074, -4.307428359985352, -4.137772560119629, -3.9681167602539062, -3.7984609603881836, -3.628805160522461, -3.4591493606567383, -3.2894935607910156, -3.119837760925293, -2.9501819610595703, -2.7805263996124268, -2.610870599746704, -2.4412147998809814, -2.271559000015259, -2.101903200149536, -1.9322474002838135, -1.7625917196273804, -1.5929359197616577, -1.423280119895935, -1.2536243200302124, -1.0839685201644897, -0.9143127799034119, -0.7446569800376892, -0.5750011801719666, -0.40534543991088867, -0.23568964004516602, -0.06603384017944336, 0.1036219447851181, 0.27327772974967957, 0.44293349981307983, 0.6125892996788025, 0.7822450995445251, 0.951900839805603, 1.1215566396713257, 1.2912124395370483, 1.460868239402771, 1.6305240392684937, 1.8001797199249268, 1.9698355197906494, 2.139491319656372, 2.3091471195220947, 2.4788029193878174, 2.64845871925354, 2.8181145191192627, 2.9877703189849854, 3.157426118850708, 3.3270819187164307, 3.4967377185821533, 3.666393280029297, 3.8360490798950195, 4.005704879760742, 4.175360679626465, 4.3450164794921875, 4.51467227935791, 4.684328079223633, 4.8539838790893555, 5.023639678955078, 5.193295478820801, 5.362951278686523]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 11.0, 13.0, 17.0, 17.0, 17.0, 28.0, 48.0, 75.0, 101.0, 107.0, 173.0, 244.0, 354.0, 574.0, 970.0, 1703.0, 3037.0, 6050.0, 11943.0, 24772.0, 51234.0, 101745.0, 172881.0, 221340.0, 196346.0, 124878.0, 66087.0, 31814.0, 15256.0, 7555.0, 3900.0, 2089.0, 1159.0, 653.0, 420.0, 266.0, 203.0, 114.0, 107.0, 77.0, 50.0, 33.0, 23.0, 24.0, 13.0, 15.0, 5.0, 7.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.359375, -7.11944580078125, -6.8795166015625, -6.63958740234375, -6.399658203125, -6.15972900390625, -5.9197998046875, -5.67987060546875, -5.43994140625, -5.20001220703125, -4.9600830078125, -4.72015380859375, -4.480224609375, -4.24029541015625, -4.0003662109375, -3.76043701171875, -3.5205078125, -3.28057861328125, -3.0406494140625, -2.80072021484375, -2.560791015625, -2.32086181640625, -2.0809326171875, -1.84100341796875, -1.60107421875, -1.36114501953125, -1.1212158203125, -0.88128662109375, -0.641357421875, -0.40142822265625, -0.1614990234375, 0.07843017578125, 0.318359375, 0.55828857421875, 0.7982177734375, 1.03814697265625, 1.278076171875, 1.51800537109375, 1.7579345703125, 1.99786376953125, 2.23779296875, 2.47772216796875, 2.7176513671875, 2.95758056640625, 3.197509765625, 3.43743896484375, 3.6773681640625, 3.91729736328125, 4.1572265625, 4.39715576171875, 4.6370849609375, 4.87701416015625, 5.116943359375, 5.35687255859375, 5.5968017578125, 5.83673095703125, 6.07666015625, 6.31658935546875, 6.5565185546875, 6.79644775390625, 7.036376953125, 7.27630615234375, 7.5162353515625, 7.75616455078125, 7.99609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 10.0, 7.0, 7.0, 12.0, 15.0, 17.0, 19.0, 16.0, 20.0, 12.0, 17.0, 33.0, 27.0, 26.0, 37.0, 27.0, 40.0, 36.0, 37.0, 44.0, 33.0, 39.0, 46.0, 37.0, 33.0, 44.0, 28.0, 31.0, 28.0, 21.0, 24.0, 22.0, 17.0, 16.0, 15.0, 11.0, 17.0, 14.0, 10.0, 11.0, 5.0, 4.0, 5.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.35546875, -5.1905517578125, -5.025634765625, -4.8607177734375, -4.69580078125, -4.5308837890625, -4.365966796875, -4.2010498046875, -4.0361328125, -3.8712158203125, -3.706298828125, -3.5413818359375, -3.37646484375, -3.2115478515625, -3.046630859375, -2.8817138671875, -2.716796875, -2.5518798828125, -2.386962890625, -2.2220458984375, -2.05712890625, -1.8922119140625, -1.727294921875, -1.5623779296875, -1.3974609375, -1.2325439453125, -1.067626953125, -0.9027099609375, -0.73779296875, -0.5728759765625, -0.407958984375, -0.2430419921875, -0.078125, 0.0867919921875, 0.251708984375, 0.4166259765625, 0.58154296875, 0.7464599609375, 0.911376953125, 1.0762939453125, 1.2412109375, 1.4061279296875, 1.571044921875, 1.7359619140625, 1.90087890625, 2.0657958984375, 2.230712890625, 2.3956298828125, 2.560546875, 2.7254638671875, 2.890380859375, 3.0552978515625, 3.22021484375, 3.3851318359375, 3.550048828125, 3.7149658203125, 3.8798828125, 4.0447998046875, 4.209716796875, 4.3746337890625, 4.53955078125, 4.7044677734375, 4.869384765625, 5.0343017578125, 5.19921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 1.0, 12.0, 15.0, 21.0, 34.0, 26.0, 55.0, 79.0, 109.0, 157.0, 262.0, 382.0, 528.0, 823.0, 1171.0, 1815.0, 2747.0, 4260.0, 6746.0, 11050.0, 17908.0, 29807.0, 48859.0, 78289.0, 115900.0, 149923.0, 160949.0, 139953.0, 102303.0, 66575.0, 41346.0, 25060.0, 15524.0, 9344.0, 5765.0, 3652.0, 2413.0, 1568.0, 1006.0, 684.0, 452.0, 298.0, 213.0, 143.0, 95.0, 58.0, 49.0, 42.0, 25.0, 23.0, 16.0, 11.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-6.72265625, -6.51470947265625, -6.3067626953125, -6.09881591796875, -5.890869140625, -5.68292236328125, -5.4749755859375, -5.26702880859375, -5.05908203125, -4.85113525390625, -4.6431884765625, -4.43524169921875, -4.227294921875, -4.01934814453125, -3.8114013671875, -3.60345458984375, -3.3955078125, -3.18756103515625, -2.9796142578125, -2.77166748046875, -2.563720703125, -2.35577392578125, -2.1478271484375, -1.93988037109375, -1.73193359375, -1.52398681640625, -1.3160400390625, -1.10809326171875, -0.900146484375, -0.69219970703125, -0.4842529296875, -0.27630615234375, -0.068359375, 0.13958740234375, 0.3475341796875, 0.55548095703125, 0.763427734375, 0.97137451171875, 1.1793212890625, 1.38726806640625, 1.59521484375, 1.80316162109375, 2.0111083984375, 2.21905517578125, 2.427001953125, 2.63494873046875, 2.8428955078125, 3.05084228515625, 3.2587890625, 3.46673583984375, 3.6746826171875, 3.88262939453125, 4.090576171875, 4.29852294921875, 4.5064697265625, 4.71441650390625, 4.92236328125, 5.13031005859375, 5.3382568359375, 5.54620361328125, 5.754150390625, 5.96209716796875, 6.1700439453125, 6.37799072265625, 6.5859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 1.0, 6.0, 7.0, 4.0, 15.0, 15.0, 16.0, 22.0, 13.0, 28.0, 17.0, 20.0, 38.0, 26.0, 43.0, 32.0, 42.0, 35.0, 46.0, 39.0, 36.0, 36.0, 45.0, 26.0, 31.0, 29.0, 31.0, 36.0, 42.0, 25.0, 27.0, 22.0, 18.0, 23.0, 15.0, 16.0, 14.0, 12.0, 11.0, 11.0, 3.0, 3.0, 2.0, 3.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.01171875, -3.8857421875, -3.759765625, -3.6337890625, -3.5078125, -3.3818359375, -3.255859375, -3.1298828125, -3.00390625, -2.8779296875, -2.751953125, -2.6259765625, -2.5, -2.3740234375, -2.248046875, -2.1220703125, -1.99609375, -1.8701171875, -1.744140625, -1.6181640625, -1.4921875, -1.3662109375, -1.240234375, -1.1142578125, -0.98828125, -0.8623046875, -0.736328125, -0.6103515625, -0.484375, -0.3583984375, -0.232421875, -0.1064453125, 0.01953125, 0.1455078125, 0.271484375, 0.3974609375, 0.5234375, 0.6494140625, 0.775390625, 0.9013671875, 1.02734375, 1.1533203125, 1.279296875, 1.4052734375, 1.53125, 1.6572265625, 1.783203125, 1.9091796875, 2.03515625, 2.1611328125, 2.287109375, 2.4130859375, 2.5390625, 2.6650390625, 2.791015625, 2.9169921875, 3.04296875, 3.1689453125, 3.294921875, 3.4208984375, 3.546875, 3.6728515625, 3.798828125, 3.9248046875, 4.05078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 17.0, 13.0, 22.0, 28.0, 47.0, 82.0, 74.0, 156.0, 252.0, 360.0, 486.0, 752.0, 1027.0, 1574.0, 2345.0, 3571.0, 5382.0, 8305.0, 13643.0, 22394.0, 38402.0, 68160.0, 119900.0, 193147.0, 213623.0, 148316.0, 85094.0, 48207.0, 27579.0, 16341.0, 10312.0, 6327.0, 4166.0, 2681.0, 1876.0, 1248.0, 857.0, 600.0, 390.0, 244.0, 190.0, 126.0, 79.0, 57.0, 36.0, 22.0, 28.0, 5.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-5.2890625, -5.1343994140625, -4.979736328125, -4.8250732421875, -4.67041015625, -4.5157470703125, -4.361083984375, -4.2064208984375, -4.0517578125, -3.8970947265625, -3.742431640625, -3.5877685546875, -3.43310546875, -3.2784423828125, -3.123779296875, -2.9691162109375, -2.814453125, -2.6597900390625, -2.505126953125, -2.3504638671875, -2.19580078125, -2.0411376953125, -1.886474609375, -1.7318115234375, -1.5771484375, -1.4224853515625, -1.267822265625, -1.1131591796875, -0.95849609375, -0.8038330078125, -0.649169921875, -0.4945068359375, -0.33984375, -0.1851806640625, -0.030517578125, 0.1241455078125, 0.27880859375, 0.4334716796875, 0.588134765625, 0.7427978515625, 0.8974609375, 1.0521240234375, 1.206787109375, 1.3614501953125, 1.51611328125, 1.6707763671875, 1.825439453125, 1.9801025390625, 2.134765625, 2.2894287109375, 2.444091796875, 2.5987548828125, 2.75341796875, 2.9080810546875, 3.062744140625, 3.2174072265625, 3.3720703125, 3.5267333984375, 3.681396484375, 3.8360595703125, 3.99072265625, 4.1453857421875, 4.300048828125, 4.4547119140625, 4.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 11.0, 4.0, 11.0, 16.0, 15.0, 21.0, 33.0, 43.0, 43.0, 67.0, 72.0, 82.0, 81.0, 88.0, 77.0, 64.0, 55.0, 51.0, 32.0, 30.0, 16.0, 19.0, 9.0, 17.0, 16.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000408172607421875, -0.0003902316093444824, -0.00037229061126708984, -0.00035434961318969727, -0.0003364086151123047, -0.0003184676170349121, -0.00030052661895751953, -0.00028258562088012695, -0.0002646446228027344, -0.0002467036247253418, -0.00022876262664794922, -0.00021082162857055664, -0.00019288063049316406, -0.00017493963241577148, -0.0001569986343383789, -0.00013905763626098633, -0.00012111663818359375, -0.00010317564010620117, -8.52346420288086e-05, -6.729364395141602e-05, -4.935264587402344e-05, -3.141164779663086e-05, -1.3470649719238281e-05, 4.470348358154297e-06, 2.2411346435546875e-05, 4.035234451293945e-05, 5.829334259033203e-05, 7.623434066772461e-05, 9.417533874511719e-05, 0.00011211633682250977, 0.00013005733489990234, 0.00014799833297729492, 0.0001659393310546875, 0.00018388032913208008, 0.00020182132720947266, 0.00021976232528686523, 0.0002377033233642578, 0.0002556443214416504, 0.00027358531951904297, 0.00029152631759643555, 0.0003094673156738281, 0.0003274083137512207, 0.0003453493118286133, 0.00036329030990600586, 0.00038123130798339844, 0.000399172306060791, 0.0004171133041381836, 0.00043505430221557617, 0.00045299530029296875, 0.00047093629837036133, 0.0004888772964477539, 0.0005068182945251465, 0.0005247592926025391, 0.0005427002906799316, 0.0005606412887573242, 0.0005785822868347168, 0.0005965232849121094, 0.000614464282989502, 0.0006324052810668945, 0.0006503462791442871, 0.0006682872772216797, 0.0006862282752990723, 0.0007041692733764648, 0.0007221102714538574, 0.00074005126953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 10.0, 5.0, 8.0, 14.0, 24.0, 29.0, 40.0, 68.0, 110.0, 196.0, 302.0, 507.0, 849.0, 1409.0, 2377.0, 4007.0, 7021.0, 12295.0, 22846.0, 44149.0, 90151.0, 177536.0, 257345.0, 204905.0, 108247.0, 53478.0, 27068.0, 14240.0, 8079.0, 4540.0, 2673.0, 1611.0, 954.0, 519.0, 320.0, 218.0, 135.0, 97.0, 50.0, 40.0, 26.0, 25.0, 12.0, 5.0, 10.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.765625, -5.59417724609375, -5.4227294921875, -5.25128173828125, -5.079833984375, -4.90838623046875, -4.7369384765625, -4.56549072265625, -4.39404296875, -4.22259521484375, -4.0511474609375, -3.87969970703125, -3.708251953125, -3.53680419921875, -3.3653564453125, -3.19390869140625, -3.0224609375, -2.85101318359375, -2.6795654296875, -2.50811767578125, -2.336669921875, -2.16522216796875, -1.9937744140625, -1.82232666015625, -1.65087890625, -1.47943115234375, -1.3079833984375, -1.13653564453125, -0.965087890625, -0.79364013671875, -0.6221923828125, -0.45074462890625, -0.279296875, -0.10784912109375, 0.0635986328125, 0.23504638671875, 0.406494140625, 0.57794189453125, 0.7493896484375, 0.92083740234375, 1.09228515625, 1.26373291015625, 1.4351806640625, 1.60662841796875, 1.778076171875, 1.94952392578125, 2.1209716796875, 2.29241943359375, 2.4638671875, 2.63531494140625, 2.8067626953125, 2.97821044921875, 3.149658203125, 3.32110595703125, 3.4925537109375, 3.66400146484375, 3.83544921875, 4.00689697265625, 4.1783447265625, 4.34979248046875, 4.521240234375, 4.69268798828125, 4.8641357421875, 5.03558349609375, 5.20703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 3.0, 8.0, 8.0, 10.0, 10.0, 11.0, 8.0, 21.0, 29.0, 26.0, 42.0, 41.0, 46.0, 48.0, 56.0, 39.0, 48.0, 47.0, 58.0, 61.0, 41.0, 48.0, 29.0, 41.0, 40.0, 33.0, 27.0, 25.0, 17.0, 11.0, 15.0, 15.0, 15.0, 5.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1640625, -1.1204071044921875, -1.076751708984375, -1.0330963134765625, -0.98944091796875, -0.9457855224609375, -0.902130126953125, -0.8584747314453125, -0.8148193359375, -0.7711639404296875, -0.727508544921875, -0.6838531494140625, -0.64019775390625, -0.5965423583984375, -0.552886962890625, -0.5092315673828125, -0.465576171875, -0.4219207763671875, -0.378265380859375, -0.3346099853515625, -0.29095458984375, -0.2472991943359375, -0.203643798828125, -0.1599884033203125, -0.1163330078125, -0.0726776123046875, -0.029022216796875, 0.0146331787109375, 0.05828857421875, 0.1019439697265625, 0.145599365234375, 0.1892547607421875, 0.23291015625, 0.2765655517578125, 0.320220947265625, 0.3638763427734375, 0.40753173828125, 0.4511871337890625, 0.494842529296875, 0.5384979248046875, 0.5821533203125, 0.6258087158203125, 0.669464111328125, 0.7131195068359375, 0.75677490234375, 0.8004302978515625, 0.844085693359375, 0.8877410888671875, 0.931396484375, 0.9750518798828125, 1.018707275390625, 1.0623626708984375, 1.10601806640625, 1.1496734619140625, 1.193328857421875, 1.2369842529296875, 1.2806396484375, 1.3242950439453125, 1.367950439453125, 1.4116058349609375, 1.45526123046875, 1.4989166259765625, 1.542572021484375, 1.5862274169921875, 1.6298828125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 6.0, 4.0, 8.0, 11.0, 10.0, 6.0, 12.0, 15.0, 12.0, 19.0, 21.0, 26.0, 30.0, 31.0, 37.0, 35.0, 51.0, 56.0, 52.0, 45.0, 49.0, 51.0, 41.0, 47.0, 39.0, 47.0, 39.0, 34.0, 24.0, 25.0, 24.0, 21.0, 18.0, 11.0, 10.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.762845039367676, -6.555128574371338, -6.347412109375, -6.139695644378662, -5.931979179382324, -5.724262714385986, -5.516546249389648, -5.3088297843933105, -5.101113319396973, -4.893396854400635, -4.685680389404297, -4.477963924407959, -4.270247459411621, -4.062530994415283, -3.8548145294189453, -3.6470980644226074, -3.4393815994262695, -3.2316651344299316, -3.0239486694335938, -2.816232204437256, -2.608515739440918, -2.40079927444458, -2.193082809448242, -1.9853663444519043, -1.7776498794555664, -1.5699334144592285, -1.3622169494628906, -1.1545004844665527, -0.9467840194702148, -0.739067554473877, -0.5313510894775391, -0.32363462448120117, -0.11591863632202148, 0.0917978286743164, 0.2995142936706543, 0.5072307586669922, 0.7149472236633301, 0.922663688659668, 1.1303801536560059, 1.3380966186523438, 1.5458130836486816, 1.7535295486450195, 1.9612460136413574, 2.1689624786376953, 2.376678943634033, 2.584395408630371, 2.792111873626709, 2.999828338623047, 3.2075448036193848, 3.4152612686157227, 3.6229777336120605, 3.8306941986083984, 4.038410663604736, 4.246127128601074, 4.453843593597412, 4.66156005859375, 4.869276523590088, 5.076992988586426, 5.284709453582764, 5.492425918579102, 5.7001423835754395, 5.907858848571777, 6.115575313568115, 6.323291778564453, 6.531008243560791]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 13.0, 8.0, 15.0, 18.0, 18.0, 25.0, 35.0, 33.0, 41.0, 30.0, 44.0, 46.0, 55.0, 46.0, 47.0, 55.0, 53.0, 49.0, 49.0, 47.0, 51.0, 34.0, 27.0, 34.0, 22.0, 17.0, 16.0, 12.0, 13.0, 4.0, 9.0, 10.0, 2.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.190070629119873, -5.961208343505859, -5.7323455810546875, -5.503483295440674, -5.274620532989502, -5.045758247375488, -4.816895484924316, -4.588033199310303, -4.359170913696289, -4.130308628082275, -3.9014458656311035, -3.67258358001709, -3.443720817565918, -3.2148585319519043, -2.9859960079193115, -2.7571334838867188, -2.528270721435547, -2.299408197402954, -2.0705456733703613, -1.841683268547058, -1.6128207445144653, -1.3839582204818726, -1.1550958156585693, -0.9262332916259766, -0.6973707675933838, -0.4685082733631134, -0.23964577913284302, -0.01078331470489502, 0.21807920932769775, 0.4469417333602905, 0.6758041381835938, 0.9046666622161865, 1.1335296630859375, 1.3623921871185303, 1.591254711151123, 1.8201171159744263, 2.0489797592163086, 2.2778420448303223, 2.506704568862915, 2.735567092895508, 2.9644296169281006, 3.1932921409606934, 3.422154664993286, 3.651017189025879, 3.8798794746398926, 4.1087422370910645, 4.337604522705078, 4.56646728515625, 4.795329570770264, 5.024191856384277, 5.253054618835449, 5.481916904449463, 5.710779666900635, 5.939641952514648, 6.16850471496582, 6.397367000579834, 6.626229286193848, 6.855091571807861, 7.083954334259033, 7.312816619873047, 7.541679382324219, 7.770541667938232, 7.999403953552246, 8.228266716003418, 8.45712947845459]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 13.0, 15.0, 16.0, 19.0, 42.0, 42.0, 72.0, 118.0, 154.0, 221.0, 346.0, 525.0, 738.0, 1148.0, 1786.0, 2605.0, 4403.0, 7064.0, 11919.0, 21586.0, 42280.0, 90910.0, 209858.0, 464884.0, 841769.0, 1008715.0, 757368.0, 396634.0, 175081.0, 76159.0, 34946.0, 17518.0, 9842.0, 5695.0, 3381.0, 2154.0, 1336.0, 912.0, 652.0, 409.0, 321.0, 192.0, 136.0, 85.0, 65.0, 46.0, 29.0, 27.0, 17.0, 12.0, 9.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-6.5625, -6.3533935546875, -6.144287109375, -5.9351806640625, -5.72607421875, -5.5169677734375, -5.307861328125, -5.0987548828125, -4.8896484375, -4.6805419921875, -4.471435546875, -4.2623291015625, -4.05322265625, -3.8441162109375, -3.635009765625, -3.4259033203125, -3.216796875, -3.0076904296875, -2.798583984375, -2.5894775390625, -2.38037109375, -2.1712646484375, -1.962158203125, -1.7530517578125, -1.5439453125, -1.3348388671875, -1.125732421875, -0.9166259765625, -0.70751953125, -0.4984130859375, -0.289306640625, -0.0802001953125, 0.12890625, 0.3380126953125, 0.547119140625, 0.7562255859375, 0.96533203125, 1.1744384765625, 1.383544921875, 1.5926513671875, 1.8017578125, 2.0108642578125, 2.219970703125, 2.4290771484375, 2.63818359375, 2.8472900390625, 3.056396484375, 3.2655029296875, 3.474609375, 3.6837158203125, 3.892822265625, 4.1019287109375, 4.31103515625, 4.5201416015625, 4.729248046875, 4.9383544921875, 5.1474609375, 5.3565673828125, 5.565673828125, 5.7747802734375, 5.98388671875, 6.1929931640625, 6.402099609375, 6.6112060546875, 6.8203125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 14.0, 10.0, 13.0, 12.0, 23.0, 29.0, 20.0, 24.0, 30.0, 40.0, 36.0, 39.0, 48.0, 49.0, 49.0, 52.0, 57.0, 43.0, 52.0, 48.0, 47.0, 37.0, 33.0, 23.0, 23.0, 24.0, 16.0, 22.0, 17.0, 13.0, 10.0, 6.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.05859375, -4.8768310546875, -4.695068359375, -4.5133056640625, -4.33154296875, -4.1497802734375, -3.968017578125, -3.7862548828125, -3.6044921875, -3.4227294921875, -3.240966796875, -3.0592041015625, -2.87744140625, -2.6956787109375, -2.513916015625, -2.3321533203125, -2.150390625, -1.9686279296875, -1.786865234375, -1.6051025390625, -1.42333984375, -1.2415771484375, -1.059814453125, -0.8780517578125, -0.6962890625, -0.5145263671875, -0.332763671875, -0.1510009765625, 0.03076171875, 0.2125244140625, 0.394287109375, 0.5760498046875, 0.7578125, 0.9395751953125, 1.121337890625, 1.3031005859375, 1.48486328125, 1.6666259765625, 1.848388671875, 2.0301513671875, 2.2119140625, 2.3936767578125, 2.575439453125, 2.7572021484375, 2.93896484375, 3.1207275390625, 3.302490234375, 3.4842529296875, 3.666015625, 3.8477783203125, 4.029541015625, 4.2113037109375, 4.39306640625, 4.5748291015625, 4.756591796875, 4.9383544921875, 5.1201171875, 5.3018798828125, 5.483642578125, 5.6654052734375, 5.84716796875, 6.0289306640625, 6.210693359375, 6.3924560546875, 6.57421875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 6.0, 4.0, 5.0, 8.0, 6.0, 5.0, 14.0, 20.0, 23.0, 32.0, 46.0, 68.0, 103.0, 134.0, 167.0, 283.0, 363.0, 539.0, 743.0, 1123.0, 1697.0, 2683.0, 4102.0, 6792.0, 11610.0, 20909.0, 40479.0, 85450.0, 196305.0, 454913.0, 905353.0, 1111081.0, 730856.0, 336138.0, 144003.0, 64636.0, 31544.0, 16579.0, 9332.0, 5693.0, 3512.0, 2275.0, 1459.0, 963.0, 691.0, 442.0, 341.0, 223.0, 141.0, 97.0, 91.0, 70.0, 40.0, 35.0, 13.0, 14.0, 14.0, 8.0, 9.0, 7.0, 6.0, 1.0, 4.0], "bins": [-9.1640625, -8.8804931640625, -8.596923828125, -8.3133544921875, -8.02978515625, -7.7462158203125, -7.462646484375, -7.1790771484375, -6.8955078125, -6.6119384765625, -6.328369140625, -6.0447998046875, -5.76123046875, -5.4776611328125, -5.194091796875, -4.9105224609375, -4.626953125, -4.3433837890625, -4.059814453125, -3.7762451171875, -3.49267578125, -3.2091064453125, -2.925537109375, -2.6419677734375, -2.3583984375, -2.0748291015625, -1.791259765625, -1.5076904296875, -1.22412109375, -0.9405517578125, -0.656982421875, -0.3734130859375, -0.08984375, 0.1937255859375, 0.477294921875, 0.7608642578125, 1.04443359375, 1.3280029296875, 1.611572265625, 1.8951416015625, 2.1787109375, 2.4622802734375, 2.745849609375, 3.0294189453125, 3.31298828125, 3.5965576171875, 3.880126953125, 4.1636962890625, 4.447265625, 4.7308349609375, 5.014404296875, 5.2979736328125, 5.58154296875, 5.8651123046875, 6.148681640625, 6.4322509765625, 6.7158203125, 6.9993896484375, 7.282958984375, 7.5665283203125, 7.85009765625, 8.1336669921875, 8.417236328125, 8.7008056640625, 8.984375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 6.0, 8.0, 16.0, 13.0, 16.0, 19.0, 25.0, 31.0, 57.0, 41.0, 71.0, 82.0, 102.0, 136.0, 160.0, 175.0, 230.0, 240.0, 263.0, 304.0, 290.0, 281.0, 261.0, 246.0, 196.0, 156.0, 151.0, 106.0, 90.0, 68.0, 53.0, 32.0, 33.0, 25.0, 15.0, 15.0, 14.0, 10.0, 8.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.80859375, -2.72119140625, -2.6337890625, -2.54638671875, -2.458984375, -2.37158203125, -2.2841796875, -2.19677734375, -2.109375, -2.02197265625, -1.9345703125, -1.84716796875, -1.759765625, -1.67236328125, -1.5849609375, -1.49755859375, -1.41015625, -1.32275390625, -1.2353515625, -1.14794921875, -1.060546875, -0.97314453125, -0.8857421875, -0.79833984375, -0.7109375, -0.62353515625, -0.5361328125, -0.44873046875, -0.361328125, -0.27392578125, -0.1865234375, -0.09912109375, -0.01171875, 0.07568359375, 0.1630859375, 0.25048828125, 0.337890625, 0.42529296875, 0.5126953125, 0.60009765625, 0.6875, 0.77490234375, 0.8623046875, 0.94970703125, 1.037109375, 1.12451171875, 1.2119140625, 1.29931640625, 1.38671875, 1.47412109375, 1.5615234375, 1.64892578125, 1.736328125, 1.82373046875, 1.9111328125, 1.99853515625, 2.0859375, 2.17333984375, 2.2607421875, 2.34814453125, 2.435546875, 2.52294921875, 2.6103515625, 2.69775390625, 2.78515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 3.0, 5.0, 8.0, 13.0, 6.0, 16.0, 14.0, 12.0, 16.0, 27.0, 29.0, 38.0, 41.0, 45.0, 50.0, 52.0, 67.0, 59.0, 55.0, 54.0, 50.0, 47.0, 47.0, 33.0, 28.0, 32.0, 18.0, 25.0, 18.0, 16.0, 16.0, 10.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.590851783752441, -6.369492530822754, -6.148133754730225, -5.926774501800537, -5.705415725708008, -5.48405647277832, -5.262697219848633, -5.041337966918945, -4.819979190826416, -4.5986199378967285, -4.377261161804199, -4.155901908874512, -3.9345428943634033, -3.713183879852295, -3.4918246269226074, -3.270465612411499, -3.0491065979003906, -2.8277475833892822, -2.606388568878174, -2.3850293159484863, -2.163670301437378, -1.9423112869262695, -1.7209521532058716, -1.4995930194854736, -1.2782340049743652, -1.0568749904632568, -0.8355158567428589, -0.6141567826271057, -0.39279770851135254, -0.17143869400024414, 0.04992043972015381, 0.27127957344055176, 0.49263858795166016, 0.7139976620674133, 0.9353567361831665, 1.1567158699035645, 1.3780748844146729, 1.5994338989257812, 1.8207930326461792, 2.042152166366577, 2.2635111808776855, 2.484870195388794, 2.7062292098999023, 2.92758846282959, 3.1489474773406982, 3.3703064918518066, 3.591665744781494, 3.8130247592926025, 4.034383773803711, 4.255743026733398, 4.477101802825928, 4.698461055755615, 4.9198198318481445, 5.141179084777832, 5.3625383377075195, 5.583897590637207, 5.805256366729736, 6.026615619659424, 6.247974395751953, 6.469333648681641, 6.690692901611328, 6.912051677703857, 7.133410930633545, 7.354769706726074, 7.576128959655762]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 13.0, 8.0, 5.0, 19.0, 13.0, 14.0, 12.0, 23.0, 21.0, 25.0, 35.0, 41.0, 20.0, 31.0, 49.0, 45.0, 46.0, 51.0, 47.0, 42.0, 40.0, 40.0, 39.0, 36.0, 36.0, 32.0, 30.0, 25.0, 25.0, 34.0, 21.0, 16.0, 14.0, 15.0, 7.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5407490730285645, -5.3404693603515625, -5.140190124511719, -4.939910411834717, -4.739630699157715, -4.539351463317871, -4.339071750640869, -4.138792037963867, -3.9385128021240234, -3.7382333278656006, -3.5379538536071777, -3.337674140930176, -3.137394666671753, -2.93711519241333, -2.736835479736328, -2.5365560054779053, -2.3362765312194824, -2.1359970569610596, -1.9357174634933472, -1.7354378700256348, -1.535158395767212, -1.334878921508789, -1.1345993280410767, -0.9343197345733643, -0.7340402603149414, -0.5337607264518738, -0.33348119258880615, -0.13320165872573853, 0.0670778751373291, 0.26735734939575195, 0.46763694286346436, 0.6679165363311768, 0.8681964874267578, 1.0684759616851807, 1.268755555152893, 1.4690351486206055, 1.6693146228790283, 1.8695940971374512, 2.069873809814453, 2.270153284072876, 2.470432758331299, 2.6707122325897217, 2.8709917068481445, 3.0712714195251465, 3.2715508937835693, 3.471830368041992, 3.672110080718994, 3.872389554977417, 4.07266902923584, 4.272948741912842, 4.4732279777526855, 4.6735076904296875, 4.873786926269531, 5.074066638946533, 5.274346351623535, 5.474625587463379, 5.674905300140381, 5.875185012817383, 6.075464248657227, 6.2757439613342285, 6.4760236740112305, 6.676302909851074, 6.876582622528076, 7.076862335205078, 7.277141571044922]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 9.0, 9.0, 12.0, 20.0, 34.0, 44.0, 70.0, 92.0, 127.0, 185.0, 246.0, 426.0, 532.0, 744.0, 1126.0, 1672.0, 2476.0, 3706.0, 5787.0, 8957.0, 14203.0, 22353.0, 35694.0, 56830.0, 86981.0, 124645.0, 155083.0, 155010.0, 125714.0, 88309.0, 57507.0, 36098.0, 22761.0, 14278.0, 9143.0, 5930.0, 3819.0, 2613.0, 1686.0, 1079.0, 756.0, 537.0, 381.0, 277.0, 172.0, 129.0, 93.0, 74.0, 43.0, 32.0, 19.0, 18.0, 7.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.19140625, -3.0885009765625, -2.985595703125, -2.8826904296875, -2.77978515625, -2.6768798828125, -2.573974609375, -2.4710693359375, -2.3681640625, -2.2652587890625, -2.162353515625, -2.0594482421875, -1.95654296875, -1.8536376953125, -1.750732421875, -1.6478271484375, -1.544921875, -1.4420166015625, -1.339111328125, -1.2362060546875, -1.13330078125, -1.0303955078125, -0.927490234375, -0.8245849609375, -0.7216796875, -0.6187744140625, -0.515869140625, -0.4129638671875, -0.31005859375, -0.2071533203125, -0.104248046875, -0.0013427734375, 0.1015625, 0.2044677734375, 0.307373046875, 0.4102783203125, 0.51318359375, 0.6160888671875, 0.718994140625, 0.8218994140625, 0.9248046875, 1.0277099609375, 1.130615234375, 1.2335205078125, 1.33642578125, 1.4393310546875, 1.542236328125, 1.6451416015625, 1.748046875, 1.8509521484375, 1.953857421875, 2.0567626953125, 2.15966796875, 2.2625732421875, 2.365478515625, 2.4683837890625, 2.5712890625, 2.6741943359375, 2.777099609375, 2.8800048828125, 2.98291015625, 3.0858154296875, 3.188720703125, 3.2916259765625, 3.39453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 12.0, 8.0, 7.0, 9.0, 16.0, 16.0, 17.0, 16.0, 20.0, 22.0, 29.0, 30.0, 35.0, 40.0, 44.0, 40.0, 50.0, 42.0, 50.0, 38.0, 45.0, 49.0, 38.0, 40.0, 36.0, 25.0, 25.0, 28.0, 25.0, 26.0, 25.0, 22.0, 12.0, 14.0, 14.0, 7.0, 6.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.625, -5.4173583984375, -5.209716796875, -5.0020751953125, -4.79443359375, -4.5867919921875, -4.379150390625, -4.1715087890625, -3.9638671875, -3.7562255859375, -3.548583984375, -3.3409423828125, -3.13330078125, -2.9256591796875, -2.718017578125, -2.5103759765625, -2.302734375, -2.0950927734375, -1.887451171875, -1.6798095703125, -1.47216796875, -1.2645263671875, -1.056884765625, -0.8492431640625, -0.6416015625, -0.4339599609375, -0.226318359375, -0.0186767578125, 0.18896484375, 0.3966064453125, 0.604248046875, 0.8118896484375, 1.01953125, 1.2271728515625, 1.434814453125, 1.6424560546875, 1.85009765625, 2.0577392578125, 2.265380859375, 2.4730224609375, 2.6806640625, 2.8883056640625, 3.095947265625, 3.3035888671875, 3.51123046875, 3.7188720703125, 3.926513671875, 4.1341552734375, 4.341796875, 4.5494384765625, 4.757080078125, 4.9647216796875, 5.17236328125, 5.3800048828125, 5.587646484375, 5.7952880859375, 6.0029296875, 6.2105712890625, 6.418212890625, 6.6258544921875, 6.83349609375, 7.0411376953125, 7.248779296875, 7.4564208984375, 7.6640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 9.0, 13.0, 13.0, 22.0, 40.0, 45.0, 83.0, 113.0, 176.0, 282.0, 424.0, 693.0, 1211.0, 1932.0, 3147.0, 5017.0, 8169.0, 13060.0, 21762.0, 48400.0, 615877.0, 248951.0, 32015.0, 18095.0, 10885.0, 6891.0, 4297.0, 2617.0, 1630.0, 990.0, 622.0, 395.0, 240.0, 150.0, 83.0, 58.0, 48.0, 24.0, 19.0, 9.0, 12.0, 9.0, 7.0, 6.0, 9.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.37109375, -6.18267822265625, -5.9942626953125, -5.80584716796875, -5.617431640625, -5.42901611328125, -5.2406005859375, -5.05218505859375, -4.86376953125, -4.67535400390625, -4.4869384765625, -4.29852294921875, -4.110107421875, -3.92169189453125, -3.7332763671875, -3.54486083984375, -3.3564453125, -3.16802978515625, -2.9796142578125, -2.79119873046875, -2.602783203125, -2.41436767578125, -2.2259521484375, -2.03753662109375, -1.84912109375, -1.66070556640625, -1.4722900390625, -1.28387451171875, -1.095458984375, -0.90704345703125, -0.7186279296875, -0.53021240234375, -0.341796875, -0.15338134765625, 0.0350341796875, 0.22344970703125, 0.411865234375, 0.60028076171875, 0.7886962890625, 0.97711181640625, 1.16552734375, 1.35394287109375, 1.5423583984375, 1.73077392578125, 1.919189453125, 2.10760498046875, 2.2960205078125, 2.48443603515625, 2.6728515625, 2.86126708984375, 3.0496826171875, 3.23809814453125, 3.426513671875, 3.61492919921875, 3.8033447265625, 3.99176025390625, 4.18017578125, 4.36859130859375, 4.5570068359375, 4.74542236328125, 4.933837890625, 5.12225341796875, 5.3106689453125, 5.49908447265625, 5.6875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 3.0, 8.0, 8.0, 10.0, 10.0, 14.0, 20.0, 20.0, 24.0, 21.0, 25.0, 34.0, 27.0, 41.0, 38.0, 38.0, 41.0, 54.0, 45.0, 41.0, 40.0, 44.0, 35.0, 43.0, 41.0, 42.0, 37.0, 29.0, 30.0, 19.0, 27.0, 21.0, 12.0, 8.0, 5.0, 11.0, 10.0, 10.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59765625, -5.4208984375, -5.244140625, -5.0673828125, -4.890625, -4.7138671875, -4.537109375, -4.3603515625, -4.18359375, -4.0068359375, -3.830078125, -3.6533203125, -3.4765625, -3.2998046875, -3.123046875, -2.9462890625, -2.76953125, -2.5927734375, -2.416015625, -2.2392578125, -2.0625, -1.8857421875, -1.708984375, -1.5322265625, -1.35546875, -1.1787109375, -1.001953125, -0.8251953125, -0.6484375, -0.4716796875, -0.294921875, -0.1181640625, 0.05859375, 0.2353515625, 0.412109375, 0.5888671875, 0.765625, 0.9423828125, 1.119140625, 1.2958984375, 1.47265625, 1.6494140625, 1.826171875, 2.0029296875, 2.1796875, 2.3564453125, 2.533203125, 2.7099609375, 2.88671875, 3.0634765625, 3.240234375, 3.4169921875, 3.59375, 3.7705078125, 3.947265625, 4.1240234375, 4.30078125, 4.4775390625, 4.654296875, 4.8310546875, 5.0078125, 5.1845703125, 5.361328125, 5.5380859375, 5.71484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 10.0, 7.0, 15.0, 21.0, 33.0, 45.0, 69.0, 92.0, 143.0, 293.0, 517.0, 1164.0, 3159.0, 11420.0, 68035.0, 915040.0, 36540.0, 7617.0, 2373.0, 914.0, 441.0, 206.0, 127.0, 77.0, 64.0, 33.0, 33.0, 16.0, 17.0, 11.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.966796875, -2.87786865234375, -2.7889404296875, -2.70001220703125, -2.611083984375, -2.52215576171875, -2.4332275390625, -2.34429931640625, -2.25537109375, -2.16644287109375, -2.0775146484375, -1.98858642578125, -1.899658203125, -1.81072998046875, -1.7218017578125, -1.63287353515625, -1.5439453125, -1.45501708984375, -1.3660888671875, -1.27716064453125, -1.188232421875, -1.09930419921875, -1.0103759765625, -0.92144775390625, -0.83251953125, -0.74359130859375, -0.6546630859375, -0.56573486328125, -0.476806640625, -0.38787841796875, -0.2989501953125, -0.21002197265625, -0.12109375, -0.03216552734375, 0.0567626953125, 0.14569091796875, 0.234619140625, 0.32354736328125, 0.4124755859375, 0.50140380859375, 0.59033203125, 0.67926025390625, 0.7681884765625, 0.85711669921875, 0.946044921875, 1.03497314453125, 1.1239013671875, 1.21282958984375, 1.3017578125, 1.39068603515625, 1.4796142578125, 1.56854248046875, 1.657470703125, 1.74639892578125, 1.8353271484375, 1.92425537109375, 2.01318359375, 2.10211181640625, 2.1910400390625, 2.27996826171875, 2.368896484375, 2.45782470703125, 2.5467529296875, 2.63568115234375, 2.724609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 14.0, 12.0, 17.0, 24.0, 28.0, 48.0, 51.0, 61.0, 72.0, 97.0, 113.0, 100.0, 72.0, 57.0, 57.0, 38.0, 38.0, 19.0, 12.0, 11.0, 11.0, 5.0, 7.0, 5.0, 6.0, 6.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003802776336669922, -0.0003689117729663849, -0.0003575459122657776, -0.0003461800515651703, -0.000334814190864563, -0.0003234483301639557, -0.0003120824694633484, -0.0003007166087627411, -0.0002893507480621338, -0.0002779848873615265, -0.0002666190266609192, -0.0002552531659603119, -0.0002438873052597046, -0.0002325214445590973, -0.00022115558385849, -0.0002097897231578827, -0.0001984238624572754, -0.0001870580017566681, -0.0001756921410560608, -0.0001643262803554535, -0.0001529604196548462, -0.0001415945589542389, -0.0001302286982536316, -0.00011886283755302429, -0.00010749697685241699, -9.613111615180969e-05, -8.476525545120239e-05, -7.339939475059509e-05, -6.203353404998779e-05, -5.066767334938049e-05, -3.930181264877319e-05, -2.7935951948165894e-05, -1.6570091247558594e-05, -5.204230546951294e-06, 6.161630153656006e-06, 1.7527490854263306e-05, 2.8893351554870605e-05, 4.0259212255477905e-05, 5.1625072956085205e-05, 6.29909336566925e-05, 7.43567943572998e-05, 8.57226550579071e-05, 9.70885157585144e-05, 0.0001084543764591217, 0.000119820237159729, 0.0001311860978603363, 0.0001425519585609436, 0.0001539178192615509, 0.0001652836799621582, 0.0001766495406627655, 0.0001880154013633728, 0.0001993812620639801, 0.0002107471227645874, 0.0002221129834651947, 0.000233478844165802, 0.0002448447048664093, 0.0002562105655670166, 0.0002675764262676239, 0.0002789422869682312, 0.0002903081476688385, 0.0003016740083694458, 0.0003130398690700531, 0.0003244057297706604, 0.0003357715904712677, 0.000347137451171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 16.0, 8.0, 25.0, 39.0, 44.0, 55.0, 79.0, 98.0, 163.0, 183.0, 231.0, 312.0, 445.0, 647.0, 899.0, 1319.0, 2155.0, 4082.0, 9570.0, 26512.0, 94748.0, 371052.0, 386852.0, 99497.0, 28344.0, 9922.0, 4251.0, 2276.0, 1389.0, 876.0, 633.0, 445.0, 390.0, 268.0, 185.0, 135.0, 108.0, 73.0, 59.0, 39.0, 28.0, 26.0, 15.0, 14.0, 7.0, 7.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4541015625, -1.4072265625, -1.3603515625, -1.3134765625, -1.2666015625, -1.2197265625, -1.1728515625, -1.1259765625, -1.0791015625, -1.0322265625, -0.9853515625, -0.9384765625, -0.8916015625, -0.8447265625, -0.7978515625, -0.7509765625, -0.7041015625, -0.6572265625, -0.6103515625, -0.5634765625, -0.5166015625, -0.4697265625, -0.4228515625, -0.3759765625, -0.3291015625, -0.2822265625, -0.2353515625, -0.1884765625, -0.1416015625, -0.0947265625, -0.0478515625, -0.0009765625, 0.0458984375, 0.0927734375, 0.1396484375, 0.1865234375, 0.2333984375, 0.2802734375, 0.3271484375, 0.3740234375, 0.4208984375, 0.4677734375, 0.5146484375, 0.5615234375, 0.6083984375, 0.6552734375, 0.7021484375, 0.7490234375, 0.7958984375, 0.8427734375, 0.8896484375, 0.9365234375, 0.9833984375, 1.0302734375, 1.0771484375, 1.1240234375, 1.1708984375, 1.2177734375, 1.2646484375, 1.3115234375, 1.3583984375, 1.4052734375, 1.4521484375, 1.4990234375, 1.5458984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 8.0, 14.0, 10.0, 16.0, 18.0, 41.0, 40.0, 65.0, 110.0, 136.0, 124.0, 104.0, 91.0, 65.0, 45.0, 21.0, 26.0, 22.0, 17.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.435302734375, -0.42144775390625, -0.4075927734375, -0.39373779296875, -0.3798828125, -0.36602783203125, -0.3521728515625, -0.33831787109375, -0.324462890625, -0.31060791015625, -0.2967529296875, -0.28289794921875, -0.26904296875, -0.25518798828125, -0.2413330078125, -0.22747802734375, -0.213623046875, -0.19976806640625, -0.1859130859375, -0.17205810546875, -0.158203125, -0.14434814453125, -0.1304931640625, -0.11663818359375, -0.102783203125, -0.08892822265625, -0.0750732421875, -0.06121826171875, -0.04736328125, -0.03350830078125, -0.0196533203125, -0.00579833984375, 0.008056640625, 0.02191162109375, 0.0357666015625, 0.04962158203125, 0.0634765625, 0.07733154296875, 0.0911865234375, 0.10504150390625, 0.118896484375, 0.13275146484375, 0.1466064453125, 0.16046142578125, 0.17431640625, 0.18817138671875, 0.2020263671875, 0.21588134765625, 0.229736328125, 0.24359130859375, 0.2574462890625, 0.27130126953125, 0.28515625, 0.29901123046875, 0.3128662109375, 0.32672119140625, 0.340576171875, 0.35443115234375, 0.3682861328125, 0.38214111328125, 0.39599609375, 0.40985107421875, 0.4237060546875, 0.43756103515625, 0.451416015625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 5.0, 3.0, 6.0, 6.0, 9.0, 12.0, 9.0, 17.0, 23.0, 23.0, 35.0, 35.0, 50.0, 58.0, 53.0, 57.0, 59.0, 59.0, 50.0, 61.0, 56.0, 45.0, 38.0, 37.0, 24.0, 29.0, 23.0, 22.0, 20.0, 10.0, 16.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.445980072021484, -6.2141242027282715, -5.9822678565979, -5.7504119873046875, -5.518555641174316, -5.2866997718811035, -5.054843902587891, -4.8229875564575195, -4.591131210327148, -4.3592753410339355, -4.1274189949035645, -3.8955631256103516, -3.6637067794799805, -3.4318509101867676, -3.1999948024749756, -2.9681386947631836, -2.7362828254699707, -2.5044267177581787, -2.2725706100463867, -2.040714740753174, -1.8088585138320923, -1.5770024061203003, -1.3451464176177979, -1.1132903099060059, -0.8814342021942139, -0.6495780944824219, -0.41772204637527466, -0.18586599826812744, 0.04599010944366455, 0.27784621715545654, 0.509702205657959, 0.741558313369751, 0.973414421081543, 1.205270528793335, 1.437126636505127, 1.6689826250076294, 1.9008387327194214, 2.132694721221924, 2.364550828933716, 2.596406936645508, 2.8282630443573, 3.060119152069092, 3.291975259780884, 3.523831367492676, 3.7556872367858887, 3.9875435829162598, 4.219399452209473, 4.451255798339844, 4.683111667633057, 4.9149675369262695, 5.146823883056641, 5.3786797523498535, 5.610536098480225, 5.8423919677734375, 6.074248313903809, 6.3061041831970215, 6.537960052490234, 6.769815921783447, 7.001672267913818, 7.233528137207031, 7.465384483337402, 7.697240352630615, 7.929096221923828, 8.1609525680542, 8.39280891418457]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 10.0, 9.0, 11.0, 9.0, 14.0, 19.0, 10.0, 15.0, 21.0, 24.0, 28.0, 38.0, 37.0, 19.0, 42.0, 57.0, 38.0, 44.0, 54.0, 42.0, 33.0, 43.0, 46.0, 29.0, 33.0, 31.0, 39.0, 22.0, 27.0, 33.0, 27.0, 22.0, 14.0, 15.0, 8.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6666951179504395, -5.465402126312256, -5.2641096115112305, -5.062816619873047, -4.861523628234863, -4.660231113433838, -4.458938121795654, -4.257645606994629, -4.056352615356445, -3.855059862136841, -3.6537671089172363, -3.4524741172790527, -3.2511813640594482, -3.0498886108398438, -2.84859561920166, -2.6473028659820557, -2.446010112762451, -2.2447173595428467, -2.043424606323242, -1.8421316146850586, -1.640838861465454, -1.4395461082458496, -1.2382532358169556, -1.0369603633880615, -0.835667610168457, -0.6343747973442078, -0.4330819845199585, -0.23178917169570923, -0.03049635887145996, 0.17079639434814453, 0.3720892667770386, 0.5733821392059326, 0.7746748924255371, 0.9759677052497864, 1.1772605180740356, 1.3785533905029297, 1.5798461437225342, 1.7811388969421387, 1.9824317693710327, 2.1837246417999268, 2.3850173950195312, 2.5863101482391357, 2.7876029014587402, 2.988895893096924, 3.1901886463165283, 3.391481399536133, 3.5927743911743164, 3.794067144393921, 3.9953598976135254, 4.196652889251709, 4.397945404052734, 4.599238395690918, 4.800531387329102, 5.001823902130127, 5.2031168937683105, 5.404409408569336, 5.6057024002075195, 5.806995391845703, 6.0082879066467285, 6.209580898284912, 6.4108734130859375, 6.612166404724121, 6.813459396362305, 7.014752388000488, 7.216044902801514]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 12.0, 28.0, 29.0, 43.0, 84.0, 123.0, 141.0, 222.0, 316.0, 481.0, 695.0, 1019.0, 1569.0, 2318.0, 3644.0, 5748.0, 8919.0, 14663.0, 23498.0, 38313.0, 61542.0, 93075.0, 129482.0, 153977.0, 150121.0, 122948.0, 86363.0, 56404.0, 34719.0, 21203.0, 13453.0, 8001.0, 5285.0, 3444.0, 2285.0, 1397.0, 984.0, 687.0, 448.0, 267.0, 188.0, 137.0, 100.0, 47.0, 35.0, 33.0, 23.0, 13.0, 8.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7109375, -5.53192138671875, -5.3529052734375, -5.17388916015625, -4.994873046875, -4.81585693359375, -4.6368408203125, -4.45782470703125, -4.27880859375, -4.09979248046875, -3.9207763671875, -3.74176025390625, -3.562744140625, -3.38372802734375, -3.2047119140625, -3.02569580078125, -2.8466796875, -2.66766357421875, -2.4886474609375, -2.30963134765625, -2.130615234375, -1.95159912109375, -1.7725830078125, -1.59356689453125, -1.41455078125, -1.23553466796875, -1.0565185546875, -0.87750244140625, -0.698486328125, -0.51947021484375, -0.3404541015625, -0.16143798828125, 0.017578125, 0.19659423828125, 0.3756103515625, 0.55462646484375, 0.733642578125, 0.91265869140625, 1.0916748046875, 1.27069091796875, 1.44970703125, 1.62872314453125, 1.8077392578125, 1.98675537109375, 2.165771484375, 2.34478759765625, 2.5238037109375, 2.70281982421875, 2.8818359375, 3.06085205078125, 3.2398681640625, 3.41888427734375, 3.597900390625, 3.77691650390625, 3.9559326171875, 4.13494873046875, 4.31396484375, 4.49298095703125, 4.6719970703125, 4.85101318359375, 5.030029296875, 5.20904541015625, 5.3880615234375, 5.56707763671875, 5.74609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 8.0, 4.0, 13.0, 5.0, 16.0, 12.0, 17.0, 20.0, 15.0, 24.0, 23.0, 29.0, 31.0, 37.0, 38.0, 53.0, 48.0, 44.0, 51.0, 32.0, 43.0, 40.0, 41.0, 39.0, 40.0, 40.0, 32.0, 27.0, 31.0, 15.0, 31.0, 16.0, 22.0, 12.0, 12.0, 12.0, 9.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30859375, -5.1065673828125, -4.904541015625, -4.7025146484375, -4.50048828125, -4.2984619140625, -4.096435546875, -3.8944091796875, -3.6923828125, -3.4903564453125, -3.288330078125, -3.0863037109375, -2.88427734375, -2.6822509765625, -2.480224609375, -2.2781982421875, -2.076171875, -1.8741455078125, -1.672119140625, -1.4700927734375, -1.26806640625, -1.0660400390625, -0.864013671875, -0.6619873046875, -0.4599609375, -0.2579345703125, -0.055908203125, 0.1461181640625, 0.34814453125, 0.5501708984375, 0.752197265625, 0.9542236328125, 1.15625, 1.3582763671875, 1.560302734375, 1.7623291015625, 1.96435546875, 2.1663818359375, 2.368408203125, 2.5704345703125, 2.7724609375, 2.9744873046875, 3.176513671875, 3.3785400390625, 3.58056640625, 3.7825927734375, 3.984619140625, 4.1866455078125, 4.388671875, 4.5906982421875, 4.792724609375, 4.9947509765625, 5.19677734375, 5.3988037109375, 5.600830078125, 5.8028564453125, 6.0048828125, 6.2069091796875, 6.408935546875, 6.6109619140625, 6.81298828125, 7.0150146484375, 7.217041015625, 7.4190673828125, 7.62109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 4.0, 18.0, 20.0, 21.0, 27.0, 47.0, 50.0, 94.0, 132.0, 208.0, 281.0, 445.0, 625.0, 1036.0, 1771.0, 2715.0, 4312.0, 7339.0, 12062.0, 20255.0, 34929.0, 58594.0, 95409.0, 138550.0, 169449.0, 164118.0, 126873.0, 83308.0, 51044.0, 29847.0, 17913.0, 10416.0, 6268.0, 3670.0, 2397.0, 1516.0, 931.0, 629.0, 432.0, 241.0, 161.0, 117.0, 90.0, 56.0, 38.0, 27.0, 26.0, 12.0, 11.0, 5.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-7.609375, -7.37054443359375, -7.1317138671875, -6.89288330078125, -6.654052734375, -6.41522216796875, -6.1763916015625, -5.93756103515625, -5.69873046875, -5.45989990234375, -5.2210693359375, -4.98223876953125, -4.743408203125, -4.50457763671875, -4.2657470703125, -4.02691650390625, -3.7880859375, -3.54925537109375, -3.3104248046875, -3.07159423828125, -2.832763671875, -2.59393310546875, -2.3551025390625, -2.11627197265625, -1.87744140625, -1.63861083984375, -1.3997802734375, -1.16094970703125, -0.922119140625, -0.68328857421875, -0.4444580078125, -0.20562744140625, 0.033203125, 0.27203369140625, 0.5108642578125, 0.74969482421875, 0.988525390625, 1.22735595703125, 1.4661865234375, 1.70501708984375, 1.94384765625, 2.18267822265625, 2.4215087890625, 2.66033935546875, 2.899169921875, 3.13800048828125, 3.3768310546875, 3.61566162109375, 3.8544921875, 4.09332275390625, 4.3321533203125, 4.57098388671875, 4.809814453125, 5.04864501953125, 5.2874755859375, 5.52630615234375, 5.76513671875, 6.00396728515625, 6.2427978515625, 6.48162841796875, 6.720458984375, 6.95928955078125, 7.1981201171875, 7.43695068359375, 7.67578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 1.0, 3.0, 7.0, 9.0, 9.0, 8.0, 15.0, 14.0, 11.0, 12.0, 18.0, 22.0, 35.0, 28.0, 27.0, 38.0, 38.0, 41.0, 43.0, 40.0, 41.0, 30.0, 56.0, 49.0, 31.0, 29.0, 31.0, 36.0, 32.0, 43.0, 34.0, 24.0, 17.0, 27.0, 20.0, 12.0, 18.0, 9.0, 12.0, 7.0, 8.0, 9.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.61328125, -3.49334716796875, -3.3734130859375, -3.25347900390625, -3.133544921875, -3.01361083984375, -2.8936767578125, -2.77374267578125, -2.65380859375, -2.53387451171875, -2.4139404296875, -2.29400634765625, -2.174072265625, -2.05413818359375, -1.9342041015625, -1.81427001953125, -1.6943359375, -1.57440185546875, -1.4544677734375, -1.33453369140625, -1.214599609375, -1.09466552734375, -0.9747314453125, -0.85479736328125, -0.73486328125, -0.61492919921875, -0.4949951171875, -0.37506103515625, -0.255126953125, -0.13519287109375, -0.0152587890625, 0.10467529296875, 0.224609375, 0.34454345703125, 0.4644775390625, 0.58441162109375, 0.704345703125, 0.82427978515625, 0.9442138671875, 1.06414794921875, 1.18408203125, 1.30401611328125, 1.4239501953125, 1.54388427734375, 1.663818359375, 1.78375244140625, 1.9036865234375, 2.02362060546875, 2.1435546875, 2.26348876953125, 2.3834228515625, 2.50335693359375, 2.623291015625, 2.74322509765625, 2.8631591796875, 2.98309326171875, 3.10302734375, 3.22296142578125, 3.3428955078125, 3.46282958984375, 3.582763671875, 3.70269775390625, 3.8226318359375, 3.94256591796875, 4.0625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 9.0, 14.0, 24.0, 21.0, 32.0, 51.0, 74.0, 88.0, 135.0, 251.0, 352.0, 497.0, 773.0, 1271.0, 2075.0, 3683.0, 6791.0, 12323.0, 24090.0, 49525.0, 107237.0, 218567.0, 281425.0, 176492.0, 81820.0, 38479.0, 18998.0, 9972.0, 5436.0, 3087.0, 1767.0, 1115.0, 687.0, 461.0, 304.0, 196.0, 117.0, 98.0, 67.0, 48.0, 27.0, 22.0, 17.0, 8.0, 7.0, 3.0, 7.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.28125, -6.07415771484375, -5.8670654296875, -5.65997314453125, -5.452880859375, -5.24578857421875, -5.0386962890625, -4.83160400390625, -4.62451171875, -4.41741943359375, -4.2103271484375, -4.00323486328125, -3.796142578125, -3.58905029296875, -3.3819580078125, -3.17486572265625, -2.9677734375, -2.76068115234375, -2.5535888671875, -2.34649658203125, -2.139404296875, -1.93231201171875, -1.7252197265625, -1.51812744140625, -1.31103515625, -1.10394287109375, -0.8968505859375, -0.68975830078125, -0.482666015625, -0.27557373046875, -0.0684814453125, 0.13861083984375, 0.345703125, 0.55279541015625, 0.7598876953125, 0.96697998046875, 1.174072265625, 1.38116455078125, 1.5882568359375, 1.79534912109375, 2.00244140625, 2.20953369140625, 2.4166259765625, 2.62371826171875, 2.830810546875, 3.03790283203125, 3.2449951171875, 3.45208740234375, 3.6591796875, 3.86627197265625, 4.0733642578125, 4.28045654296875, 4.487548828125, 4.69464111328125, 4.9017333984375, 5.10882568359375, 5.31591796875, 5.52301025390625, 5.7301025390625, 5.93719482421875, 6.144287109375, 6.35137939453125, 6.5584716796875, 6.76556396484375, 6.97265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 5.0, 9.0, 6.0, 13.0, 15.0, 14.0, 11.0, 24.0, 46.0, 67.0, 94.0, 107.0, 147.0, 116.0, 96.0, 65.0, 52.0, 34.0, 22.0, 10.0, 17.0, 5.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001071929931640625, -0.0010449737310409546, -0.0010180175304412842, -0.0009910613298416138, -0.0009641051292419434, -0.000937148928642273, -0.0009101927280426025, -0.0008832365274429321, -0.0008562803268432617, -0.0008293241262435913, -0.0008023679256439209, -0.0007754117250442505, -0.0007484555244445801, -0.0007214993238449097, -0.0006945431232452393, -0.0006675869226455688, -0.0006406307220458984, -0.000613674521446228, -0.0005867183208465576, -0.0005597621202468872, -0.0005328059196472168, -0.0005058497190475464, -0.000478893518447876, -0.00045193731784820557, -0.00042498111724853516, -0.00039802491664886475, -0.00037106871604919434, -0.0003441125154495239, -0.0003171563148498535, -0.0002902001142501831, -0.0002632439136505127, -0.00023628771305084229, -0.00020933151245117188, -0.00018237531185150146, -0.00015541911125183105, -0.00012846291065216064, -0.00010150671005249023, -7.455050945281982e-05, -4.7594308853149414e-05, -2.0638108253479004e-05, 6.318092346191406e-06, 3.3274292945861816e-05, 6.0230493545532227e-05, 8.718669414520264e-05, 0.00011414289474487305, 0.00014109909534454346, 0.00016805529594421387, 0.00019501149654388428, 0.0002219676971435547, 0.0002489238977432251, 0.0002758800983428955, 0.0003028362989425659, 0.00032979249954223633, 0.00035674870014190674, 0.00038370490074157715, 0.00041066110134124756, 0.00043761730194091797, 0.0004645735025405884, 0.0004915297031402588, 0.0005184859037399292, 0.0005454421043395996, 0.00057239830493927, 0.0005993545055389404, 0.0006263107061386108, 0.0006532669067382812]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 8.0, 8.0, 19.0, 21.0, 27.0, 43.0, 57.0, 80.0, 87.0, 148.0, 218.0, 281.0, 410.0, 543.0, 834.0, 1144.0, 1679.0, 2533.0, 3857.0, 5740.0, 9394.0, 14644.0, 24873.0, 42019.0, 72818.0, 122718.0, 179900.0, 193119.0, 146314.0, 91012.0, 52755.0, 30531.0, 18266.0, 11292.0, 7007.0, 4523.0, 3064.0, 1965.0, 1400.0, 948.0, 646.0, 481.0, 288.0, 240.0, 190.0, 103.0, 97.0, 64.0, 45.0, 32.0, 23.0, 21.0, 9.0, 16.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.140625, -4.0079345703125, -3.875244140625, -3.7425537109375, -3.60986328125, -3.4771728515625, -3.344482421875, -3.2117919921875, -3.0791015625, -2.9464111328125, -2.813720703125, -2.6810302734375, -2.54833984375, -2.4156494140625, -2.282958984375, -2.1502685546875, -2.017578125, -1.8848876953125, -1.752197265625, -1.6195068359375, -1.48681640625, -1.3541259765625, -1.221435546875, -1.0887451171875, -0.9560546875, -0.8233642578125, -0.690673828125, -0.5579833984375, -0.42529296875, -0.2926025390625, -0.159912109375, -0.0272216796875, 0.10546875, 0.2381591796875, 0.370849609375, 0.5035400390625, 0.63623046875, 0.7689208984375, 0.901611328125, 1.0343017578125, 1.1669921875, 1.2996826171875, 1.432373046875, 1.5650634765625, 1.69775390625, 1.8304443359375, 1.963134765625, 2.0958251953125, 2.228515625, 2.3612060546875, 2.493896484375, 2.6265869140625, 2.75927734375, 2.8919677734375, 3.024658203125, 3.1573486328125, 3.2900390625, 3.4227294921875, 3.555419921875, 3.6881103515625, 3.82080078125, 3.9534912109375, 4.086181640625, 4.2188720703125, 4.3515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 4.0, 6.0, 10.0, 4.0, 2.0, 10.0, 13.0, 7.0, 16.0, 23.0, 26.0, 23.0, 27.0, 30.0, 34.0, 44.0, 50.0, 48.0, 58.0, 49.0, 62.0, 46.0, 52.0, 50.0, 43.0, 39.0, 41.0, 27.0, 22.0, 23.0, 18.0, 14.0, 16.0, 8.0, 13.0, 11.0, 12.0, 4.0, 2.0, 5.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.48828125, -1.4454803466796875, -1.402679443359375, -1.3598785400390625, -1.31707763671875, -1.2742767333984375, -1.231475830078125, -1.1886749267578125, -1.1458740234375, -1.1030731201171875, -1.060272216796875, -1.0174713134765625, -0.97467041015625, -0.9318695068359375, -0.889068603515625, -0.8462677001953125, -0.803466796875, -0.7606658935546875, -0.717864990234375, -0.6750640869140625, -0.63226318359375, -0.5894622802734375, -0.546661376953125, -0.5038604736328125, -0.4610595703125, -0.4182586669921875, -0.375457763671875, -0.3326568603515625, -0.28985595703125, -0.2470550537109375, -0.204254150390625, -0.1614532470703125, -0.11865234375, -0.0758514404296875, -0.033050537109375, 0.0097503662109375, 0.05255126953125, 0.0953521728515625, 0.138153076171875, 0.1809539794921875, 0.2237548828125, 0.2665557861328125, 0.309356689453125, 0.3521575927734375, 0.39495849609375, 0.4377593994140625, 0.480560302734375, 0.5233612060546875, 0.566162109375, 0.6089630126953125, 0.651763916015625, 0.6945648193359375, 0.73736572265625, 0.7801666259765625, 0.822967529296875, 0.8657684326171875, 0.9085693359375, 0.9513702392578125, 0.994171142578125, 1.0369720458984375, 1.07977294921875, 1.1225738525390625, 1.165374755859375, 1.2081756591796875, 1.2509765625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 5.0, 2.0, 5.0, 6.0, 9.0, 15.0, 16.0, 21.0, 25.0, 21.0, 29.0, 28.0, 45.0, 44.0, 45.0, 60.0, 59.0, 55.0, 49.0, 53.0, 54.0, 52.0, 44.0, 43.0, 40.0, 27.0, 25.0, 17.0, 19.0, 18.0, 11.0, 15.0, 5.0, 7.0, 6.0, 3.0, 6.0, 0.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.961334228515625, -6.730799674987793, -6.500265121459961, -6.269730567932129, -6.039196014404297, -5.808661460876465, -5.578126430511475, -5.347591876983643, -5.1170573234558105, -4.8865227699279785, -4.6559882164001465, -4.4254536628723145, -4.194918632507324, -3.9643843173980713, -3.73384952545166, -3.503314971923828, -3.272780418395996, -3.042245864868164, -2.811711311340332, -2.581176519393921, -2.350641965866089, -2.120107412338257, -1.8895727396011353, -1.6590380668640137, -1.4285035133361816, -1.1979689598083496, -0.967434287071228, -0.7368996739387512, -0.5063650608062744, -0.2758305072784424, -0.0452958345413208, 0.18523883819580078, 0.415773868560791, 0.6463084816932678, 0.8768430948257446, 1.1073777675628662, 1.3379123210906982, 1.5684468746185303, 1.7989815473556519, 2.0295162200927734, 2.2600507736206055, 2.4905853271484375, 2.7211198806762695, 2.9516546726226807, 3.1821892261505127, 3.4127237796783447, 3.643258571624756, 3.873793125152588, 4.10432767868042, 4.334862232208252, 4.565396785736084, 4.795931339263916, 5.026466369628906, 5.257000923156738, 5.48753547668457, 5.718070030212402, 5.948604583740234, 6.179139137268066, 6.409673690795898, 6.6402082443237305, 6.8707427978515625, 7.1012773513793945, 7.331812381744385, 7.562346935272217, 7.792881488800049]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 4.0, 6.0, 9.0, 12.0, 14.0, 9.0, 17.0, 14.0, 21.0, 15.0, 21.0, 35.0, 34.0, 43.0, 29.0, 39.0, 39.0, 42.0, 49.0, 44.0, 53.0, 48.0, 38.0, 37.0, 36.0, 37.0, 31.0, 27.0, 37.0, 27.0, 24.0, 24.0, 11.0, 8.0, 19.0, 11.0, 11.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.650705814361572, -5.448733806610107, -5.246762275695801, -5.044790267944336, -4.842818737030029, -4.6408467292785645, -4.438875198364258, -4.236903190612793, -4.034931182861328, -3.8329594135284424, -3.6309876441955566, -3.429015636444092, -3.227044105529785, -3.0250720977783203, -2.8231003284454346, -2.621128559112549, -2.419157028198242, -2.2171852588653564, -2.0152134895324707, -1.8132416009902954, -1.6112698316574097, -1.409298062324524, -1.2073261737823486, -1.005354404449463, -0.8033826351165771, -0.6014108657836914, -0.3994390368461609, -0.19746720790863037, 0.004504561424255371, 0.2064763307571411, 0.4084482192993164, 0.6104199886322021, 0.8123917579650879, 1.0143635272979736, 1.2163352966308594, 1.4183071851730347, 1.6202789545059204, 1.8222507238388062, 2.0242226123809814, 2.226194381713867, 2.428166151046753, 2.6301379203796387, 2.8321096897125244, 3.03408145904541, 3.236053466796875, 3.4380249977111816, 3.6399970054626465, 3.8419687747955322, 4.043940544128418, 4.245912551879883, 4.4478840827941895, 4.649856090545654, 4.851827621459961, 5.053799629211426, 5.255771636962891, 5.457743167877197, 5.659714698791504, 5.861686706542969, 6.063658237457275, 6.26563024520874, 6.467601776123047, 6.669573783874512, 6.871545791625977, 7.073517322540283, 7.275489330291748]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 14.0, 13.0, 18.0, 25.0, 39.0, 60.0, 93.0, 125.0, 202.0, 308.0, 486.0, 775.0, 1298.0, 2332.0, 4108.0, 7706.0, 15882.0, 37204.0, 104362.0, 333065.0, 913717.0, 1370104.0, 898913.0, 330232.0, 103680.0, 37146.0, 15565.0, 7480.0, 3935.0, 2117.0, 1229.0, 727.0, 437.0, 278.0, 200.0, 124.0, 95.0, 57.0, 45.0, 26.0, 23.0, 11.0, 8.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.9765625, -8.6915283203125, -8.406494140625, -8.1214599609375, -7.83642578125, -7.5513916015625, -7.266357421875, -6.9813232421875, -6.6962890625, -6.4112548828125, -6.126220703125, -5.8411865234375, -5.55615234375, -5.2711181640625, -4.986083984375, -4.7010498046875, -4.416015625, -4.1309814453125, -3.845947265625, -3.5609130859375, -3.27587890625, -2.9908447265625, -2.705810546875, -2.4207763671875, -2.1357421875, -1.8507080078125, -1.565673828125, -1.2806396484375, -0.99560546875, -0.7105712890625, -0.425537109375, -0.1405029296875, 0.14453125, 0.4295654296875, 0.714599609375, 0.9996337890625, 1.28466796875, 1.5697021484375, 1.854736328125, 2.1397705078125, 2.4248046875, 2.7098388671875, 2.994873046875, 3.2799072265625, 3.56494140625, 3.8499755859375, 4.135009765625, 4.4200439453125, 4.705078125, 4.9901123046875, 5.275146484375, 5.5601806640625, 5.84521484375, 6.1302490234375, 6.415283203125, 6.7003173828125, 6.9853515625, 7.2703857421875, 7.555419921875, 7.8404541015625, 8.12548828125, 8.4105224609375, 8.695556640625, 8.9805908203125, 9.265625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 8.0, 11.0, 8.0, 14.0, 8.0, 25.0, 24.0, 22.0, 26.0, 27.0, 37.0, 35.0, 43.0, 38.0, 44.0, 43.0, 45.0, 54.0, 57.0, 44.0, 33.0, 27.0, 47.0, 29.0, 37.0, 28.0, 27.0, 31.0, 17.0, 14.0, 18.0, 14.0, 13.0, 13.0, 6.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.16339111328125, -4.9869384765625, -4.81048583984375, -4.634033203125, -4.45758056640625, -4.2811279296875, -4.10467529296875, -3.92822265625, -3.75177001953125, -3.5753173828125, -3.39886474609375, -3.222412109375, -3.04595947265625, -2.8695068359375, -2.69305419921875, -2.5166015625, -2.34014892578125, -2.1636962890625, -1.98724365234375, -1.810791015625, -1.63433837890625, -1.4578857421875, -1.28143310546875, -1.10498046875, -0.92852783203125, -0.7520751953125, -0.57562255859375, -0.399169921875, -0.22271728515625, -0.0462646484375, 0.13018798828125, 0.306640625, 0.48309326171875, 0.6595458984375, 0.83599853515625, 1.012451171875, 1.18890380859375, 1.3653564453125, 1.54180908203125, 1.71826171875, 1.89471435546875, 2.0711669921875, 2.24761962890625, 2.424072265625, 2.60052490234375, 2.7769775390625, 2.95343017578125, 3.1298828125, 3.30633544921875, 3.4827880859375, 3.65924072265625, 3.835693359375, 4.01214599609375, 4.1885986328125, 4.36505126953125, 4.54150390625, 4.71795654296875, 4.8944091796875, 5.07086181640625, 5.247314453125, 5.42376708984375, 5.6002197265625, 5.77667236328125, 5.953125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 11.0, 28.0, 26.0, 38.0, 50.0, 87.0, 122.0, 183.0, 258.0, 368.0, 517.0, 756.0, 1157.0, 1619.0, 2452.0, 3666.0, 5905.0, 9696.0, 16807.0, 30525.0, 59615.0, 128105.0, 290652.0, 639353.0, 1070509.0, 971944.0, 517649.0, 228917.0, 101585.0, 48409.0, 25386.0, 14066.0, 8440.0, 5209.0, 3329.0, 2118.0, 1430.0, 964.0, 720.0, 466.0, 316.0, 227.0, 176.0, 124.0, 75.0, 80.0, 37.0, 35.0, 21.0, 19.0, 14.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0], "bins": [-8.6171875, -8.3466796875, -8.076171875, -7.8056640625, -7.53515625, -7.2646484375, -6.994140625, -6.7236328125, -6.453125, -6.1826171875, -5.912109375, -5.6416015625, -5.37109375, -5.1005859375, -4.830078125, -4.5595703125, -4.2890625, -4.0185546875, -3.748046875, -3.4775390625, -3.20703125, -2.9365234375, -2.666015625, -2.3955078125, -2.125, -1.8544921875, -1.583984375, -1.3134765625, -1.04296875, -0.7724609375, -0.501953125, -0.2314453125, 0.0390625, 0.3095703125, 0.580078125, 0.8505859375, 1.12109375, 1.3916015625, 1.662109375, 1.9326171875, 2.203125, 2.4736328125, 2.744140625, 3.0146484375, 3.28515625, 3.5556640625, 3.826171875, 4.0966796875, 4.3671875, 4.6376953125, 4.908203125, 5.1787109375, 5.44921875, 5.7197265625, 5.990234375, 6.2607421875, 6.53125, 6.8017578125, 7.072265625, 7.3427734375, 7.61328125, 7.8837890625, 8.154296875, 8.4248046875, 8.6953125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 5.0, 6.0, 8.0, 13.0, 21.0, 27.0, 42.0, 45.0, 50.0, 55.0, 88.0, 115.0, 151.0, 177.0, 193.0, 226.0, 251.0, 251.0, 298.0, 294.0, 264.0, 247.0, 224.0, 195.0, 166.0, 138.0, 97.0, 64.0, 72.0, 55.0, 52.0, 31.0, 32.0, 13.0, 16.0, 9.0, 11.0, 12.0, 17.0, 8.0, 6.0, 2.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.3359375, -2.2552490234375, -2.174560546875, -2.0938720703125, -2.01318359375, -1.9324951171875, -1.851806640625, -1.7711181640625, -1.6904296875, -1.6097412109375, -1.529052734375, -1.4483642578125, -1.36767578125, -1.2869873046875, -1.206298828125, -1.1256103515625, -1.044921875, -0.9642333984375, -0.883544921875, -0.8028564453125, -0.72216796875, -0.6414794921875, -0.560791015625, -0.4801025390625, -0.3994140625, -0.3187255859375, -0.238037109375, -0.1573486328125, -0.07666015625, 0.0040283203125, 0.084716796875, 0.1654052734375, 0.24609375, 0.3267822265625, 0.407470703125, 0.4881591796875, 0.56884765625, 0.6495361328125, 0.730224609375, 0.8109130859375, 0.8916015625, 0.9722900390625, 1.052978515625, 1.1336669921875, 1.21435546875, 1.2950439453125, 1.375732421875, 1.4564208984375, 1.537109375, 1.6177978515625, 1.698486328125, 1.7791748046875, 1.85986328125, 1.9405517578125, 2.021240234375, 2.1019287109375, 2.1826171875, 2.2633056640625, 2.343994140625, 2.4246826171875, 2.50537109375, 2.5860595703125, 2.666748046875, 2.7474365234375, 2.828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 9.0, 7.0, 4.0, 12.0, 14.0, 11.0, 28.0, 28.0, 31.0, 30.0, 35.0, 36.0, 48.0, 56.0, 57.0, 63.0, 75.0, 66.0, 53.0, 64.0, 37.0, 43.0, 38.0, 34.0, 21.0, 27.0, 20.0, 14.0, 12.0, 3.0, 3.0, 4.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.880133152008057, -6.627935409545898, -6.375738143920898, -6.12354040145874, -5.87134313583374, -5.619145393371582, -5.366948127746582, -5.114750385284424, -4.862552642822266, -4.610354900360107, -4.358157634735107, -4.105959892272949, -3.853762626647949, -3.601564884185791, -3.349367380142212, -3.097169876098633, -2.844972610473633, -2.5927751064300537, -2.3405776023864746, -2.0883798599243164, -1.8361824750900269, -1.5839849710464478, -1.331787347793579, -1.07958984375, -0.8273923397064209, -0.5751948356628418, -0.3229972720146179, -0.07079970836639404, 0.18139779567718506, 0.43359529972076416, 0.6857929229736328, 0.9379904270172119, 1.1901874542236328, 1.442384958267212, 1.694582462310791, 1.9467800855636597, 2.198977470397949, 2.4511752128601074, 2.7033727169036865, 2.9555702209472656, 3.2077677249908447, 3.459965229034424, 3.712162733078003, 3.964360237121582, 4.21655797958374, 4.46875524520874, 4.720952987670898, 4.973150253295898, 5.225347995758057, 5.477545738220215, 5.729743003845215, 5.981940746307373, 6.234138011932373, 6.486335754394531, 6.738533020019531, 6.9907307624816895, 7.242928504943848, 7.495126247406006, 7.747323513031006, 7.999521255493164, 8.251718521118164, 8.503915786743164, 8.75611400604248, 9.00831127166748, 9.26050853729248]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 2.0, 7.0, 9.0, 10.0, 10.0, 16.0, 13.0, 18.0, 25.0, 24.0, 28.0, 33.0, 39.0, 36.0, 43.0, 36.0, 38.0, 36.0, 40.0, 37.0, 46.0, 41.0, 38.0, 34.0, 47.0, 36.0, 27.0, 33.0, 24.0, 26.0, 21.0, 18.0, 21.0, 17.0, 17.0, 11.0, 9.0, 11.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.999600410461426, -4.817230701446533, -4.634861469268799, -4.452491760253906, -4.270122528076172, -4.087752819061279, -3.905383586883545, -3.7230138778686523, -3.540644645690918, -3.3582751750946045, -3.175905704498291, -2.9935362339019775, -2.811166763305664, -2.6287972927093506, -2.446427822113037, -2.2640581130981445, -2.081688642501831, -1.8993191719055176, -1.716949701309204, -1.5345802307128906, -1.3522107601165771, -1.1698412895202637, -0.9874716997146606, -0.8051022291183472, -0.6227327585220337, -0.4403632879257202, -0.25799378752708435, -0.07562428712844849, 0.10674518346786499, 0.28911465406417847, 0.4714841842651367, 0.6538536548614502, 0.8362231254577637, 1.0185925960540771, 1.2009620666503906, 1.383331537246704, 1.5657010078430176, 1.748070478439331, 1.930440068244934, 2.112809658050537, 2.2951788902282715, 2.477548360824585, 2.6599178314208984, 2.842287302017212, 3.0246567726135254, 3.207026243209839, 3.3893957138061523, 3.571765422821045, 3.7541348934173584, 3.936504364013672, 4.1188740730285645, 4.301243305206299, 4.483613014221191, 4.665982246398926, 4.848351955413818, 5.030721187591553, 5.213090896606445, 5.395460605621338, 5.577829837799072, 5.760199546813965, 5.942568778991699, 6.124938488006592, 6.307307720184326, 6.489677429199219, 6.672046661376953]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 12.0, 12.0, 20.0, 30.0, 45.0, 47.0, 85.0, 113.0, 192.0, 323.0, 442.0, 704.0, 1189.0, 2072.0, 3225.0, 5707.0, 10080.0, 18336.0, 33077.0, 59378.0, 104630.0, 162563.0, 199830.0, 175542.0, 116689.0, 68014.0, 37879.0, 20748.0, 11481.0, 6576.0, 3711.0, 2122.0, 1363.0, 868.0, 507.0, 319.0, 216.0, 134.0, 90.0, 70.0, 40.0, 26.0, 25.0, 9.0, 10.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.29296875, -2.21282958984375, -2.1326904296875, -2.05255126953125, -1.972412109375, -1.89227294921875, -1.8121337890625, -1.73199462890625, -1.65185546875, -1.57171630859375, -1.4915771484375, -1.41143798828125, -1.331298828125, -1.25115966796875, -1.1710205078125, -1.09088134765625, -1.0107421875, -0.93060302734375, -0.8504638671875, -0.77032470703125, -0.690185546875, -0.61004638671875, -0.5299072265625, -0.44976806640625, -0.36962890625, -0.28948974609375, -0.2093505859375, -0.12921142578125, -0.049072265625, 0.03106689453125, 0.1112060546875, 0.19134521484375, 0.271484375, 0.35162353515625, 0.4317626953125, 0.51190185546875, 0.592041015625, 0.67218017578125, 0.7523193359375, 0.83245849609375, 0.91259765625, 0.99273681640625, 1.0728759765625, 1.15301513671875, 1.233154296875, 1.31329345703125, 1.3934326171875, 1.47357177734375, 1.5537109375, 1.63385009765625, 1.7139892578125, 1.79412841796875, 1.874267578125, 1.95440673828125, 2.0345458984375, 2.11468505859375, 2.19482421875, 2.27496337890625, 2.3551025390625, 2.43524169921875, 2.515380859375, 2.59552001953125, 2.6756591796875, 2.75579833984375, 2.8359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 4.0, 15.0, 10.0, 10.0, 14.0, 18.0, 30.0, 28.0, 31.0, 33.0, 34.0, 43.0, 40.0, 47.0, 52.0, 46.0, 49.0, 41.0, 45.0, 40.0, 53.0, 33.0, 35.0, 37.0, 34.0, 32.0, 20.0, 31.0, 14.0, 14.0, 11.0, 7.0, 12.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.453125, -6.236083984375, -6.01904296875, -5.802001953125, -5.5849609375, -5.367919921875, -5.15087890625, -4.933837890625, -4.716796875, -4.499755859375, -4.28271484375, -4.065673828125, -3.8486328125, -3.631591796875, -3.41455078125, -3.197509765625, -2.98046875, -2.763427734375, -2.54638671875, -2.329345703125, -2.1123046875, -1.895263671875, -1.67822265625, -1.461181640625, -1.244140625, -1.027099609375, -0.81005859375, -0.593017578125, -0.3759765625, -0.158935546875, 0.05810546875, 0.275146484375, 0.4921875, 0.709228515625, 0.92626953125, 1.143310546875, 1.3603515625, 1.577392578125, 1.79443359375, 2.011474609375, 2.228515625, 2.445556640625, 2.66259765625, 2.879638671875, 3.0966796875, 3.313720703125, 3.53076171875, 3.747802734375, 3.96484375, 4.181884765625, 4.39892578125, 4.615966796875, 4.8330078125, 5.050048828125, 5.26708984375, 5.484130859375, 5.701171875, 5.918212890625, 6.13525390625, 6.352294921875, 6.5693359375, 6.786376953125, 7.00341796875, 7.220458984375, 7.4375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 4.0, 5.0, 4.0, 6.0, 6.0, 14.0, 18.0, 19.0, 41.0, 66.0, 63.0, 78.0, 106.0, 198.0, 265.0, 354.0, 470.0, 721.0, 1046.0, 1561.0, 2275.0, 3323.0, 5260.0, 7900.0, 12435.0, 20642.0, 45787.0, 574523.0, 287475.0, 33780.0, 17882.0, 10963.0, 7142.0, 4580.0, 2948.0, 2020.0, 1370.0, 921.0, 710.0, 481.0, 322.0, 218.0, 146.0, 104.0, 78.0, 66.0, 50.0, 25.0, 19.0, 21.0, 9.0, 15.0, 7.0, 8.0, 1.0, 3.0, 5.0, 4.0, 0.0, 2.0], "bins": [-4.71484375, -4.56689453125, -4.4189453125, -4.27099609375, -4.123046875, -3.97509765625, -3.8271484375, -3.67919921875, -3.53125, -3.38330078125, -3.2353515625, -3.08740234375, -2.939453125, -2.79150390625, -2.6435546875, -2.49560546875, -2.34765625, -2.19970703125, -2.0517578125, -1.90380859375, -1.755859375, -1.60791015625, -1.4599609375, -1.31201171875, -1.1640625, -1.01611328125, -0.8681640625, -0.72021484375, -0.572265625, -0.42431640625, -0.2763671875, -0.12841796875, 0.01953125, 0.16748046875, 0.3154296875, 0.46337890625, 0.611328125, 0.75927734375, 0.9072265625, 1.05517578125, 1.203125, 1.35107421875, 1.4990234375, 1.64697265625, 1.794921875, 1.94287109375, 2.0908203125, 2.23876953125, 2.38671875, 2.53466796875, 2.6826171875, 2.83056640625, 2.978515625, 3.12646484375, 3.2744140625, 3.42236328125, 3.5703125, 3.71826171875, 3.8662109375, 4.01416015625, 4.162109375, 4.31005859375, 4.4580078125, 4.60595703125, 4.75390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 2.0, 4.0, 7.0, 11.0, 4.0, 5.0, 14.0, 14.0, 20.0, 18.0, 14.0, 26.0, 14.0, 34.0, 23.0, 33.0, 14.0, 27.0, 34.0, 25.0, 22.0, 32.0, 43.0, 39.0, 31.0, 39.0, 46.0, 32.0, 47.0, 33.0, 30.0, 32.0, 30.0, 30.0, 18.0, 20.0, 21.0, 17.0, 25.0, 11.0, 7.0, 14.0, 9.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 5.0, 4.0, 1.0, 1.0], "bins": [-4.49609375, -4.3619384765625, -4.227783203125, -4.0936279296875, -3.95947265625, -3.8253173828125, -3.691162109375, -3.5570068359375, -3.4228515625, -3.2886962890625, -3.154541015625, -3.0203857421875, -2.88623046875, -2.7520751953125, -2.617919921875, -2.4837646484375, -2.349609375, -2.2154541015625, -2.081298828125, -1.9471435546875, -1.81298828125, -1.6788330078125, -1.544677734375, -1.4105224609375, -1.2763671875, -1.1422119140625, -1.008056640625, -0.8739013671875, -0.73974609375, -0.6055908203125, -0.471435546875, -0.3372802734375, -0.203125, -0.0689697265625, 0.065185546875, 0.1993408203125, 0.33349609375, 0.4676513671875, 0.601806640625, 0.7359619140625, 0.8701171875, 1.0042724609375, 1.138427734375, 1.2725830078125, 1.40673828125, 1.5408935546875, 1.675048828125, 1.8092041015625, 1.943359375, 2.0775146484375, 2.211669921875, 2.3458251953125, 2.47998046875, 2.6141357421875, 2.748291015625, 2.8824462890625, 3.0166015625, 3.1507568359375, 3.284912109375, 3.4190673828125, 3.55322265625, 3.6873779296875, 3.821533203125, 3.9556884765625, 4.08984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 9.0, 10.0, 14.0, 11.0, 21.0, 45.0, 70.0, 97.0, 149.0, 198.0, 302.0, 501.0, 787.0, 1348.0, 2554.0, 4802.0, 11061.0, 32448.0, 644103.0, 303311.0, 26753.0, 9662.0, 4471.0, 2228.0, 1309.0, 784.0, 489.0, 306.0, 236.0, 138.0, 89.0, 67.0, 51.0, 33.0, 26.0, 17.0, 17.0, 10.0, 4.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.306640625, -1.2643890380859375, -1.222137451171875, -1.1798858642578125, -1.13763427734375, -1.0953826904296875, -1.053131103515625, -1.0108795166015625, -0.9686279296875, -0.9263763427734375, -0.884124755859375, -0.8418731689453125, -0.79962158203125, -0.7573699951171875, -0.715118408203125, -0.6728668212890625, -0.630615234375, -0.5883636474609375, -0.546112060546875, -0.5038604736328125, -0.46160888671875, -0.4193572998046875, -0.377105712890625, -0.3348541259765625, -0.2926025390625, -0.2503509521484375, -0.208099365234375, -0.1658477783203125, -0.12359619140625, -0.0813446044921875, -0.039093017578125, 0.0031585693359375, 0.04541015625, 0.0876617431640625, 0.129913330078125, 0.1721649169921875, 0.21441650390625, 0.2566680908203125, 0.298919677734375, 0.3411712646484375, 0.3834228515625, 0.4256744384765625, 0.467926025390625, 0.5101776123046875, 0.55242919921875, 0.5946807861328125, 0.636932373046875, 0.6791839599609375, 0.721435546875, 0.7636871337890625, 0.805938720703125, 0.8481903076171875, 0.89044189453125, 0.9326934814453125, 0.974945068359375, 1.0171966552734375, 1.0594482421875, 1.1016998291015625, 1.143951416015625, 1.1862030029296875, 1.22845458984375, 1.2707061767578125, 1.312957763671875, 1.3552093505859375, 1.3974609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 2.0, 6.0, 3.0, 9.0, 12.0, 22.0, 52.0, 113.0, 173.0, 250.0, 171.0, 80.0, 39.0, 25.0, 13.0, 10.0, 5.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003180503845214844, -0.00030604004859924316, -0.00029402971267700195, -0.00028201937675476074, -0.00027000904083251953, -0.0002579987049102783, -0.0002459883689880371, -0.0002339780330657959, -0.0002219676971435547, -0.00020995736122131348, -0.00019794702529907227, -0.00018593668937683105, -0.00017392635345458984, -0.00016191601753234863, -0.00014990568161010742, -0.0001378953456878662, -0.000125885009765625, -0.00011387467384338379, -0.00010186433792114258, -8.985400199890137e-05, -7.784366607666016e-05, -6.583333015441895e-05, -5.3822994232177734e-05, -4.1812658309936523e-05, -2.9802322387695312e-05, -1.77919864654541e-05, -5.781650543212891e-06, 6.22868537902832e-06, 1.823902130126953e-05, 3.0249357223510742e-05, 4.225969314575195e-05, 5.4270029067993164e-05, 6.628036499023438e-05, 7.829070091247559e-05, 9.03010368347168e-05, 0.00010231137275695801, 0.00011432170867919922, 0.00012633204460144043, 0.00013834238052368164, 0.00015035271644592285, 0.00016236305236816406, 0.00017437338829040527, 0.00018638372421264648, 0.0001983940601348877, 0.0002104043960571289, 0.00022241473197937012, 0.00023442506790161133, 0.00024643540382385254, 0.00025844573974609375, 0.00027045607566833496, 0.00028246641159057617, 0.0002944767475128174, 0.0003064870834350586, 0.0003184974193572998, 0.000330507755279541, 0.0003425180912017822, 0.00035452842712402344, 0.00036653876304626465, 0.00037854909896850586, 0.00039055943489074707, 0.0004025697708129883, 0.0004145801067352295, 0.0004265904426574707, 0.0004386007785797119, 0.0004506111145019531]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 9.0, 6.0, 6.0, 14.0, 19.0, 17.0, 30.0, 52.0, 73.0, 107.0, 153.0, 237.0, 340.0, 487.0, 789.0, 1198.0, 1919.0, 2961.0, 4803.0, 8474.0, 15367.0, 30622.0, 67370.0, 163079.0, 310181.0, 242177.0, 104460.0, 44542.0, 21194.0, 11213.0, 6368.0, 3714.0, 2230.0, 1472.0, 952.0, 574.0, 409.0, 281.0, 201.0, 134.0, 101.0, 71.0, 50.0, 43.0, 25.0, 17.0, 9.0, 7.0, 1.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83251953125, -0.8054428100585938, -0.7783660888671875, -0.7512893676757812, -0.724212646484375, -0.6971359252929688, -0.6700592041015625, -0.6429824829101562, -0.61590576171875, -0.5888290405273438, -0.5617523193359375, -0.5346755981445312, -0.507598876953125, -0.48052215576171875, -0.4534454345703125, -0.42636871337890625, -0.3992919921875, -0.37221527099609375, -0.3451385498046875, -0.31806182861328125, -0.290985107421875, -0.26390838623046875, -0.2368316650390625, -0.20975494384765625, -0.18267822265625, -0.15560150146484375, -0.1285247802734375, -0.10144805908203125, -0.074371337890625, -0.04729461669921875, -0.0202178955078125, 0.00685882568359375, 0.033935546875, 0.06101226806640625, 0.0880889892578125, 0.11516571044921875, 0.142242431640625, 0.16931915283203125, 0.1963958740234375, 0.22347259521484375, 0.25054931640625, 0.27762603759765625, 0.3047027587890625, 0.33177947998046875, 0.358856201171875, 0.38593292236328125, 0.4130096435546875, 0.44008636474609375, 0.4671630859375, 0.49423980712890625, 0.5213165283203125, 0.5483932495117188, 0.575469970703125, 0.6025466918945312, 0.6296234130859375, 0.6567001342773438, 0.68377685546875, 0.7108535766601562, 0.7379302978515625, 0.7650070190429688, 0.792083740234375, 0.8191604614257812, 0.8462371826171875, 0.8733139038085938, 0.900390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 4.0, 7.0, 5.0, 13.0, 10.0, 26.0, 22.0, 31.0, 40.0, 50.0, 69.0, 78.0, 90.0, 91.0, 87.0, 85.0, 52.0, 58.0, 42.0, 27.0, 22.0, 12.0, 12.0, 10.0, 9.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.291015625, -0.2825279235839844, -0.27404022216796875, -0.2655525207519531, -0.2570648193359375, -0.24857711791992188, -0.24008941650390625, -0.23160171508789062, -0.223114013671875, -0.21462631225585938, -0.20613861083984375, -0.19765090942382812, -0.1891632080078125, -0.18067550659179688, -0.17218780517578125, -0.16370010375976562, -0.15521240234375, -0.14672470092773438, -0.13823699951171875, -0.12974929809570312, -0.1212615966796875, -0.11277389526367188, -0.10428619384765625, -0.09579849243164062, -0.087310791015625, -0.07882308959960938, -0.07033538818359375, -0.061847686767578125, -0.0533599853515625, -0.044872283935546875, -0.03638458251953125, -0.027896881103515625, -0.0194091796875, -0.010921478271484375, -0.00243377685546875, 0.006053924560546875, 0.0145416259765625, 0.023029327392578125, 0.03151702880859375, 0.040004730224609375, 0.048492431640625, 0.056980133056640625, 0.06546783447265625, 0.07395553588867188, 0.0824432373046875, 0.09093093872070312, 0.09941864013671875, 0.10790634155273438, 0.11639404296875, 0.12488174438476562, 0.13336944580078125, 0.14185714721679688, 0.1503448486328125, 0.15883255004882812, 0.16732025146484375, 0.17580795288085938, 0.184295654296875, 0.19278335571289062, 0.20127105712890625, 0.20975875854492188, 0.2182464599609375, 0.22673416137695312, 0.23522186279296875, 0.24370956420898438, 0.252197265625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 10.0, 3.0, 16.0, 13.0, 7.0, 29.0, 33.0, 24.0, 40.0, 36.0, 27.0, 50.0, 48.0, 66.0, 67.0, 63.0, 71.0, 60.0, 44.0, 50.0, 40.0, 25.0, 42.0, 29.0, 28.0, 15.0, 15.0, 11.0, 5.0, 1.0, 6.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.851507186889648, -6.601330757141113, -6.35115385055542, -6.100976943969727, -5.850800514221191, -5.600624084472656, -5.350447177886963, -5.1002702713012695, -4.850093841552734, -4.599917411804199, -4.349740505218506, -4.0995635986328125, -3.8493871688842773, -3.599210500717163, -3.349033832550049, -3.0988571643829346, -2.8486804962158203, -2.598503828048706, -2.348327159881592, -2.0981504917144775, -1.8479738235473633, -1.597797155380249, -1.3476204872131348, -1.0974438190460205, -0.8472671508789062, -0.597090482711792, -0.34691381454467773, -0.09673714637756348, 0.15343952178955078, 0.40361618995666504, 0.6537928581237793, 0.9039695262908936, 1.1541461944580078, 1.404322862625122, 1.6544995307922363, 1.9046761989593506, 2.154852867126465, 2.405029535293579, 2.6552062034606934, 2.9053828716278076, 3.155559539794922, 3.405736207962036, 3.6559128761291504, 3.9060895442962646, 4.156266212463379, 4.406442642211914, 4.656619548797607, 4.906796455383301, 5.156972885131836, 5.407149314880371, 5.6573262214660645, 5.907503128051758, 6.157679557800293, 6.407855987548828, 6.6580328941345215, 6.908209800720215, 7.15838623046875, 7.408562660217285, 7.6587395668029785, 7.908916473388672, 8.159092903137207, 8.409269332885742, 8.659446716308594, 8.909623146057129, 9.159799575805664]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 4.0, 7.0, 7.0, 10.0, 10.0, 18.0, 11.0, 18.0, 22.0, 28.0, 28.0, 42.0, 38.0, 30.0, 41.0, 39.0, 40.0, 31.0, 41.0, 43.0, 42.0, 45.0, 37.0, 39.0, 37.0, 40.0, 37.0, 17.0, 33.0, 27.0, 22.0, 18.0, 20.0, 16.0, 12.0, 16.0, 9.0, 3.0, 2.0, 8.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.120590686798096, -4.93440055847168, -4.748210906982422, -4.562020778656006, -4.37583065032959, -4.189640522003174, -4.003450393676758, -3.8172607421875, -3.631070613861084, -3.444880485534668, -3.258690595626831, -3.072500705718994, -2.886310577392578, -2.700120449066162, -2.513930559158325, -2.3277406692504883, -2.1415505409240723, -1.9553605318069458, -1.7691705226898193, -1.5829805135726929, -1.3967905044555664, -1.21060049533844, -1.0244104862213135, -0.838220477104187, -0.6520304679870605, -0.4658404588699341, -0.2796504497528076, -0.09346044063568115, 0.09272956848144531, 0.2789195775985718, 0.46510958671569824, 0.6512995958328247, 0.8374900817871094, 1.0236800909042358, 1.2098701000213623, 1.3960601091384888, 1.5822501182556152, 1.7684401273727417, 1.9546301364898682, 2.140820026397705, 2.327010154724121, 2.513200283050537, 2.699390172958374, 2.885580062866211, 3.071770191192627, 3.257960319519043, 3.44415020942688, 3.630340099334717, 3.816530227661133, 4.002720355987549, 4.188910484313965, 4.375100135803223, 4.561290264129639, 4.747480392456055, 4.9336700439453125, 5.1198601722717285, 5.3060503005981445, 5.4922404289245605, 5.678430557250977, 5.864620208740234, 6.05081033706665, 6.237000465393066, 6.423190116882324, 6.60938024520874, 6.795570373535156]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 8.0, 6.0, 11.0, 25.0, 21.0, 22.0, 56.0, 70.0, 105.0, 151.0, 227.0, 318.0, 488.0, 750.0, 1155.0, 1703.0, 2585.0, 3865.0, 6132.0, 9993.0, 16425.0, 27193.0, 45008.0, 72173.0, 106427.0, 141728.0, 158632.0, 145373.0, 110537.0, 75257.0, 46985.0, 28690.0, 17164.0, 10686.0, 6616.0, 4055.0, 2702.0, 1711.0, 1113.0, 740.0, 544.0, 357.0, 228.0, 190.0, 93.0, 78.0, 56.0, 36.0, 22.0, 19.0, 15.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.21875, -5.0533447265625, -4.887939453125, -4.7225341796875, -4.55712890625, -4.3917236328125, -4.226318359375, -4.0609130859375, -3.8955078125, -3.7301025390625, -3.564697265625, -3.3992919921875, -3.23388671875, -3.0684814453125, -2.903076171875, -2.7376708984375, -2.572265625, -2.4068603515625, -2.241455078125, -2.0760498046875, -1.91064453125, -1.7452392578125, -1.579833984375, -1.4144287109375, -1.2490234375, -1.0836181640625, -0.918212890625, -0.7528076171875, -0.58740234375, -0.4219970703125, -0.256591796875, -0.0911865234375, 0.07421875, 0.2396240234375, 0.405029296875, 0.5704345703125, 0.73583984375, 0.9012451171875, 1.066650390625, 1.2320556640625, 1.3974609375, 1.5628662109375, 1.728271484375, 1.8936767578125, 2.05908203125, 2.2244873046875, 2.389892578125, 2.5552978515625, 2.720703125, 2.8861083984375, 3.051513671875, 3.2169189453125, 3.38232421875, 3.5477294921875, 3.713134765625, 3.8785400390625, 4.0439453125, 4.2093505859375, 4.374755859375, 4.5401611328125, 4.70556640625, 4.8709716796875, 5.036376953125, 5.2017822265625, 5.3671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 10.0, 7.0, 8.0, 9.0, 14.0, 17.0, 16.0, 20.0, 34.0, 32.0, 27.0, 31.0, 30.0, 32.0, 34.0, 37.0, 50.0, 38.0, 43.0, 38.0, 35.0, 43.0, 35.0, 39.0, 38.0, 32.0, 42.0, 22.0, 34.0, 16.0, 14.0, 18.0, 14.0, 14.0, 17.0, 13.0, 12.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-6.015625, -5.83306884765625, -5.6505126953125, -5.46795654296875, -5.285400390625, -5.10284423828125, -4.9202880859375, -4.73773193359375, -4.55517578125, -4.37261962890625, -4.1900634765625, -4.00750732421875, -3.824951171875, -3.64239501953125, -3.4598388671875, -3.27728271484375, -3.0947265625, -2.91217041015625, -2.7296142578125, -2.54705810546875, -2.364501953125, -2.18194580078125, -1.9993896484375, -1.81683349609375, -1.63427734375, -1.45172119140625, -1.2691650390625, -1.08660888671875, -0.904052734375, -0.72149658203125, -0.5389404296875, -0.35638427734375, -0.173828125, 0.00872802734375, 0.1912841796875, 0.37384033203125, 0.556396484375, 0.73895263671875, 0.9215087890625, 1.10406494140625, 1.28662109375, 1.46917724609375, 1.6517333984375, 1.83428955078125, 2.016845703125, 2.19940185546875, 2.3819580078125, 2.56451416015625, 2.7470703125, 2.92962646484375, 3.1121826171875, 3.29473876953125, 3.477294921875, 3.65985107421875, 3.8424072265625, 4.02496337890625, 4.20751953125, 4.39007568359375, 4.5726318359375, 4.75518798828125, 4.937744140625, 5.12030029296875, 5.3028564453125, 5.48541259765625, 5.66796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 17.0, 17.0, 34.0, 47.0, 89.0, 120.0, 153.0, 260.0, 376.0, 577.0, 928.0, 1460.0, 2212.0, 3768.0, 6216.0, 10758.0, 18622.0, 33035.0, 57858.0, 97532.0, 145317.0, 177750.0, 170346.0, 127641.0, 81336.0, 47406.0, 27174.0, 15225.0, 8829.0, 5084.0, 3122.0, 1914.0, 1162.0, 775.0, 471.0, 331.0, 192.0, 130.0, 86.0, 48.0, 40.0, 29.0, 17.0, 17.0, 11.0, 9.0, 2.0, 2.0, 1.0, 4.0], "bins": [-7.53125, -7.32098388671875, -7.1107177734375, -6.90045166015625, -6.690185546875, -6.47991943359375, -6.2696533203125, -6.05938720703125, -5.84912109375, -5.63885498046875, -5.4285888671875, -5.21832275390625, -5.008056640625, -4.79779052734375, -4.5875244140625, -4.37725830078125, -4.1669921875, -3.95672607421875, -3.7464599609375, -3.53619384765625, -3.325927734375, -3.11566162109375, -2.9053955078125, -2.69512939453125, -2.48486328125, -2.27459716796875, -2.0643310546875, -1.85406494140625, -1.643798828125, -1.43353271484375, -1.2232666015625, -1.01300048828125, -0.802734375, -0.59246826171875, -0.3822021484375, -0.17193603515625, 0.038330078125, 0.24859619140625, 0.4588623046875, 0.66912841796875, 0.87939453125, 1.08966064453125, 1.2999267578125, 1.51019287109375, 1.720458984375, 1.93072509765625, 2.1409912109375, 2.35125732421875, 2.5615234375, 2.77178955078125, 2.9820556640625, 3.19232177734375, 3.402587890625, 3.61285400390625, 3.8231201171875, 4.03338623046875, 4.24365234375, 4.45391845703125, 4.6641845703125, 4.87445068359375, 5.084716796875, 5.29498291015625, 5.5052490234375, 5.71551513671875, 5.92578125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 7.0, 12.0, 10.0, 13.0, 9.0, 17.0, 24.0, 26.0, 24.0, 23.0, 39.0, 29.0, 44.0, 33.0, 50.0, 56.0, 53.0, 40.0, 54.0, 41.0, 39.0, 37.0, 37.0, 46.0, 44.0, 27.0, 33.0, 20.0, 29.0, 13.0, 16.0, 12.0, 12.0, 13.0, 7.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.345489501953125, -4.21441650390625, -4.083343505859375, -3.9522705078125, -3.821197509765625, -3.69012451171875, -3.559051513671875, -3.427978515625, -3.296905517578125, -3.16583251953125, -3.034759521484375, -2.9036865234375, -2.772613525390625, -2.64154052734375, -2.510467529296875, -2.37939453125, -2.248321533203125, -2.11724853515625, -1.986175537109375, -1.8551025390625, -1.724029541015625, -1.59295654296875, -1.461883544921875, -1.330810546875, -1.199737548828125, -1.06866455078125, -0.937591552734375, -0.8065185546875, -0.675445556640625, -0.54437255859375, -0.413299560546875, -0.2822265625, -0.151153564453125, -0.02008056640625, 0.110992431640625, 0.2420654296875, 0.373138427734375, 0.50421142578125, 0.635284423828125, 0.766357421875, 0.897430419921875, 1.02850341796875, 1.159576416015625, 1.2906494140625, 1.421722412109375, 1.55279541015625, 1.683868408203125, 1.81494140625, 1.946014404296875, 2.07708740234375, 2.208160400390625, 2.3392333984375, 2.470306396484375, 2.60137939453125, 2.732452392578125, 2.863525390625, 2.994598388671875, 3.12567138671875, 3.256744384765625, 3.3878173828125, 3.518890380859375, 3.64996337890625, 3.781036376953125, 3.912109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 11.0, 12.0, 17.0, 28.0, 31.0, 48.0, 66.0, 92.0, 151.0, 210.0, 352.0, 494.0, 708.0, 1164.0, 1637.0, 2501.0, 3921.0, 6287.0, 10190.0, 17364.0, 31057.0, 58118.0, 107790.0, 184125.0, 226949.0, 172632.0, 98770.0, 53240.0, 28500.0, 16217.0, 9516.0, 5739.0, 3553.0, 2356.0, 1514.0, 1068.0, 691.0, 464.0, 293.0, 217.0, 152.0, 94.0, 62.0, 57.0, 30.0, 22.0, 15.0, 6.0, 10.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0], "bins": [-5.3515625, -5.19146728515625, -5.0313720703125, -4.87127685546875, -4.711181640625, -4.55108642578125, -4.3909912109375, -4.23089599609375, -4.07080078125, -3.91070556640625, -3.7506103515625, -3.59051513671875, -3.430419921875, -3.27032470703125, -3.1102294921875, -2.95013427734375, -2.7900390625, -2.62994384765625, -2.4698486328125, -2.30975341796875, -2.149658203125, -1.98956298828125, -1.8294677734375, -1.66937255859375, -1.50927734375, -1.34918212890625, -1.1890869140625, -1.02899169921875, -0.868896484375, -0.70880126953125, -0.5487060546875, -0.38861083984375, -0.228515625, -0.06842041015625, 0.0916748046875, 0.25177001953125, 0.411865234375, 0.57196044921875, 0.7320556640625, 0.89215087890625, 1.05224609375, 1.21234130859375, 1.3724365234375, 1.53253173828125, 1.692626953125, 1.85272216796875, 2.0128173828125, 2.17291259765625, 2.3330078125, 2.49310302734375, 2.6531982421875, 2.81329345703125, 2.973388671875, 3.13348388671875, 3.2935791015625, 3.45367431640625, 3.61376953125, 3.77386474609375, 3.9339599609375, 4.09405517578125, 4.254150390625, 4.41424560546875, 4.5743408203125, 4.73443603515625, 4.89453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 9.0, 9.0, 20.0, 18.0, 18.0, 30.0, 48.0, 70.0, 60.0, 74.0, 97.0, 110.0, 78.0, 66.0, 45.0, 51.0, 45.0, 28.0, 25.0, 19.0, 14.0, 7.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005445480346679688, -0.0005231499671936035, -0.0005017518997192383, -0.00048035383224487305, -0.0004589557647705078, -0.0004375576972961426, -0.00041615962982177734, -0.0003947615623474121, -0.0003733634948730469, -0.00035196542739868164, -0.0003305673599243164, -0.00030916929244995117, -0.00028777122497558594, -0.0002663731575012207, -0.00024497509002685547, -0.00022357702255249023, -0.000202178955078125, -0.00018078088760375977, -0.00015938282012939453, -0.0001379847526550293, -0.00011658668518066406, -9.518861770629883e-05, -7.37905502319336e-05, -5.239248275756836e-05, -3.0994415283203125e-05, -9.59634780883789e-06, 1.1801719665527344e-05, 3.319978713989258e-05, 5.459785461425781e-05, 7.599592208862305e-05, 9.739398956298828e-05, 0.00011879205703735352, 0.00014019012451171875, 0.00016158819198608398, 0.00018298625946044922, 0.00020438432693481445, 0.0002257823944091797, 0.0002471804618835449, 0.00026857852935791016, 0.0002899765968322754, 0.0003113746643066406, 0.00033277273178100586, 0.0003541707992553711, 0.00037556886672973633, 0.00039696693420410156, 0.0004183650016784668, 0.00043976306915283203, 0.00046116113662719727, 0.0004825592041015625, 0.0005039572715759277, 0.000525355339050293, 0.0005467534065246582, 0.0005681514739990234, 0.0005895495414733887, 0.0006109476089477539, 0.0006323456764221191, 0.0006537437438964844, 0.0006751418113708496, 0.0006965398788452148, 0.0007179379463195801, 0.0007393360137939453, 0.0007607340812683105, 0.0007821321487426758, 0.000803530216217041, 0.0008249282836914062]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 9.0, 7.0, 26.0, 15.0, 29.0, 66.0, 82.0, 107.0, 162.0, 245.0, 392.0, 568.0, 900.0, 1420.0, 2106.0, 3431.0, 5692.0, 9308.0, 16031.0, 27388.0, 48392.0, 83870.0, 137566.0, 186655.0, 186971.0, 137582.0, 84147.0, 47809.0, 27381.0, 15514.0, 9324.0, 5626.0, 3468.0, 2163.0, 1432.0, 936.0, 570.0, 406.0, 247.0, 180.0, 112.0, 95.0, 45.0, 31.0, 14.0, 15.0, 4.0, 9.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.390625, -4.261474609375, -4.13232421875, -4.003173828125, -3.8740234375, -3.744873046875, -3.61572265625, -3.486572265625, -3.357421875, -3.228271484375, -3.09912109375, -2.969970703125, -2.8408203125, -2.711669921875, -2.58251953125, -2.453369140625, -2.32421875, -2.195068359375, -2.06591796875, -1.936767578125, -1.8076171875, -1.678466796875, -1.54931640625, -1.420166015625, -1.291015625, -1.161865234375, -1.03271484375, -0.903564453125, -0.7744140625, -0.645263671875, -0.51611328125, -0.386962890625, -0.2578125, -0.128662109375, 0.00048828125, 0.129638671875, 0.2587890625, 0.387939453125, 0.51708984375, 0.646240234375, 0.775390625, 0.904541015625, 1.03369140625, 1.162841796875, 1.2919921875, 1.421142578125, 1.55029296875, 1.679443359375, 1.80859375, 1.937744140625, 2.06689453125, 2.196044921875, 2.3251953125, 2.454345703125, 2.58349609375, 2.712646484375, 2.841796875, 2.970947265625, 3.10009765625, 3.229248046875, 3.3583984375, 3.487548828125, 3.61669921875, 3.745849609375, 3.875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 11.0, 13.0, 20.0, 22.0, 22.0, 25.0, 32.0, 51.0, 39.0, 51.0, 65.0, 66.0, 55.0, 62.0, 75.0, 48.0, 45.0, 57.0, 48.0, 30.0, 22.0, 24.0, 18.0, 14.0, 16.0, 16.0, 6.0, 5.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5673828125, -1.5213623046875, -1.475341796875, -1.4293212890625, -1.38330078125, -1.3372802734375, -1.291259765625, -1.2452392578125, -1.19921875, -1.1531982421875, -1.107177734375, -1.0611572265625, -1.01513671875, -0.9691162109375, -0.923095703125, -0.8770751953125, -0.8310546875, -0.7850341796875, -0.739013671875, -0.6929931640625, -0.64697265625, -0.6009521484375, -0.554931640625, -0.5089111328125, -0.462890625, -0.4168701171875, -0.370849609375, -0.3248291015625, -0.27880859375, -0.2327880859375, -0.186767578125, -0.1407470703125, -0.0947265625, -0.0487060546875, -0.002685546875, 0.0433349609375, 0.08935546875, 0.1353759765625, 0.181396484375, 0.2274169921875, 0.2734375, 0.3194580078125, 0.365478515625, 0.4114990234375, 0.45751953125, 0.5035400390625, 0.549560546875, 0.5955810546875, 0.6416015625, 0.6876220703125, 0.733642578125, 0.7796630859375, 0.82568359375, 0.8717041015625, 0.917724609375, 0.9637451171875, 1.009765625, 1.0557861328125, 1.101806640625, 1.1478271484375, 1.19384765625, 1.2398681640625, 1.285888671875, 1.3319091796875, 1.3779296875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 10.0, 23.0, 22.0, 15.0, 23.0, 30.0, 31.0, 33.0, 43.0, 48.0, 64.0, 57.0, 62.0, 71.0, 69.0, 47.0, 59.0, 59.0, 32.0, 39.0, 29.0, 22.0, 26.0, 17.0, 15.0, 18.0, 6.0, 2.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.949092864990234, -6.694309711456299, -6.439526557922363, -6.184743404388428, -5.929960250854492, -5.675177574157715, -5.420394420623779, -5.165611267089844, -4.910828113555908, -4.656044960021973, -4.401261806488037, -4.146478652954102, -3.891695737838745, -3.6369125843048096, -3.382129669189453, -3.1273465156555176, -2.872563362121582, -2.6177802085876465, -2.362997055053711, -2.1082141399383545, -1.853430986404419, -1.5986478328704834, -1.3438647985458374, -1.0890817642211914, -0.8342986106872559, -0.5795155167579651, -0.3247324228286743, -0.06994932889938354, 0.18483376502990723, 0.4396169185638428, 0.6943999528884888, 0.9491829872131348, 1.2039670944213867, 1.4587502479553223, 1.7135332822799683, 1.9683163166046143, 2.22309947013855, 2.4778826236724854, 2.732665538787842, 2.9874486923217773, 3.242231845855713, 3.4970149993896484, 3.751798152923584, 4.0065813064575195, 4.261363983154297, 4.516147613525391, 4.770930290222168, 5.0257134437561035, 5.280496597290039, 5.535279750823975, 5.79006290435791, 6.044846057891846, 6.299629211425781, 6.554411888122559, 6.809195041656494, 7.06397819519043, 7.318761348724365, 7.573544502258301, 7.828327655792236, 8.083110809326172, 8.33789348602295, 8.592677116394043, 8.84745979309082, 9.102243423461914, 9.357026100158691]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 7.0, 5.0, 5.0, 7.0, 13.0, 10.0, 16.0, 18.0, 19.0, 29.0, 30.0, 35.0, 36.0, 40.0, 45.0, 41.0, 43.0, 37.0, 43.0, 40.0, 63.0, 42.0, 37.0, 42.0, 42.0, 21.0, 30.0, 37.0, 25.0, 28.0, 19.0, 28.0, 20.0, 11.0, 10.0, 4.0, 13.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6435675621032715, -5.439590930938721, -5.235613822937012, -5.031637191772461, -4.827660083770752, -4.623683452606201, -4.419706344604492, -4.215729713439941, -4.011753082275391, -3.8077762126922607, -3.603799343109131, -3.39982271194458, -3.195845603942871, -2.9918689727783203, -2.7878921031951904, -2.5839152336120605, -2.3799381256103516, -2.1759612560272217, -1.9719843864440918, -1.7680076360702515, -1.5640307664871216, -1.3600538969039917, -1.1560771465301514, -0.9521002769470215, -0.7481234073638916, -0.5441465377807617, -0.3401697278022766, -0.1361929178237915, 0.06778395175933838, 0.27176082134246826, 0.4757375717163086, 0.6797144412994385, 0.8836908340454102, 1.08766770362854, 1.29164457321167, 1.4956213235855103, 1.6995981931686401, 1.90357506275177, 2.1075518131256104, 2.3115286827087402, 2.51550555229187, 2.719482421875, 2.92345929145813, 3.1274361610412598, 3.3314127922058105, 3.5353899002075195, 3.7393665313720703, 3.9433434009552, 4.14732027053833, 4.351296901702881, 4.55527400970459, 4.759250640869141, 4.96322774887085, 5.1672043800354, 5.371181488037109, 5.57515811920166, 5.779134750366211, 5.983111381530762, 6.187088489532471, 6.3910651206970215, 6.5950422286987305, 6.799018859863281, 7.002995491027832, 7.206972599029541, 7.41094970703125]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 11.0, 6.0, 17.0, 20.0, 25.0, 41.0, 60.0, 90.0, 125.0, 201.0, 255.0, 454.0, 703.0, 1148.0, 1711.0, 2954.0, 5385.0, 10340.0, 22037.0, 54361.0, 153052.0, 447750.0, 1015293.0, 1270366.0, 761360.0, 284100.0, 95870.0, 35159.0, 14338.0, 7232.0, 3795.0, 2158.0, 1314.0, 867.0, 523.0, 398.0, 241.0, 157.0, 112.0, 74.0, 63.0, 43.0, 23.0, 16.0, 11.0, 9.0, 9.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.1171875, -7.84912109375, -7.5810546875, -7.31298828125, -7.044921875, -6.77685546875, -6.5087890625, -6.24072265625, -5.97265625, -5.70458984375, -5.4365234375, -5.16845703125, -4.900390625, -4.63232421875, -4.3642578125, -4.09619140625, -3.828125, -3.56005859375, -3.2919921875, -3.02392578125, -2.755859375, -2.48779296875, -2.2197265625, -1.95166015625, -1.68359375, -1.41552734375, -1.1474609375, -0.87939453125, -0.611328125, -0.34326171875, -0.0751953125, 0.19287109375, 0.4609375, 0.72900390625, 0.9970703125, 1.26513671875, 1.533203125, 1.80126953125, 2.0693359375, 2.33740234375, 2.60546875, 2.87353515625, 3.1416015625, 3.40966796875, 3.677734375, 3.94580078125, 4.2138671875, 4.48193359375, 4.75, 5.01806640625, 5.2861328125, 5.55419921875, 5.822265625, 6.09033203125, 6.3583984375, 6.62646484375, 6.89453125, 7.16259765625, 7.4306640625, 7.69873046875, 7.966796875, 8.23486328125, 8.5029296875, 8.77099609375, 9.0390625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 9.0, 4.0, 12.0, 10.0, 9.0, 13.0, 15.0, 19.0, 21.0, 31.0, 29.0, 29.0, 36.0, 53.0, 38.0, 43.0, 55.0, 37.0, 44.0, 45.0, 35.0, 45.0, 44.0, 50.0, 26.0, 33.0, 33.0, 27.0, 30.0, 24.0, 23.0, 13.0, 22.0, 13.0, 10.0, 6.0, 2.0, 2.0, 5.0, 6.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.55450439453125, -4.3746337890625, -4.19476318359375, -4.014892578125, -3.83502197265625, -3.6551513671875, -3.47528076171875, -3.29541015625, -3.11553955078125, -2.9356689453125, -2.75579833984375, -2.575927734375, -2.39605712890625, -2.2161865234375, -2.03631591796875, -1.8564453125, -1.67657470703125, -1.4967041015625, -1.31683349609375, -1.136962890625, -0.95709228515625, -0.7772216796875, -0.59735107421875, -0.41748046875, -0.23760986328125, -0.0577392578125, 0.12213134765625, 0.302001953125, 0.48187255859375, 0.6617431640625, 0.84161376953125, 1.021484375, 1.20135498046875, 1.3812255859375, 1.56109619140625, 1.740966796875, 1.92083740234375, 2.1007080078125, 2.28057861328125, 2.46044921875, 2.64031982421875, 2.8201904296875, 3.00006103515625, 3.179931640625, 3.35980224609375, 3.5396728515625, 3.71954345703125, 3.8994140625, 4.07928466796875, 4.2591552734375, 4.43902587890625, 4.618896484375, 4.79876708984375, 4.9786376953125, 5.15850830078125, 5.33837890625, 5.51824951171875, 5.6981201171875, 5.87799072265625, 6.057861328125, 6.23773193359375, 6.4176025390625, 6.59747314453125, 6.77734375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 9.0, 16.0, 31.0, 30.0, 47.0, 84.0, 101.0, 173.0, 240.0, 343.0, 606.0, 880.0, 1526.0, 2462.0, 4302.0, 8224.0, 16129.0, 34774.0, 86072.0, 243086.0, 700467.0, 1364181.0, 1068645.0, 417775.0, 142040.0, 53058.0, 23244.0, 11242.0, 5971.0, 3353.0, 1914.0, 1175.0, 741.0, 440.0, 279.0, 193.0, 141.0, 87.0, 67.0, 36.0, 26.0, 22.0, 16.0, 8.0, 4.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.5546875, -10.21142578125, -9.8681640625, -9.52490234375, -9.181640625, -8.83837890625, -8.4951171875, -8.15185546875, -7.80859375, -7.46533203125, -7.1220703125, -6.77880859375, -6.435546875, -6.09228515625, -5.7490234375, -5.40576171875, -5.0625, -4.71923828125, -4.3759765625, -4.03271484375, -3.689453125, -3.34619140625, -3.0029296875, -2.65966796875, -2.31640625, -1.97314453125, -1.6298828125, -1.28662109375, -0.943359375, -0.60009765625, -0.2568359375, 0.08642578125, 0.4296875, 0.77294921875, 1.1162109375, 1.45947265625, 1.802734375, 2.14599609375, 2.4892578125, 2.83251953125, 3.17578125, 3.51904296875, 3.8623046875, 4.20556640625, 4.548828125, 4.89208984375, 5.2353515625, 5.57861328125, 5.921875, 6.26513671875, 6.6083984375, 6.95166015625, 7.294921875, 7.63818359375, 7.9814453125, 8.32470703125, 8.66796875, 9.01123046875, 9.3544921875, 9.69775390625, 10.041015625, 10.38427734375, 10.7275390625, 11.07080078125, 11.4140625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 4.0, 6.0, 12.0, 10.0, 12.0, 12.0, 22.0, 21.0, 31.0, 35.0, 65.0, 67.0, 99.0, 116.0, 166.0, 185.0, 224.0, 230.0, 284.0, 285.0, 303.0, 294.0, 283.0, 245.0, 206.0, 177.0, 146.0, 122.0, 81.0, 77.0, 57.0, 44.0, 44.0, 24.0, 23.0, 15.0, 12.0, 10.0, 8.0, 7.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.224609375, -2.139984130859375, -2.05535888671875, -1.970733642578125, -1.8861083984375, -1.801483154296875, -1.71685791015625, -1.632232666015625, -1.547607421875, -1.462982177734375, -1.37835693359375, -1.293731689453125, -1.2091064453125, -1.124481201171875, -1.03985595703125, -0.955230712890625, -0.87060546875, -0.785980224609375, -0.70135498046875, -0.616729736328125, -0.5321044921875, -0.447479248046875, -0.36285400390625, -0.278228759765625, -0.193603515625, -0.108978271484375, -0.02435302734375, 0.060272216796875, 0.1448974609375, 0.229522705078125, 0.31414794921875, 0.398773193359375, 0.4833984375, 0.568023681640625, 0.65264892578125, 0.737274169921875, 0.8218994140625, 0.906524658203125, 0.99114990234375, 1.075775146484375, 1.160400390625, 1.245025634765625, 1.32965087890625, 1.414276123046875, 1.4989013671875, 1.583526611328125, 1.66815185546875, 1.752777099609375, 1.83740234375, 1.922027587890625, 2.00665283203125, 2.091278076171875, 2.1759033203125, 2.260528564453125, 2.34515380859375, 2.429779052734375, 2.514404296875, 2.599029541015625, 2.68365478515625, 2.768280029296875, 2.8529052734375, 2.937530517578125, 3.02215576171875, 3.106781005859375, 3.19140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 12.0, 5.0, 9.0, 9.0, 11.0, 14.0, 27.0, 25.0, 32.0, 26.0, 28.0, 41.0, 37.0, 54.0, 52.0, 69.0, 60.0, 81.0, 58.0, 58.0, 47.0, 47.0, 34.0, 43.0, 26.0, 26.0, 16.0, 7.0, 11.0, 11.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.633728981018066, -6.382436752319336, -6.1311445236206055, -5.879852294921875, -5.6285600662231445, -5.377267837524414, -5.125976085662842, -4.874683856964111, -4.623391628265381, -4.37209939956665, -4.12080717086792, -3.8695151805877686, -3.618222951889038, -3.3669307231903076, -3.1156387329101562, -2.864346504211426, -2.6130542755126953, -2.361762046813965, -2.1104698181152344, -1.859177827835083, -1.6078855991363525, -1.356593370437622, -1.1053012609481812, -0.8540091514587402, -0.6027169227600098, -0.3514247536659241, -0.10013258457183838, 0.15115958452224731, 0.402451753616333, 0.6537439823150635, 0.9050360918045044, 1.1563282012939453, 1.4076204299926758, 1.6589126586914062, 1.9102047681808472, 2.161496877670288, 2.4127891063690186, 2.664081335067749, 2.9153733253479004, 3.166665554046631, 3.4179577827453613, 3.669250011444092, 3.9205422401428223, 4.171834468841553, 4.423126220703125, 4.6744184494018555, 4.925710678100586, 5.177002906799316, 5.428295135498047, 5.679587364196777, 5.930879592895508, 6.182171821594238, 6.433464050292969, 6.684756278991699, 6.9360480308532715, 7.187340259552002, 7.438632488250732, 7.689924716949463, 7.941216945648193, 8.192508697509766, 8.443800926208496, 8.695093154907227, 8.946385383605957, 9.197677612304688, 9.448969841003418]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 8.0, 13.0, 16.0, 14.0, 16.0, 25.0, 26.0, 23.0, 26.0, 46.0, 32.0, 49.0, 39.0, 47.0, 47.0, 33.0, 49.0, 45.0, 31.0, 50.0, 39.0, 41.0, 47.0, 39.0, 32.0, 25.0, 21.0, 25.0, 16.0, 9.0, 12.0, 8.0, 10.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.002016067504883, -5.8050150871276855, -5.60801362991333, -5.411012649536133, -5.2140116691589355, -5.017010688781738, -4.820009231567383, -4.6230082511901855, -4.426007270812988, -4.229006290435791, -4.0320048332214355, -3.8350038528442383, -3.638002872467041, -3.4410016536712646, -3.2440004348754883, -3.046999454498291, -2.8499979972839355, -2.652996778488159, -2.455995798110962, -2.2589945793151855, -2.0619935989379883, -1.864992380142212, -1.6679911613464355, -1.4709900617599487, -1.273988962173462, -1.076987862586975, -0.8799867033958435, -0.6829855442047119, -0.4859844446182251, -0.2889833450317383, -0.09198212623596191, 0.1050189733505249, 0.3020195960998535, 0.4990207254886627, 0.6960218548774719, 0.8930230140686035, 1.0900241136550903, 1.2870252132415771, 1.4840264320373535, 1.6810275316238403, 1.8780286312103271, 2.0750298500061035, 2.272030830383301, 2.469032049179077, 2.6660332679748535, 2.863034248352051, 3.060035467147827, 3.2570366859436035, 3.454037666320801, 3.651038885116577, 3.8480398654937744, 4.045041084289551, 4.242042064666748, 4.439043045043945, 4.636044502258301, 4.833045482635498, 5.030046463012695, 5.227047443389893, 5.424048900604248, 5.621049880981445, 5.818050861358643, 6.01505184173584, 6.212053298950195, 6.409054279327393, 6.606055736541748]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 7.0, 8.0, 7.0, 13.0, 15.0, 30.0, 37.0, 44.0, 91.0, 124.0, 216.0, 299.0, 514.0, 729.0, 1113.0, 1807.0, 2962.0, 5022.0, 8705.0, 15002.0, 26809.0, 48640.0, 86596.0, 144044.0, 196092.0, 191298.0, 135129.0, 79666.0, 44605.0, 24510.0, 14027.0, 8114.0, 4649.0, 2848.0, 1739.0, 1065.0, 660.0, 454.0, 291.0, 223.0, 122.0, 88.0, 44.0, 43.0, 18.0, 16.0, 7.0, 5.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.19140625, -2.122772216796875, -2.05413818359375, -1.985504150390625, -1.9168701171875, -1.848236083984375, -1.77960205078125, -1.710968017578125, -1.642333984375, -1.573699951171875, -1.50506591796875, -1.436431884765625, -1.3677978515625, -1.299163818359375, -1.23052978515625, -1.161895751953125, -1.09326171875, -1.024627685546875, -0.95599365234375, -0.887359619140625, -0.8187255859375, -0.750091552734375, -0.68145751953125, -0.612823486328125, -0.544189453125, -0.475555419921875, -0.40692138671875, -0.338287353515625, -0.2696533203125, -0.201019287109375, -0.13238525390625, -0.063751220703125, 0.0048828125, 0.073516845703125, 0.14215087890625, 0.210784912109375, 0.2794189453125, 0.348052978515625, 0.41668701171875, 0.485321044921875, 0.553955078125, 0.622589111328125, 0.69122314453125, 0.759857177734375, 0.8284912109375, 0.897125244140625, 0.96575927734375, 1.034393310546875, 1.10302734375, 1.171661376953125, 1.24029541015625, 1.308929443359375, 1.3775634765625, 1.446197509765625, 1.51483154296875, 1.583465576171875, 1.652099609375, 1.720733642578125, 1.78936767578125, 1.858001708984375, 1.9266357421875, 1.995269775390625, 2.06390380859375, 2.132537841796875, 2.201171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 4.0, 7.0, 9.0, 11.0, 17.0, 22.0, 19.0, 22.0, 24.0, 33.0, 30.0, 40.0, 28.0, 40.0, 48.0, 30.0, 46.0, 58.0, 32.0, 44.0, 43.0, 52.0, 50.0, 34.0, 40.0, 27.0, 27.0, 30.0, 27.0, 18.0, 19.0, 9.0, 9.0, 11.0, 11.0, 11.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.1727294921875, -5.962646484375, -5.7525634765625, -5.54248046875, -5.3323974609375, -5.122314453125, -4.9122314453125, -4.7021484375, -4.4920654296875, -4.281982421875, -4.0718994140625, -3.86181640625, -3.6517333984375, -3.441650390625, -3.2315673828125, -3.021484375, -2.8114013671875, -2.601318359375, -2.3912353515625, -2.18115234375, -1.9710693359375, -1.760986328125, -1.5509033203125, -1.3408203125, -1.1307373046875, -0.920654296875, -0.7105712890625, -0.50048828125, -0.2904052734375, -0.080322265625, 0.1297607421875, 0.33984375, 0.5499267578125, 0.760009765625, 0.9700927734375, 1.18017578125, 1.3902587890625, 1.600341796875, 1.8104248046875, 2.0205078125, 2.2305908203125, 2.440673828125, 2.6507568359375, 2.86083984375, 3.0709228515625, 3.281005859375, 3.4910888671875, 3.701171875, 3.9112548828125, 4.121337890625, 4.3314208984375, 4.54150390625, 4.7515869140625, 4.961669921875, 5.1717529296875, 5.3818359375, 5.5919189453125, 5.802001953125, 6.0120849609375, 6.22216796875, 6.4322509765625, 6.642333984375, 6.8524169921875, 7.0625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 10.0, 9.0, 12.0, 32.0, 42.0, 64.0, 110.0, 128.0, 212.0, 337.0, 449.0, 727.0, 1121.0, 1725.0, 2859.0, 4584.0, 7828.0, 13486.0, 25407.0, 110058.0, 773553.0, 55158.0, 21158.0, 11706.0, 6678.0, 4031.0, 2551.0, 1575.0, 1008.0, 672.0, 407.0, 270.0, 188.0, 114.0, 104.0, 48.0, 41.0, 28.0, 18.0, 16.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.6640625, -5.489013671875, -5.31396484375, -5.138916015625, -4.9638671875, -4.788818359375, -4.61376953125, -4.438720703125, -4.263671875, -4.088623046875, -3.91357421875, -3.738525390625, -3.5634765625, -3.388427734375, -3.21337890625, -3.038330078125, -2.86328125, -2.688232421875, -2.51318359375, -2.338134765625, -2.1630859375, -1.988037109375, -1.81298828125, -1.637939453125, -1.462890625, -1.287841796875, -1.11279296875, -0.937744140625, -0.7626953125, -0.587646484375, -0.41259765625, -0.237548828125, -0.0625, 0.112548828125, 0.28759765625, 0.462646484375, 0.6376953125, 0.812744140625, 0.98779296875, 1.162841796875, 1.337890625, 1.512939453125, 1.68798828125, 1.863037109375, 2.0380859375, 2.213134765625, 2.38818359375, 2.563232421875, 2.73828125, 2.913330078125, 3.08837890625, 3.263427734375, 3.4384765625, 3.613525390625, 3.78857421875, 3.963623046875, 4.138671875, 4.313720703125, 4.48876953125, 4.663818359375, 4.8388671875, 5.013916015625, 5.18896484375, 5.364013671875, 5.5390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 2.0, 8.0, 11.0, 8.0, 15.0, 7.0, 12.0, 8.0, 22.0, 27.0, 23.0, 30.0, 32.0, 30.0, 37.0, 28.0, 46.0, 41.0, 49.0, 41.0, 39.0, 39.0, 38.0, 34.0, 31.0, 37.0, 39.0, 28.0, 27.0, 28.0, 23.0, 19.0, 20.0, 25.0, 14.0, 14.0, 12.0, 9.0, 10.0, 4.0, 4.0, 5.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.27734375, -4.12957763671875, -3.9818115234375, -3.83404541015625, -3.686279296875, -3.53851318359375, -3.3907470703125, -3.24298095703125, -3.09521484375, -2.94744873046875, -2.7996826171875, -2.65191650390625, -2.504150390625, -2.35638427734375, -2.2086181640625, -2.06085205078125, -1.9130859375, -1.76531982421875, -1.6175537109375, -1.46978759765625, -1.322021484375, -1.17425537109375, -1.0264892578125, -0.87872314453125, -0.73095703125, -0.58319091796875, -0.4354248046875, -0.28765869140625, -0.139892578125, 0.00787353515625, 0.1556396484375, 0.30340576171875, 0.451171875, 0.59893798828125, 0.7467041015625, 0.89447021484375, 1.042236328125, 1.19000244140625, 1.3377685546875, 1.48553466796875, 1.63330078125, 1.78106689453125, 1.9288330078125, 2.07659912109375, 2.224365234375, 2.37213134765625, 2.5198974609375, 2.66766357421875, 2.8154296875, 2.96319580078125, 3.1109619140625, 3.25872802734375, 3.406494140625, 3.55426025390625, 3.7020263671875, 3.84979248046875, 3.99755859375, 4.14532470703125, 4.2930908203125, 4.44085693359375, 4.588623046875, 4.73638916015625, 4.8841552734375, 5.03192138671875, 5.1796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 12.0, 16.0, 14.0, 24.0, 33.0, 42.0, 61.0, 96.0, 133.0, 183.0, 246.0, 417.0, 619.0, 984.0, 1639.0, 2883.0, 5006.0, 9601.0, 20375.0, 63492.0, 793598.0, 100425.0, 23859.0, 11071.0, 5729.0, 3156.0, 1807.0, 1044.0, 700.0, 425.0, 301.0, 161.0, 99.0, 79.0, 78.0, 44.0, 23.0, 29.0, 15.0, 10.0, 11.0, 8.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.830078125, -0.8038101196289062, -0.7775421142578125, -0.7512741088867188, -0.725006103515625, -0.6987380981445312, -0.6724700927734375, -0.6462020874023438, -0.61993408203125, -0.5936660766601562, -0.5673980712890625, -0.5411300659179688, -0.514862060546875, -0.48859405517578125, -0.4623260498046875, -0.43605804443359375, -0.4097900390625, -0.38352203369140625, -0.3572540283203125, -0.33098602294921875, -0.304718017578125, -0.27845001220703125, -0.2521820068359375, -0.22591400146484375, -0.19964599609375, -0.17337799072265625, -0.1471099853515625, -0.12084197998046875, -0.094573974609375, -0.06830596923828125, -0.0420379638671875, -0.01576995849609375, 0.010498046875, 0.03676605224609375, 0.0630340576171875, 0.08930206298828125, 0.115570068359375, 0.14183807373046875, 0.1681060791015625, 0.19437408447265625, 0.22064208984375, 0.24691009521484375, 0.2731781005859375, 0.29944610595703125, 0.325714111328125, 0.35198211669921875, 0.3782501220703125, 0.40451812744140625, 0.4307861328125, 0.45705413818359375, 0.4833221435546875, 0.5095901489257812, 0.535858154296875, 0.5621261596679688, 0.5883941650390625, 0.6146621704101562, 0.64093017578125, 0.6671981811523438, 0.6934661865234375, 0.7197341918945312, 0.746002197265625, 0.7722702026367188, 0.7985382080078125, 0.8248062133789062, 0.85107421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 2.0, 10.0, 7.0, 14.0, 16.0, 13.0, 34.0, 37.0, 57.0, 79.0, 87.0, 98.0, 104.0, 100.0, 96.0, 60.0, 43.0, 32.0, 25.0, 21.0, 15.0, 14.0, 9.0, 10.0, 5.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.334087371826172e-05, -8.953548967838287e-05, -8.573010563850403e-05, -8.192472159862518e-05, -7.811933755874634e-05, -7.431395351886749e-05, -7.050856947898865e-05, -6.67031854391098e-05, -6.289780139923096e-05, -5.909241735935211e-05, -5.5287033319473267e-05, -5.148164927959442e-05, -4.7676265239715576e-05, -4.387088119983673e-05, -4.0065497159957886e-05, -3.626011312007904e-05, -3.2454729080200195e-05, -2.864934504032135e-05, -2.4843961000442505e-05, -2.103857696056366e-05, -1.7233192920684814e-05, -1.342780888080597e-05, -9.622424840927124e-06, -5.817040801048279e-06, -2.0116567611694336e-06, 1.7937272787094116e-06, 5.599111318588257e-06, 9.404495358467102e-06, 1.3209879398345947e-05, 1.7015263438224792e-05, 2.0820647478103638e-05, 2.4626031517982483e-05, 2.8431415557861328e-05, 3.223679959774017e-05, 3.604218363761902e-05, 3.9847567677497864e-05, 4.365295171737671e-05, 4.7458335757255554e-05, 5.12637197971344e-05, 5.5069103837013245e-05, 5.887448787689209e-05, 6.267987191677094e-05, 6.648525595664978e-05, 7.029063999652863e-05, 7.409602403640747e-05, 7.790140807628632e-05, 8.170679211616516e-05, 8.5512176156044e-05, 8.931756019592285e-05, 9.31229442358017e-05, 9.692832827568054e-05, 0.00010073371231555939, 0.00010453909635543823, 0.00010834448039531708, 0.00011214986443519592, 0.00011595524847507477, 0.00011976063251495361, 0.00012356601655483246, 0.0001273714005947113, 0.00013117678463459015, 0.000134982168674469, 0.00013878755271434784, 0.00014259293675422668, 0.00014639832079410553, 0.00015020370483398438]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 8.0, 8.0, 8.0, 21.0, 24.0, 33.0, 47.0, 66.0, 85.0, 117.0, 186.0, 249.0, 353.0, 495.0, 752.0, 1119.0, 1768.0, 2635.0, 4221.0, 6773.0, 10991.0, 19215.0, 32968.0, 59471.0, 105302.0, 171500.0, 210693.0, 171216.0, 106136.0, 59454.0, 33547.0, 19145.0, 11167.0, 6647.0, 4207.0, 2610.0, 1763.0, 1135.0, 736.0, 485.0, 327.0, 269.0, 180.0, 122.0, 82.0, 63.0, 46.0, 32.0, 19.0, 21.0, 11.0, 11.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0], "bins": [-0.55322265625, -0.5362014770507812, -0.5191802978515625, -0.5021591186523438, -0.485137939453125, -0.46811676025390625, -0.4510955810546875, -0.43407440185546875, -0.41705322265625, -0.40003204345703125, -0.3830108642578125, -0.36598968505859375, -0.348968505859375, -0.33194732666015625, -0.3149261474609375, -0.29790496826171875, -0.2808837890625, -0.26386260986328125, -0.2468414306640625, -0.22982025146484375, -0.212799072265625, -0.19577789306640625, -0.1787567138671875, -0.16173553466796875, -0.14471435546875, -0.12769317626953125, -0.1106719970703125, -0.09365081787109375, -0.076629638671875, -0.05960845947265625, -0.0425872802734375, -0.02556610107421875, -0.008544921875, 0.00847625732421875, 0.0254974365234375, 0.04251861572265625, 0.059539794921875, 0.07656097412109375, 0.0935821533203125, 0.11060333251953125, 0.12762451171875, 0.14464569091796875, 0.1616668701171875, 0.17868804931640625, 0.195709228515625, 0.21273040771484375, 0.2297515869140625, 0.24677276611328125, 0.2637939453125, 0.28081512451171875, 0.2978363037109375, 0.31485748291015625, 0.331878662109375, 0.34889984130859375, 0.3659210205078125, 0.38294219970703125, 0.39996337890625, 0.41698455810546875, 0.4340057373046875, 0.45102691650390625, 0.468048095703125, 0.48506927490234375, 0.5020904541015625, 0.5191116333007812, 0.5361328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 12.0, 12.0, 17.0, 22.0, 18.0, 26.0, 15.0, 37.0, 32.0, 43.0, 45.0, 52.0, 50.0, 61.0, 47.0, 60.0, 59.0, 49.0, 52.0, 56.0, 45.0, 36.0, 30.0, 18.0, 20.0, 18.0, 24.0, 8.0, 4.0, 8.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.16033554077148438, -0.15477752685546875, -0.14921951293945312, -0.1436614990234375, -0.13810348510742188, -0.13254547119140625, -0.12698745727539062, -0.121429443359375, -0.11587142944335938, -0.11031341552734375, -0.10475540161132812, -0.0991973876953125, -0.09363937377929688, -0.08808135986328125, -0.08252334594726562, -0.07696533203125, -0.07140731811523438, -0.06584930419921875, -0.060291290283203125, -0.0547332763671875, -0.049175262451171875, -0.04361724853515625, -0.038059234619140625, -0.032501220703125, -0.026943206787109375, -0.02138519287109375, -0.015827178955078125, -0.0102691650390625, -0.004711151123046875, 0.00084686279296875, 0.006404876708984375, 0.011962890625, 0.017520904541015625, 0.02307891845703125, 0.028636932373046875, 0.0341949462890625, 0.039752960205078125, 0.04531097412109375, 0.050868988037109375, 0.056427001953125, 0.061985015869140625, 0.06754302978515625, 0.07310104370117188, 0.0786590576171875, 0.08421707153320312, 0.08977508544921875, 0.09533309936523438, 0.10089111328125, 0.10644912719726562, 0.11200714111328125, 0.11756515502929688, 0.1231231689453125, 0.12868118286132812, 0.13423919677734375, 0.13979721069335938, 0.145355224609375, 0.15091323852539062, 0.15647125244140625, 0.16202926635742188, 0.1675872802734375, 0.17314529418945312, 0.17870330810546875, 0.18426132202148438, 0.1898193359375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 9.0, 9.0, 15.0, 6.0, 19.0, 25.0, 26.0, 32.0, 21.0, 35.0, 43.0, 27.0, 57.0, 56.0, 58.0, 68.0, 55.0, 74.0, 51.0, 46.0, 42.0, 37.0, 39.0, 35.0, 23.0, 15.0, 17.0, 12.0, 10.0, 3.0, 3.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.066775798797607, -5.827760696411133, -5.588746070861816, -5.349730968475342, -5.110716342926025, -4.871701240539551, -4.632686614990234, -4.39367151260376, -4.154656410217285, -3.9156415462493896, -3.676626682281494, -3.4376115798950195, -3.198596954345703, -2.9595818519592285, -2.720566987991333, -2.4815521240234375, -2.242537498474121, -2.0035226345062256, -1.76450777053833, -1.525492787361145, -1.2864779233932495, -1.047463059425354, -0.808448076248169, -0.5694332122802734, -0.33041834831237793, -0.09140345454216003, 0.14761143922805786, 0.38662636280059814, 0.6256412267684937, 0.8646560907363892, 1.1036710739135742, 1.3426859378814697, 1.5817012786865234, 1.820716142654419, 2.0597310066223145, 2.298746109008789, 2.5377607345581055, 2.77677583694458, 3.0157907009124756, 3.254805564880371, 3.4938204288482666, 3.732835292816162, 3.9718501567840576, 4.210865020751953, 4.449880123138428, 4.688894748687744, 4.927909851074219, 5.166924476623535, 5.40593957901001, 5.644954681396484, 5.883969306945801, 6.122984409332275, 6.361999034881592, 6.601014137268066, 6.840028762817383, 7.079043865203857, 7.318058967590332, 7.557074069976807, 7.796088695526123, 8.035103797912598, 8.274118423461914, 8.51313304901123, 8.752148628234863, 8.99116325378418, 9.230177879333496]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 8.0, 13.0, 14.0, 15.0, 17.0, 25.0, 20.0, 30.0, 21.0, 47.0, 27.0, 45.0, 43.0, 46.0, 50.0, 32.0, 50.0, 48.0, 32.0, 38.0, 44.0, 43.0, 46.0, 40.0, 37.0, 27.0, 21.0, 27.0, 12.0, 13.0, 11.0, 10.0, 8.0, 10.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.009172439575195, -5.813447952270508, -5.61772346496582, -5.421998977661133, -5.226274490356445, -5.030550003051758, -4.83482551574707, -4.639100551605225, -4.443376064300537, -4.24765157699585, -4.051927089691162, -3.8562026023864746, -3.660477876663208, -3.4647533893585205, -3.269028902053833, -3.0733041763305664, -2.877579927444458, -2.6818554401397705, -2.486130952835083, -2.2904062271118164, -2.094681739807129, -1.8989572525024414, -1.703232765197754, -1.5075081586837769, -1.3117836713790894, -1.1160591840744019, -0.9203345775604248, -0.7246100902557373, -0.528885543346405, -0.33316099643707275, -0.13743650913238525, 0.0582880973815918, 0.2540125846862793, 0.4497371315956116, 0.6454616785049438, 0.8411861658096313, 1.0369107723236084, 1.232635259628296, 1.4283597469329834, 1.6240843534469604, 1.819808840751648, 2.015533447265625, 2.2112579345703125, 2.406982421875, 2.6027069091796875, 2.798431396484375, 2.9941558837890625, 3.189880609512329, 3.3856050968170166, 3.581329584121704, 3.7770540714263916, 3.972778797149658, 4.168503284454346, 4.364227771759033, 4.559952259063721, 4.755676746368408, 4.951401233673096, 5.147125720977783, 5.342850208282471, 5.538574695587158, 5.734299182891846, 5.930024147033691, 6.125748634338379, 6.321473121643066, 6.517197608947754]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 9.0, 11.0, 5.0, 21.0, 28.0, 32.0, 47.0, 58.0, 100.0, 143.0, 188.0, 312.0, 449.0, 645.0, 1095.0, 1708.0, 3050.0, 5475.0, 10662.0, 22536.0, 52014.0, 122489.0, 240546.0, 277207.0, 170349.0, 75409.0, 32502.0, 14479.0, 7145.0, 3942.0, 2202.0, 1280.0, 792.0, 498.0, 378.0, 239.0, 146.0, 127.0, 62.0, 55.0, 42.0, 28.0, 17.0, 15.0, 12.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.9375, -9.6290283203125, -9.320556640625, -9.0120849609375, -8.70361328125, -8.3951416015625, -8.086669921875, -7.7781982421875, -7.4697265625, -7.1612548828125, -6.852783203125, -6.5443115234375, -6.23583984375, -5.9273681640625, -5.618896484375, -5.3104248046875, -5.001953125, -4.6934814453125, -4.385009765625, -4.0765380859375, -3.76806640625, -3.4595947265625, -3.151123046875, -2.8426513671875, -2.5341796875, -2.2257080078125, -1.917236328125, -1.6087646484375, -1.30029296875, -0.9918212890625, -0.683349609375, -0.3748779296875, -0.06640625, 0.2420654296875, 0.550537109375, 0.8590087890625, 1.16748046875, 1.4759521484375, 1.784423828125, 2.0928955078125, 2.4013671875, 2.7098388671875, 3.018310546875, 3.3267822265625, 3.63525390625, 3.9437255859375, 4.252197265625, 4.5606689453125, 4.869140625, 5.1776123046875, 5.486083984375, 5.7945556640625, 6.10302734375, 6.4114990234375, 6.719970703125, 7.0284423828125, 7.3369140625, 7.6453857421875, 7.953857421875, 8.2623291015625, 8.57080078125, 8.8792724609375, 9.187744140625, 9.4962158203125, 9.8046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 6.0, 2.0, 6.0, 5.0, 16.0, 11.0, 18.0, 15.0, 25.0, 26.0, 26.0, 32.0, 32.0, 36.0, 26.0, 43.0, 45.0, 40.0, 48.0, 41.0, 49.0, 38.0, 36.0, 42.0, 38.0, 43.0, 47.0, 29.0, 29.0, 15.0, 23.0, 22.0, 22.0, 14.0, 16.0, 9.0, 11.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.93255615234375, -5.7401123046875, -5.54766845703125, -5.355224609375, -5.16278076171875, -4.9703369140625, -4.77789306640625, -4.58544921875, -4.39300537109375, -4.2005615234375, -4.00811767578125, -3.815673828125, -3.62322998046875, -3.4307861328125, -3.23834228515625, -3.0458984375, -2.85345458984375, -2.6610107421875, -2.46856689453125, -2.276123046875, -2.08367919921875, -1.8912353515625, -1.69879150390625, -1.50634765625, -1.31390380859375, -1.1214599609375, -0.92901611328125, -0.736572265625, -0.54412841796875, -0.3516845703125, -0.15924072265625, 0.033203125, 0.22564697265625, 0.4180908203125, 0.61053466796875, 0.802978515625, 0.99542236328125, 1.1878662109375, 1.38031005859375, 1.57275390625, 1.76519775390625, 1.9576416015625, 2.15008544921875, 2.342529296875, 2.53497314453125, 2.7274169921875, 2.91986083984375, 3.1123046875, 3.30474853515625, 3.4971923828125, 3.68963623046875, 3.882080078125, 4.07452392578125, 4.2669677734375, 4.45941162109375, 4.65185546875, 4.84429931640625, 5.0367431640625, 5.22918701171875, 5.421630859375, 5.61407470703125, 5.8065185546875, 5.99896240234375, 6.19140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 6.0, 5.0, 25.0, 31.0, 59.0, 72.0, 89.0, 144.0, 229.0, 330.0, 487.0, 702.0, 1079.0, 1706.0, 2727.0, 4419.0, 7394.0, 12855.0, 22812.0, 41298.0, 74663.0, 127713.0, 182986.0, 196337.0, 152931.0, 94714.0, 53502.0, 29128.0, 16190.0, 9287.0, 5335.0, 3311.0, 2086.0, 1327.0, 821.0, 563.0, 386.0, 273.0, 171.0, 105.0, 93.0, 50.0, 43.0, 24.0, 21.0, 10.0, 2.0, 2.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.40234375, -7.1651611328125, -6.927978515625, -6.6907958984375, -6.45361328125, -6.2164306640625, -5.979248046875, -5.7420654296875, -5.5048828125, -5.2677001953125, -5.030517578125, -4.7933349609375, -4.55615234375, -4.3189697265625, -4.081787109375, -3.8446044921875, -3.607421875, -3.3702392578125, -3.133056640625, -2.8958740234375, -2.65869140625, -2.4215087890625, -2.184326171875, -1.9471435546875, -1.7099609375, -1.4727783203125, -1.235595703125, -0.9984130859375, -0.76123046875, -0.5240478515625, -0.286865234375, -0.0496826171875, 0.1875, 0.4246826171875, 0.661865234375, 0.8990478515625, 1.13623046875, 1.3734130859375, 1.610595703125, 1.8477783203125, 2.0849609375, 2.3221435546875, 2.559326171875, 2.7965087890625, 3.03369140625, 3.2708740234375, 3.508056640625, 3.7452392578125, 3.982421875, 4.2196044921875, 4.456787109375, 4.6939697265625, 4.93115234375, 5.1683349609375, 5.405517578125, 5.6427001953125, 5.8798828125, 6.1170654296875, 6.354248046875, 6.5914306640625, 6.82861328125, 7.0657958984375, 7.302978515625, 7.5401611328125, 7.77734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 4.0, 8.0, 11.0, 7.0, 18.0, 13.0, 20.0, 17.0, 24.0, 25.0, 25.0, 42.0, 47.0, 32.0, 31.0, 46.0, 30.0, 45.0, 39.0, 36.0, 36.0, 35.0, 47.0, 41.0, 30.0, 38.0, 26.0, 29.0, 30.0, 14.0, 17.0, 25.0, 21.0, 8.0, 8.0, 15.0, 9.0, 9.0, 9.0, 8.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.173828125, -3.062744140625, -2.95166015625, -2.840576171875, -2.7294921875, -2.618408203125, -2.50732421875, -2.396240234375, -2.28515625, -2.174072265625, -2.06298828125, -1.951904296875, -1.8408203125, -1.729736328125, -1.61865234375, -1.507568359375, -1.396484375, -1.285400390625, -1.17431640625, -1.063232421875, -0.9521484375, -0.841064453125, -0.72998046875, -0.618896484375, -0.5078125, -0.396728515625, -0.28564453125, -0.174560546875, -0.0634765625, 0.047607421875, 0.15869140625, 0.269775390625, 0.380859375, 0.491943359375, 0.60302734375, 0.714111328125, 0.8251953125, 0.936279296875, 1.04736328125, 1.158447265625, 1.26953125, 1.380615234375, 1.49169921875, 1.602783203125, 1.7138671875, 1.824951171875, 1.93603515625, 2.047119140625, 2.158203125, 2.269287109375, 2.38037109375, 2.491455078125, 2.6025390625, 2.713623046875, 2.82470703125, 2.935791015625, 3.046875, 3.157958984375, 3.26904296875, 3.380126953125, 3.4912109375, 3.602294921875, 3.71337890625, 3.824462890625, 3.935546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 12.0, 15.0, 21.0, 26.0, 33.0, 53.0, 61.0, 89.0, 99.0, 171.0, 233.0, 305.0, 455.0, 604.0, 935.0, 1392.0, 2122.0, 3703.0, 6625.0, 12757.0, 26600.0, 58522.0, 129315.0, 243278.0, 265804.0, 156801.0, 71456.0, 32170.0, 15357.0, 7884.0, 4263.0, 2505.0, 1560.0, 1004.0, 632.0, 477.0, 329.0, 222.0, 194.0, 128.0, 90.0, 84.0, 55.0, 38.0, 20.0, 12.0, 21.0, 11.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0], "bins": [-5.484375, -5.32366943359375, -5.1629638671875, -5.00225830078125, -4.841552734375, -4.68084716796875, -4.5201416015625, -4.35943603515625, -4.19873046875, -4.03802490234375, -3.8773193359375, -3.71661376953125, -3.555908203125, -3.39520263671875, -3.2344970703125, -3.07379150390625, -2.9130859375, -2.75238037109375, -2.5916748046875, -2.43096923828125, -2.270263671875, -2.10955810546875, -1.9488525390625, -1.78814697265625, -1.62744140625, -1.46673583984375, -1.3060302734375, -1.14532470703125, -0.984619140625, -0.82391357421875, -0.6632080078125, -0.50250244140625, -0.341796875, -0.18109130859375, -0.0203857421875, 0.14031982421875, 0.301025390625, 0.46173095703125, 0.6224365234375, 0.78314208984375, 0.94384765625, 1.10455322265625, 1.2652587890625, 1.42596435546875, 1.586669921875, 1.74737548828125, 1.9080810546875, 2.06878662109375, 2.2294921875, 2.39019775390625, 2.5509033203125, 2.71160888671875, 2.872314453125, 3.03302001953125, 3.1937255859375, 3.35443115234375, 3.51513671875, 3.67584228515625, 3.8365478515625, 3.99725341796875, 4.157958984375, 4.31866455078125, 4.4793701171875, 4.64007568359375, 4.80078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 10.0, 14.0, 11.0, 20.0, 24.0, 43.0, 53.0, 90.0, 102.0, 107.0, 110.0, 112.0, 73.0, 68.0, 33.0, 30.0, 27.0, 13.0, 10.0, 9.0, 9.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0007758140563964844, -0.0007547512650489807, -0.000733688473701477, -0.0007126256823539734, -0.0006915628910064697, -0.0006705000996589661, -0.0006494373083114624, -0.0006283745169639587, -0.0006073117256164551, -0.0005862489342689514, -0.0005651861429214478, -0.0005441233515739441, -0.0005230605602264404, -0.0005019977688789368, -0.0004809349775314331, -0.00045987218618392944, -0.0004388093948364258, -0.0004177466034889221, -0.00039668381214141846, -0.0003756210207939148, -0.00035455822944641113, -0.00033349543809890747, -0.0003124326467514038, -0.00029136985540390015, -0.0002703070640563965, -0.0002492442727088928, -0.00022818148136138916, -0.0002071186900138855, -0.00018605589866638184, -0.00016499310731887817, -0.0001439303159713745, -0.00012286752462387085, -0.00010180473327636719, -8.074194192886353e-05, -5.967915058135986e-05, -3.86163592338562e-05, -1.755356788635254e-05, 3.509223461151123e-06, 2.4572014808654785e-05, 4.563480615615845e-05, 6.669759750366211e-05, 8.776038885116577e-05, 0.00010882318019866943, 0.0001298859715461731, 0.00015094876289367676, 0.00017201155424118042, 0.00019307434558868408, 0.00021413713693618774, 0.0002351999282836914, 0.00025626271963119507, 0.00027732551097869873, 0.0002983883023262024, 0.00031945109367370605, 0.0003405138850212097, 0.0003615766763687134, 0.00038263946771621704, 0.0004037022590637207, 0.00042476505041122437, 0.00044582784175872803, 0.0004668906331062317, 0.00048795342445373535, 0.000509016215801239, 0.0005300790071487427, 0.0005511417984962463, 0.00057220458984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 9.0, 6.0, 24.0, 19.0, 30.0, 74.0, 91.0, 143.0, 188.0, 300.0, 461.0, 670.0, 1048.0, 1663.0, 2725.0, 4510.0, 7881.0, 14472.0, 27449.0, 54641.0, 109570.0, 191141.0, 237037.0, 182992.0, 102245.0, 51000.0, 25820.0, 13479.0, 7483.0, 4248.0, 2641.0, 1602.0, 1015.0, 628.0, 397.0, 267.0, 202.0, 120.0, 78.0, 66.0, 41.0, 23.0, 18.0, 9.0, 9.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.1072998046875, -3.972412109375, -3.8375244140625, -3.70263671875, -3.5677490234375, -3.432861328125, -3.2979736328125, -3.1630859375, -3.0281982421875, -2.893310546875, -2.7584228515625, -2.62353515625, -2.4886474609375, -2.353759765625, -2.2188720703125, -2.083984375, -1.9490966796875, -1.814208984375, -1.6793212890625, -1.54443359375, -1.4095458984375, -1.274658203125, -1.1397705078125, -1.0048828125, -0.8699951171875, -0.735107421875, -0.6002197265625, -0.46533203125, -0.3304443359375, -0.195556640625, -0.0606689453125, 0.07421875, 0.2091064453125, 0.343994140625, 0.4788818359375, 0.61376953125, 0.7486572265625, 0.883544921875, 1.0184326171875, 1.1533203125, 1.2882080078125, 1.423095703125, 1.5579833984375, 1.69287109375, 1.8277587890625, 1.962646484375, 2.0975341796875, 2.232421875, 2.3673095703125, 2.502197265625, 2.6370849609375, 2.77197265625, 2.9068603515625, 3.041748046875, 3.1766357421875, 3.3115234375, 3.4464111328125, 3.581298828125, 3.7161865234375, 3.85107421875, 3.9859619140625, 4.120849609375, 4.2557373046875, 4.390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 9.0, 4.0, 3.0, 7.0, 8.0, 6.0, 8.0, 17.0, 11.0, 23.0, 24.0, 20.0, 31.0, 24.0, 36.0, 37.0, 57.0, 45.0, 60.0, 48.0, 61.0, 56.0, 48.0, 46.0, 47.0, 43.0, 47.0, 30.0, 37.0, 21.0, 16.0, 9.0, 10.0, 13.0, 9.0, 8.0, 4.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-1.1044921875, -1.0728378295898438, -1.0411834716796875, -1.0095291137695312, -0.977874755859375, -0.9462203979492188, -0.9145660400390625, -0.8829116821289062, -0.85125732421875, -0.8196029663085938, -0.7879486083984375, -0.7562942504882812, -0.724639892578125, -0.6929855346679688, -0.6613311767578125, -0.6296768188476562, -0.5980224609375, -0.5663681030273438, -0.5347137451171875, -0.5030593872070312, -0.471405029296875, -0.43975067138671875, -0.4080963134765625, -0.37644195556640625, -0.34478759765625, -0.31313323974609375, -0.2814788818359375, -0.24982452392578125, -0.218170166015625, -0.18651580810546875, -0.1548614501953125, -0.12320709228515625, -0.091552734375, -0.05989837646484375, -0.0282440185546875, 0.00341033935546875, 0.035064697265625, 0.06671905517578125, 0.0983734130859375, 0.13002777099609375, 0.16168212890625, 0.19333648681640625, 0.2249908447265625, 0.25664520263671875, 0.288299560546875, 0.31995391845703125, 0.3516082763671875, 0.38326263427734375, 0.4149169921875, 0.44657135009765625, 0.4782257080078125, 0.5098800659179688, 0.541534423828125, 0.5731887817382812, 0.6048431396484375, 0.6364974975585938, 0.66815185546875, 0.6998062133789062, 0.7314605712890625, 0.7631149291992188, 0.794769287109375, 0.8264236450195312, 0.8580780029296875, 0.8897323608398438, 0.92138671875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 4.0, 5.0, 10.0, 8.0, 9.0, 20.0, 17.0, 18.0, 20.0, 27.0, 31.0, 26.0, 46.0, 47.0, 51.0, 53.0, 44.0, 53.0, 64.0, 61.0, 57.0, 41.0, 49.0, 45.0, 39.0, 31.0, 22.0, 15.0, 22.0, 15.0, 14.0, 6.0, 7.0, 13.0, 3.0, 4.0, 1.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.669829845428467, -5.44361686706543, -5.217403888702393, -4.9911909103393555, -4.764978408813477, -4.5387654304504395, -4.312552452087402, -4.086339473724365, -3.8601267337799072, -3.63391375541687, -3.407701015472412, -3.181488037109375, -2.955275058746338, -2.72906231880188, -2.5028493404388428, -2.2766366004943848, -2.0504236221313477, -1.8242107629776, -1.5979979038238525, -1.3717849254608154, -1.1455720663070679, -0.9193592071533203, -0.6931462287902832, -0.46693336963653564, -0.24072051048278809, -0.01450762152671814, 0.2117052674293518, 0.43791818618774414, 0.6641310453414917, 0.8903439044952393, 1.1165568828582764, 1.342769742012024, 1.5689830780029297, 1.7951959371566772, 2.021408796310425, 2.247621774673462, 2.47383451461792, 2.700047492980957, 2.926260471343994, 3.1524734497070312, 3.3786861896514893, 3.6048991680145264, 3.8311119079589844, 4.0573248863220215, 4.283537864685059, 4.5097503662109375, 4.735963821411133, 4.962176322937012, 5.188389301300049, 5.414602279663086, 5.640815258026123, 5.86702823638916, 6.093240737915039, 6.319453716278076, 6.545666694641113, 6.77187967300415, 6.9980926513671875, 7.224305629730225, 7.450518608093262, 7.676731109619141, 7.902944087982178, 8.129157066345215, 8.355369567871094, 8.581583023071289, 8.807795524597168]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 8.0, 12.0, 10.0, 12.0, 17.0, 27.0, 28.0, 26.0, 31.0, 28.0, 29.0, 43.0, 49.0, 39.0, 43.0, 39.0, 47.0, 43.0, 39.0, 52.0, 32.0, 38.0, 43.0, 39.0, 38.0, 29.0, 27.0, 19.0, 16.0, 11.0, 15.0, 13.0, 7.0, 7.0, 11.0, 10.0, 7.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.829577445983887, -5.636209011077881, -5.442840576171875, -5.249472141265869, -5.056103706359863, -4.862735271453857, -4.669366836547852, -4.475998878479004, -4.28262996673584, -4.089261531829834, -3.895893096923828, -3.7025246620178223, -3.5091562271118164, -3.3157877922058105, -3.122419595718384, -2.929051160812378, -2.735682964324951, -2.5423145294189453, -2.3489460945129395, -2.1555776596069336, -1.9622093439102173, -1.7688409090042114, -1.5754725933074951, -1.3821041584014893, -1.1887357234954834, -0.9953672885894775, -0.8019989132881165, -0.6086305379867554, -0.4152621030807495, -0.22189366817474365, -0.028525352478027344, 0.16484308242797852, 0.35821104049682617, 0.551579475402832, 0.7449478507041931, 0.9383162260055542, 1.13168466091156, 1.325053095817566, 1.5184214115142822, 1.711789846420288, 1.905158281326294, 2.0985267162323, 2.2918951511383057, 2.4852633476257324, 2.6786317825317383, 2.872000217437744, 3.06536865234375, 3.258737087249756, 3.4521055221557617, 3.6454739570617676, 3.8388423919677734, 4.032210826873779, 4.225579261779785, 4.418947696685791, 4.612316131591797, 4.8056840896606445, 4.999053001403809, 5.1924214363098145, 5.38578987121582, 5.579158306121826, 5.772526741027832, 5.965895175933838, 6.159263610839844, 6.352631568908691, 6.546000003814697]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 11.0, 12.0, 13.0, 15.0, 31.0, 39.0, 51.0, 84.0, 128.0, 172.0, 285.0, 414.0, 649.0, 1028.0, 1636.0, 2735.0, 4914.0, 9382.0, 20586.0, 54150.0, 178128.0, 628150.0, 1424491.0, 1225652.0, 444573.0, 123220.0, 40087.0, 16161.0, 7659.0, 3946.0, 2292.0, 1368.0, 811.0, 516.0, 308.0, 202.0, 129.0, 71.0, 74.0, 37.0, 35.0, 16.0, 8.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.953125, -11.6287841796875, -11.304443359375, -10.9801025390625, -10.65576171875, -10.3314208984375, -10.007080078125, -9.6827392578125, -9.3583984375, -9.0340576171875, -8.709716796875, -8.3853759765625, -8.06103515625, -7.7366943359375, -7.412353515625, -7.0880126953125, -6.763671875, -6.4393310546875, -6.114990234375, -5.7906494140625, -5.46630859375, -5.1419677734375, -4.817626953125, -4.4932861328125, -4.1689453125, -3.8446044921875, -3.520263671875, -3.1959228515625, -2.87158203125, -2.5472412109375, -2.222900390625, -1.8985595703125, -1.57421875, -1.2498779296875, -0.925537109375, -0.6011962890625, -0.27685546875, 0.0474853515625, 0.371826171875, 0.6961669921875, 1.0205078125, 1.3448486328125, 1.669189453125, 1.9935302734375, 2.31787109375, 2.6422119140625, 2.966552734375, 3.2908935546875, 3.615234375, 3.9395751953125, 4.263916015625, 4.5882568359375, 4.91259765625, 5.2369384765625, 5.561279296875, 5.8856201171875, 6.2099609375, 6.5343017578125, 6.858642578125, 7.1829833984375, 7.50732421875, 7.8316650390625, 8.156005859375, 8.4803466796875, 8.8046875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 6.0, 13.0, 8.0, 6.0, 15.0, 20.0, 23.0, 25.0, 32.0, 32.0, 26.0, 42.0, 41.0, 31.0, 43.0, 38.0, 43.0, 47.0, 42.0, 35.0, 53.0, 41.0, 32.0, 37.0, 42.0, 35.0, 34.0, 25.0, 20.0, 18.0, 16.0, 10.0, 17.0, 7.0, 9.0, 5.0, 8.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.28729248046875, -5.1175537109375, -4.94781494140625, -4.778076171875, -4.60833740234375, -4.4385986328125, -4.26885986328125, -4.09912109375, -3.92938232421875, -3.7596435546875, -3.58990478515625, -3.420166015625, -3.25042724609375, -3.0806884765625, -2.91094970703125, -2.7412109375, -2.57147216796875, -2.4017333984375, -2.23199462890625, -2.062255859375, -1.89251708984375, -1.7227783203125, -1.55303955078125, -1.38330078125, -1.21356201171875, -1.0438232421875, -0.87408447265625, -0.704345703125, -0.53460693359375, -0.3648681640625, -0.19512939453125, -0.025390625, 0.14434814453125, 0.3140869140625, 0.48382568359375, 0.653564453125, 0.82330322265625, 0.9930419921875, 1.16278076171875, 1.33251953125, 1.50225830078125, 1.6719970703125, 1.84173583984375, 2.011474609375, 2.18121337890625, 2.3509521484375, 2.52069091796875, 2.6904296875, 2.86016845703125, 3.0299072265625, 3.19964599609375, 3.369384765625, 3.53912353515625, 3.7088623046875, 3.87860107421875, 4.04833984375, 4.21807861328125, 4.3878173828125, 4.55755615234375, 4.727294921875, 4.89703369140625, 5.0667724609375, 5.23651123046875, 5.40625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 11.0, 6.0, 13.0, 19.0, 33.0, 53.0, 80.0, 104.0, 124.0, 223.0, 323.0, 423.0, 660.0, 953.0, 1472.0, 2446.0, 3773.0, 6128.0, 10027.0, 17870.0, 33924.0, 70689.0, 160794.0, 383023.0, 822360.0, 1153790.0, 827577.0, 384920.0, 162087.0, 70958.0, 34563.0, 17974.0, 10248.0, 5965.0, 3708.0, 2365.0, 1585.0, 978.0, 636.0, 446.0, 305.0, 192.0, 125.0, 99.0, 78.0, 43.0, 41.0, 28.0, 11.0, 11.0, 7.0, 7.0, 3.0, 0.0, 4.0, 2.0], "bins": [-9.3125, -9.0345458984375, -8.756591796875, -8.4786376953125, -8.20068359375, -7.9227294921875, -7.644775390625, -7.3668212890625, -7.0888671875, -6.8109130859375, -6.532958984375, -6.2550048828125, -5.97705078125, -5.6990966796875, -5.421142578125, -5.1431884765625, -4.865234375, -4.5872802734375, -4.309326171875, -4.0313720703125, -3.75341796875, -3.4754638671875, -3.197509765625, -2.9195556640625, -2.6416015625, -2.3636474609375, -2.085693359375, -1.8077392578125, -1.52978515625, -1.2518310546875, -0.973876953125, -0.6959228515625, -0.41796875, -0.1400146484375, 0.137939453125, 0.4158935546875, 0.69384765625, 0.9718017578125, 1.249755859375, 1.5277099609375, 1.8056640625, 2.0836181640625, 2.361572265625, 2.6395263671875, 2.91748046875, 3.1954345703125, 3.473388671875, 3.7513427734375, 4.029296875, 4.3072509765625, 4.585205078125, 4.8631591796875, 5.14111328125, 5.4190673828125, 5.697021484375, 5.9749755859375, 6.2529296875, 6.5308837890625, 6.808837890625, 7.0867919921875, 7.36474609375, 7.6427001953125, 7.920654296875, 8.1986083984375, 8.4765625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 7.0, 6.0, 8.0, 13.0, 24.0, 35.0, 39.0, 36.0, 58.0, 79.0, 121.0, 150.0, 157.0, 243.0, 271.0, 328.0, 357.0, 306.0, 360.0, 318.0, 283.0, 193.0, 157.0, 127.0, 110.0, 76.0, 60.0, 29.0, 26.0, 23.0, 26.0, 16.0, 9.0, 6.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.60546875, -3.50653076171875, -3.4075927734375, -3.30865478515625, -3.209716796875, -3.11077880859375, -3.0118408203125, -2.91290283203125, -2.81396484375, -2.71502685546875, -2.6160888671875, -2.51715087890625, -2.418212890625, -2.31927490234375, -2.2203369140625, -2.12139892578125, -2.0224609375, -1.92352294921875, -1.8245849609375, -1.72564697265625, -1.626708984375, -1.52777099609375, -1.4288330078125, -1.32989501953125, -1.23095703125, -1.13201904296875, -1.0330810546875, -0.93414306640625, -0.835205078125, -0.73626708984375, -0.6373291015625, -0.53839111328125, -0.439453125, -0.34051513671875, -0.2415771484375, -0.14263916015625, -0.043701171875, 0.05523681640625, 0.1541748046875, 0.25311279296875, 0.35205078125, 0.45098876953125, 0.5499267578125, 0.64886474609375, 0.747802734375, 0.84674072265625, 0.9456787109375, 1.04461669921875, 1.1435546875, 1.24249267578125, 1.3414306640625, 1.44036865234375, 1.539306640625, 1.63824462890625, 1.7371826171875, 1.83612060546875, 1.93505859375, 2.03399658203125, 2.1329345703125, 2.23187255859375, 2.330810546875, 2.42974853515625, 2.5286865234375, 2.62762451171875, 2.7265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 6.0, 6.0, 10.0, 1.0, 11.0, 11.0, 9.0, 20.0, 17.0, 29.0, 22.0, 35.0, 46.0, 49.0, 47.0, 48.0, 51.0, 71.0, 59.0, 58.0, 53.0, 43.0, 45.0, 36.0, 35.0, 36.0, 41.0, 14.0, 21.0, 19.0, 12.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.937065124511719, -5.70990514755249, -5.4827446937561035, -5.255584716796875, -5.028424263000488, -4.80126428604126, -4.574104309082031, -4.3469438552856445, -4.119783878326416, -3.8926236629486084, -3.665463447570801, -3.4383034706115723, -3.2111432552337646, -2.983983039855957, -2.7568228244781494, -2.529662609100342, -2.302502393722534, -2.0753421783447266, -1.8481820821762085, -1.6210218667984009, -1.3938617706298828, -1.1667015552520752, -0.9395413398742676, -0.7123812437057495, -0.4852210283279419, -0.25806087255477905, -0.030900686979293823, 0.1962594985961914, 0.42341965436935425, 0.6505798101425171, 0.8777400255203247, 1.1049001216888428, 1.3320603370666504, 1.559220552444458, 1.786380648612976, 2.013540744781494, 2.2407009601593018, 2.4678611755371094, 2.695021390914917, 2.9221816062927246, 3.149341583251953, 3.3765017986297607, 3.6036620140075684, 3.830821990966797, 4.057982444763184, 4.285142421722412, 4.512302398681641, 4.739462852478027, 4.966623306274414, 5.193783283233643, 5.420943737030029, 5.648103713989258, 5.8752641677856445, 6.102424144744873, 6.329584121704102, 6.556744575500488, 6.783904552459717, 7.011064529418945, 7.238224983215332, 7.4653849601745605, 7.692545413970947, 7.919705390930176, 8.146865844726562, 8.374025344848633, 8.60118579864502]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 11.0, 8.0, 7.0, 8.0, 10.0, 13.0, 18.0, 22.0, 22.0, 21.0, 23.0, 31.0, 30.0, 34.0, 27.0, 39.0, 41.0, 39.0, 35.0, 43.0, 41.0, 30.0, 36.0, 53.0, 36.0, 30.0, 33.0, 32.0, 31.0, 21.0, 24.0, 28.0, 20.0, 21.0, 16.0, 11.0, 8.0, 5.0, 9.0, 5.0, 9.0, 4.0, 1.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.409823894500732, -5.24122953414917, -5.072634696960449, -4.904040336608887, -4.735445976257324, -4.5668511390686035, -4.398256778717041, -4.22966194152832, -4.061067581176758, -3.892472982406616, -3.7238783836364746, -3.555284023284912, -3.3866894245147705, -3.218094825744629, -3.0495004653930664, -2.880905866622925, -2.712311267852783, -2.5437166690826416, -2.3751220703125, -2.2065277099609375, -2.037933111190796, -1.8693385124206543, -1.7007440328598022, -1.5321495532989502, -1.3635549545288086, -1.194960355758667, -1.026365876197815, -0.8577713370323181, -0.6891767978668213, -0.5205822587013245, -0.35198771953582764, -0.18339323997497559, -0.014799118041992188, 0.15379542112350464, 0.32238996028900146, 0.4909844994544983, 0.6595790386199951, 0.8281735777854919, 0.9967681169509888, 1.1653625965118408, 1.3339571952819824, 1.502551794052124, 1.671146273612976, 1.8397407531738281, 2.0083353519439697, 2.1769299507141113, 2.345524311065674, 2.5141189098358154, 2.682713508605957, 2.8513081073760986, 3.0199027061462402, 3.1884970664978027, 3.3570916652679443, 3.525686264038086, 3.6942806243896484, 3.86287522315979, 4.031469821929932, 4.200064182281494, 4.368659019470215, 4.537253379821777, 4.70584774017334, 4.8744425773620605, 5.043036937713623, 5.211631774902344, 5.380226135253906]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 5.0, 6.0, 11.0, 17.0, 28.0, 49.0, 65.0, 90.0, 167.0, 235.0, 373.0, 534.0, 909.0, 1448.0, 2230.0, 3453.0, 5289.0, 8446.0, 13540.0, 21607.0, 35535.0, 57158.0, 89479.0, 129576.0, 160367.0, 158427.0, 126270.0, 87080.0, 55405.0, 34442.0, 21058.0, 12758.0, 8004.0, 5189.0, 3318.0, 2101.0, 1357.0, 879.0, 591.0, 359.0, 252.0, 160.0, 120.0, 57.0, 39.0, 34.0, 20.0, 9.0, 6.0, 2.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.330078125, -1.2871246337890625, -1.244171142578125, -1.2012176513671875, -1.15826416015625, -1.1153106689453125, -1.072357177734375, -1.0294036865234375, -0.9864501953125, -0.9434967041015625, -0.900543212890625, -0.8575897216796875, -0.81463623046875, -0.7716827392578125, -0.728729248046875, -0.6857757568359375, -0.642822265625, -0.5998687744140625, -0.556915283203125, -0.5139617919921875, -0.47100830078125, -0.4280548095703125, -0.385101318359375, -0.3421478271484375, -0.2991943359375, -0.2562408447265625, -0.213287353515625, -0.1703338623046875, -0.12738037109375, -0.0844268798828125, -0.041473388671875, 0.0014801025390625, 0.04443359375, 0.0873870849609375, 0.130340576171875, 0.1732940673828125, 0.21624755859375, 0.2592010498046875, 0.302154541015625, 0.3451080322265625, 0.3880615234375, 0.4310150146484375, 0.473968505859375, 0.5169219970703125, 0.55987548828125, 0.6028289794921875, 0.645782470703125, 0.6887359619140625, 0.731689453125, 0.7746429443359375, 0.817596435546875, 0.8605499267578125, 0.90350341796875, 0.9464569091796875, 0.989410400390625, 1.0323638916015625, 1.0753173828125, 1.1182708740234375, 1.161224365234375, 1.2041778564453125, 1.24713134765625, 1.2900848388671875, 1.333038330078125, 1.3759918212890625, 1.4189453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 4.0, 7.0, 3.0, 9.0, 6.0, 9.0, 12.0, 8.0, 20.0, 19.0, 15.0, 25.0, 27.0, 22.0, 23.0, 25.0, 35.0, 30.0, 33.0, 34.0, 38.0, 44.0, 35.0, 34.0, 47.0, 34.0, 32.0, 33.0, 30.0, 27.0, 28.0, 29.0, 26.0, 23.0, 25.0, 22.0, 17.0, 21.0, 17.0, 15.0, 7.0, 4.0, 10.0, 7.0, 6.0, 10.0, 6.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0], "bins": [-5.64453125, -5.4791259765625, -5.313720703125, -5.1483154296875, -4.98291015625, -4.8175048828125, -4.652099609375, -4.4866943359375, -4.3212890625, -4.1558837890625, -3.990478515625, -3.8250732421875, -3.65966796875, -3.4942626953125, -3.328857421875, -3.1634521484375, -2.998046875, -2.8326416015625, -2.667236328125, -2.5018310546875, -2.33642578125, -2.1710205078125, -2.005615234375, -1.8402099609375, -1.6748046875, -1.5093994140625, -1.343994140625, -1.1785888671875, -1.01318359375, -0.8477783203125, -0.682373046875, -0.5169677734375, -0.3515625, -0.1861572265625, -0.020751953125, 0.1446533203125, 0.31005859375, 0.4754638671875, 0.640869140625, 0.8062744140625, 0.9716796875, 1.1370849609375, 1.302490234375, 1.4678955078125, 1.63330078125, 1.7987060546875, 1.964111328125, 2.1295166015625, 2.294921875, 2.4603271484375, 2.625732421875, 2.7911376953125, 2.95654296875, 3.1219482421875, 3.287353515625, 3.4527587890625, 3.6181640625, 3.7835693359375, 3.948974609375, 4.1143798828125, 4.27978515625, 4.4451904296875, 4.610595703125, 4.7760009765625, 4.94140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 13.0, 13.0, 12.0, 21.0, 36.0, 32.0, 58.0, 57.0, 98.0, 133.0, 207.0, 267.0, 436.0, 628.0, 902.0, 1439.0, 2175.0, 3398.0, 5341.0, 8712.0, 14852.0, 27323.0, 128123.0, 743768.0, 55753.0, 21851.0, 12245.0, 7245.0, 4523.0, 2991.0, 1908.0, 1217.0, 839.0, 580.0, 389.0, 270.0, 200.0, 132.0, 85.0, 81.0, 48.0, 48.0, 26.0, 26.0, 13.0, 16.0, 7.0, 9.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8828125, -3.75042724609375, -3.6180419921875, -3.48565673828125, -3.353271484375, -3.22088623046875, -3.0885009765625, -2.95611572265625, -2.82373046875, -2.69134521484375, -2.5589599609375, -2.42657470703125, -2.294189453125, -2.16180419921875, -2.0294189453125, -1.89703369140625, -1.7646484375, -1.63226318359375, -1.4998779296875, -1.36749267578125, -1.235107421875, -1.10272216796875, -0.9703369140625, -0.83795166015625, -0.70556640625, -0.57318115234375, -0.4407958984375, -0.30841064453125, -0.176025390625, -0.04364013671875, 0.0887451171875, 0.22113037109375, 0.353515625, 0.48590087890625, 0.6182861328125, 0.75067138671875, 0.883056640625, 1.01544189453125, 1.1478271484375, 1.28021240234375, 1.41259765625, 1.54498291015625, 1.6773681640625, 1.80975341796875, 1.942138671875, 2.07452392578125, 2.2069091796875, 2.33929443359375, 2.4716796875, 2.60406494140625, 2.7364501953125, 2.86883544921875, 3.001220703125, 3.13360595703125, 3.2659912109375, 3.39837646484375, 3.53076171875, 3.66314697265625, 3.7955322265625, 3.92791748046875, 4.060302734375, 4.19268798828125, 4.3250732421875, 4.45745849609375, 4.58984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 6.0, 10.0, 5.0, 12.0, 12.0, 13.0, 13.0, 21.0, 16.0, 22.0, 17.0, 35.0, 35.0, 44.0, 43.0, 41.0, 44.0, 40.0, 28.0, 46.0, 52.0, 37.0, 53.0, 43.0, 45.0, 40.0, 44.0, 33.0, 24.0, 24.0, 13.0, 20.0, 9.0, 11.0, 9.0, 16.0, 3.0, 4.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.20703125, -5.05267333984375, -4.8983154296875, -4.74395751953125, -4.589599609375, -4.43524169921875, -4.2808837890625, -4.12652587890625, -3.97216796875, -3.81781005859375, -3.6634521484375, -3.50909423828125, -3.354736328125, -3.20037841796875, -3.0460205078125, -2.89166259765625, -2.7373046875, -2.58294677734375, -2.4285888671875, -2.27423095703125, -2.119873046875, -1.96551513671875, -1.8111572265625, -1.65679931640625, -1.50244140625, -1.34808349609375, -1.1937255859375, -1.03936767578125, -0.885009765625, -0.73065185546875, -0.5762939453125, -0.42193603515625, -0.267578125, -0.11322021484375, 0.0411376953125, 0.19549560546875, 0.349853515625, 0.50421142578125, 0.6585693359375, 0.81292724609375, 0.96728515625, 1.12164306640625, 1.2760009765625, 1.43035888671875, 1.584716796875, 1.73907470703125, 1.8934326171875, 2.04779052734375, 2.2021484375, 2.35650634765625, 2.5108642578125, 2.66522216796875, 2.819580078125, 2.97393798828125, 3.1282958984375, 3.28265380859375, 3.43701171875, 3.59136962890625, 3.7457275390625, 3.90008544921875, 4.054443359375, 4.20880126953125, 4.3631591796875, 4.51751708984375, 4.671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 12.0, 8.0, 25.0, 19.0, 36.0, 59.0, 73.0, 100.0, 155.0, 254.0, 325.0, 487.0, 725.0, 1238.0, 1908.0, 3469.0, 6481.0, 13892.0, 40473.0, 765461.0, 167048.0, 24132.0, 9936.0, 4900.0, 2782.0, 1574.0, 1067.0, 616.0, 399.0, 269.0, 186.0, 115.0, 94.0, 60.0, 45.0, 33.0, 20.0, 17.0, 10.0, 6.0, 10.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.86474609375, -0.835723876953125, -0.80670166015625, -0.777679443359375, -0.7486572265625, -0.719635009765625, -0.69061279296875, -0.661590576171875, -0.632568359375, -0.603546142578125, -0.57452392578125, -0.545501708984375, -0.5164794921875, -0.487457275390625, -0.45843505859375, -0.429412841796875, -0.400390625, -0.371368408203125, -0.34234619140625, -0.313323974609375, -0.2843017578125, -0.255279541015625, -0.22625732421875, -0.197235107421875, -0.168212890625, -0.139190673828125, -0.11016845703125, -0.081146240234375, -0.0521240234375, -0.023101806640625, 0.00592041015625, 0.034942626953125, 0.06396484375, 0.092987060546875, 0.12200927734375, 0.151031494140625, 0.1800537109375, 0.209075927734375, 0.23809814453125, 0.267120361328125, 0.296142578125, 0.325164794921875, 0.35418701171875, 0.383209228515625, 0.4122314453125, 0.441253662109375, 0.47027587890625, 0.499298095703125, 0.5283203125, 0.557342529296875, 0.58636474609375, 0.615386962890625, 0.6444091796875, 0.673431396484375, 0.70245361328125, 0.731475830078125, 0.760498046875, 0.789520263671875, 0.81854248046875, 0.847564697265625, 0.8765869140625, 0.905609130859375, 0.93463134765625, 0.963653564453125, 0.99267578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 5.0, 8.0, 10.0, 17.0, 16.0, 20.0, 19.0, 24.0, 36.0, 50.0, 49.0, 58.0, 87.0, 81.0, 87.0, 73.0, 58.0, 64.0, 40.0, 30.0, 34.0, 27.0, 20.0, 18.0, 21.0, 14.0, 5.0, 6.0, 5.0, 1.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.705522537231445e-05, -6.528384983539581e-05, -6.351247429847717e-05, -6.174109876155853e-05, -5.996972322463989e-05, -5.819834768772125e-05, -5.642697215080261e-05, -5.465559661388397e-05, -5.288422107696533e-05, -5.111284554004669e-05, -4.934147000312805e-05, -4.757009446620941e-05, -4.579871892929077e-05, -4.402734339237213e-05, -4.225596785545349e-05, -4.048459231853485e-05, -3.871321678161621e-05, -3.694184124469757e-05, -3.517046570777893e-05, -3.339909017086029e-05, -3.162771463394165e-05, -2.985633909702301e-05, -2.808496356010437e-05, -2.631358802318573e-05, -2.454221248626709e-05, -2.277083694934845e-05, -2.099946141242981e-05, -1.922808587551117e-05, -1.745671033859253e-05, -1.568533480167389e-05, -1.3913959264755249e-05, -1.2142583727836609e-05, -1.0371208190917969e-05, -8.599832653999329e-06, -6.8284571170806885e-06, -5.057081580162048e-06, -3.285706043243408e-06, -1.514330506324768e-06, 2.5704503059387207e-07, 2.028420567512512e-06, 3.7997961044311523e-06, 5.5711716413497925e-06, 7.342547178268433e-06, 9.113922715187073e-06, 1.0885298252105713e-05, 1.2656673789024353e-05, 1.4428049325942993e-05, 1.6199424862861633e-05, 1.7970800399780273e-05, 1.9742175936698914e-05, 2.1513551473617554e-05, 2.3284927010536194e-05, 2.5056302547454834e-05, 2.6827678084373474e-05, 2.8599053621292114e-05, 3.0370429158210754e-05, 3.2141804695129395e-05, 3.3913180232048035e-05, 3.5684555768966675e-05, 3.7455931305885315e-05, 3.9227306842803955e-05, 4.0998682379722595e-05, 4.2770057916641235e-05, 4.4541433453559875e-05, 4.6312808990478516e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 9.0, 11.0, 21.0, 19.0, 33.0, 41.0, 78.0, 118.0, 144.0, 235.0, 300.0, 472.0, 684.0, 978.0, 1487.0, 2144.0, 3516.0, 5644.0, 9357.0, 16025.0, 30348.0, 60696.0, 126711.0, 231521.0, 251536.0, 150349.0, 73058.0, 35988.0, 19010.0, 10347.0, 6215.0, 3992.0, 2471.0, 1603.0, 1088.0, 686.0, 481.0, 393.0, 237.0, 164.0, 124.0, 61.0, 51.0, 27.0, 20.0, 22.0, 14.0, 10.0, 9.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0], "bins": [-0.63671875, -0.6168975830078125, -0.597076416015625, -0.5772552490234375, -0.55743408203125, -0.5376129150390625, -0.517791748046875, -0.4979705810546875, -0.4781494140625, -0.4583282470703125, -0.438507080078125, -0.4186859130859375, -0.39886474609375, -0.3790435791015625, -0.359222412109375, -0.3394012451171875, -0.319580078125, -0.2997589111328125, -0.279937744140625, -0.2601165771484375, -0.24029541015625, -0.2204742431640625, -0.200653076171875, -0.1808319091796875, -0.1610107421875, -0.1411895751953125, -0.121368408203125, -0.1015472412109375, -0.08172607421875, -0.0619049072265625, -0.042083740234375, -0.0222625732421875, -0.00244140625, 0.0173797607421875, 0.037200927734375, 0.0570220947265625, 0.07684326171875, 0.0966644287109375, 0.116485595703125, 0.1363067626953125, 0.1561279296875, 0.1759490966796875, 0.195770263671875, 0.2155914306640625, 0.23541259765625, 0.2552337646484375, 0.275054931640625, 0.2948760986328125, 0.314697265625, 0.3345184326171875, 0.354339599609375, 0.3741607666015625, 0.39398193359375, 0.4138031005859375, 0.433624267578125, 0.4534454345703125, 0.4732666015625, 0.4930877685546875, 0.512908935546875, 0.5327301025390625, 0.55255126953125, 0.5723724365234375, 0.592193603515625, 0.6120147705078125, 0.6318359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 0.0, 4.0, 3.0, 3.0, 8.0, 3.0, 9.0, 9.0, 11.0, 18.0, 6.0, 10.0, 17.0, 20.0, 28.0, 22.0, 40.0, 29.0, 54.0, 70.0, 72.0, 72.0, 89.0, 66.0, 50.0, 60.0, 50.0, 32.0, 22.0, 14.0, 12.0, 14.0, 13.0, 11.0, 9.0, 14.0, 9.0, 11.0, 3.0, 1.0, 1.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.159912109375, -0.1543731689453125, -0.148834228515625, -0.1432952880859375, -0.13775634765625, -0.1322174072265625, -0.126678466796875, -0.1211395263671875, -0.1156005859375, -0.1100616455078125, -0.104522705078125, -0.0989837646484375, -0.09344482421875, -0.0879058837890625, -0.082366943359375, -0.0768280029296875, -0.0712890625, -0.0657501220703125, -0.060211181640625, -0.0546722412109375, -0.04913330078125, -0.0435943603515625, -0.038055419921875, -0.0325164794921875, -0.0269775390625, -0.0214385986328125, -0.015899658203125, -0.0103607177734375, -0.00482177734375, 0.0007171630859375, 0.006256103515625, 0.0117950439453125, 0.017333984375, 0.0228729248046875, 0.028411865234375, 0.0339508056640625, 0.03948974609375, 0.0450286865234375, 0.050567626953125, 0.0561065673828125, 0.0616455078125, 0.0671844482421875, 0.072723388671875, 0.0782623291015625, 0.08380126953125, 0.0893402099609375, 0.094879150390625, 0.1004180908203125, 0.10595703125, 0.1114959716796875, 0.117034912109375, 0.1225738525390625, 0.12811279296875, 0.1336517333984375, 0.139190673828125, 0.1447296142578125, 0.1502685546875, 0.1558074951171875, 0.161346435546875, 0.1668853759765625, 0.17242431640625, 0.1779632568359375, 0.183502197265625, 0.1890411376953125, 0.194580078125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 6.0, 4.0, 8.0, 3.0, 10.0, 6.0, 5.0, 10.0, 13.0, 18.0, 15.0, 31.0, 16.0, 33.0, 38.0, 53.0, 48.0, 37.0, 61.0, 57.0, 61.0, 54.0, 60.0, 51.0, 34.0, 35.0, 42.0, 46.0, 25.0, 34.0, 15.0, 16.0, 20.0, 11.0, 9.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.636909484863281, -5.4160919189453125, -5.195274353027344, -4.974456787109375, -4.7536396980285645, -4.532822132110596, -4.312004566192627, -4.091187000274658, -3.8703694343566895, -3.6495518684387207, -3.428734540939331, -3.2079169750213623, -2.9870994091033936, -2.766282081604004, -2.545464515686035, -2.3246469497680664, -2.1038296222686768, -1.8830121755599976, -1.6621946096420288, -1.4413771629333496, -1.2205595970153809, -0.9997421503067017, -0.7789247035980225, -0.5581071376800537, -0.3372896909713745, -0.11647219955921173, 0.10434529185295105, 0.32516276836395264, 0.5459802746772766, 0.7667977809906006, 0.9876152276992798, 1.2084327936172485, 1.4292502403259277, 1.650067687034607, 1.8708852529525757, 2.091702699661255, 2.3125202655792236, 2.5333375930786133, 2.754155158996582, 2.974972724914551, 3.1957902908325195, 3.4166078567504883, 3.637425184249878, 3.8582427501678467, 4.079060077667236, 4.299877643585205, 4.520695209503174, 4.741512775421143, 4.962329864501953, 5.183147430419922, 5.403964996337891, 5.624782562255859, 5.84559965133667, 6.066417217254639, 6.287234783172607, 6.508052349090576, 6.728869915008545, 6.949687480926514, 7.170505046844482, 7.391322135925293, 7.612139701843262, 7.8329572677612305, 8.0537748336792, 8.274592399597168, 8.495409965515137]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 8.0, 7.0, 11.0, 7.0, 12.0, 20.0, 23.0, 24.0, 17.0, 30.0, 31.0, 25.0, 30.0, 31.0, 44.0, 35.0, 40.0, 42.0, 36.0, 41.0, 33.0, 36.0, 44.0, 37.0, 32.0, 33.0, 32.0, 27.0, 25.0, 24.0, 21.0, 23.0, 22.0, 17.0, 11.0, 8.0, 7.0, 4.0, 9.0, 9.0, 4.0, 3.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.290039539337158, -5.124873638153076, -4.959707736968994, -4.794541358947754, -4.629375457763672, -4.46420955657959, -4.299043655395508, -4.133877754211426, -3.9687116146087646, -3.8035457134246826, -3.6383795738220215, -3.4732136726379395, -3.3080477714538574, -3.1428816318511963, -2.9777157306671143, -2.812549591064453, -2.647383689880371, -2.482217788696289, -2.317051649093628, -2.151885747909546, -1.9867197275161743, -1.8215537071228027, -1.6563878059387207, -1.4912217855453491, -1.3260557651519775, -1.160889744758606, -0.9957237839698792, -0.8305578231811523, -0.6653918027877808, -0.5002257823944092, -0.3350598216056824, -0.16989386081695557, -0.004727840423583984, 0.1604381501674652, 0.3256041407585144, 0.4907701313495636, 0.6559361219406128, 0.8211021423339844, 0.9862681031227112, 1.151434063911438, 1.3166000843048096, 1.4817661046981812, 1.6469321250915527, 1.8120980262756348, 1.9772640466690063, 2.142430067062378, 2.30759596824646, 2.472762107849121, 2.637928009033203, 2.803093910217285, 2.9682600498199463, 3.1334259510040283, 3.2985920906066895, 3.4637579917907715, 3.6289238929748535, 3.7940897941589355, 3.9592559337615967, 4.124422073364258, 4.28958797454834, 4.454753875732422, 4.619919776916504, 4.785085678100586, 4.950252056121826, 5.115417957305908, 5.28058385848999]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 10.0, 13.0, 8.0, 27.0, 32.0, 55.0, 89.0, 99.0, 173.0, 261.0, 393.0, 631.0, 907.0, 1375.0, 2357.0, 3627.0, 5909.0, 9633.0, 16070.0, 26924.0, 44737.0, 72483.0, 108297.0, 142655.0, 158538.0, 145405.0, 112526.0, 75711.0, 47335.0, 28268.0, 17000.0, 10275.0, 6150.0, 3747.0, 2402.0, 1536.0, 1030.0, 640.0, 424.0, 299.0, 181.0, 123.0, 85.0, 36.0, 30.0, 19.0, 13.0, 10.0, 9.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6796875, -4.54022216796875, -4.4007568359375, -4.26129150390625, -4.121826171875, -3.98236083984375, -3.8428955078125, -3.70343017578125, -3.56396484375, -3.42449951171875, -3.2850341796875, -3.14556884765625, -3.006103515625, -2.86663818359375, -2.7271728515625, -2.58770751953125, -2.4482421875, -2.30877685546875, -2.1693115234375, -2.02984619140625, -1.890380859375, -1.75091552734375, -1.6114501953125, -1.47198486328125, -1.33251953125, -1.19305419921875, -1.0535888671875, -0.91412353515625, -0.774658203125, -0.63519287109375, -0.4957275390625, -0.35626220703125, -0.216796875, -0.07733154296875, 0.0621337890625, 0.20159912109375, 0.341064453125, 0.48052978515625, 0.6199951171875, 0.75946044921875, 0.89892578125, 1.03839111328125, 1.1778564453125, 1.31732177734375, 1.456787109375, 1.59625244140625, 1.7357177734375, 1.87518310546875, 2.0146484375, 2.15411376953125, 2.2935791015625, 2.43304443359375, 2.572509765625, 2.71197509765625, 2.8514404296875, 2.99090576171875, 3.13037109375, 3.26983642578125, 3.4093017578125, 3.54876708984375, 3.688232421875, 3.82769775390625, 3.9671630859375, 4.10662841796875, 4.24609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 9.0, 4.0, 8.0, 12.0, 10.0, 9.0, 19.0, 21.0, 32.0, 25.0, 17.0, 25.0, 34.0, 36.0, 35.0, 27.0, 33.0, 37.0, 39.0, 43.0, 33.0, 45.0, 46.0, 36.0, 46.0, 33.0, 34.0, 35.0, 21.0, 17.0, 20.0, 27.0, 20.0, 20.0, 13.0, 7.0, 13.0, 13.0, 7.0, 6.0, 7.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0], "bins": [-5.921875, -5.75360107421875, -5.5853271484375, -5.41705322265625, -5.248779296875, -5.08050537109375, -4.9122314453125, -4.74395751953125, -4.57568359375, -4.40740966796875, -4.2391357421875, -4.07086181640625, -3.902587890625, -3.73431396484375, -3.5660400390625, -3.39776611328125, -3.2294921875, -3.06121826171875, -2.8929443359375, -2.72467041015625, -2.556396484375, -2.38812255859375, -2.2198486328125, -2.05157470703125, -1.88330078125, -1.71502685546875, -1.5467529296875, -1.37847900390625, -1.210205078125, -1.04193115234375, -0.8736572265625, -0.70538330078125, -0.537109375, -0.36883544921875, -0.2005615234375, -0.03228759765625, 0.135986328125, 0.30426025390625, 0.4725341796875, 0.64080810546875, 0.80908203125, 0.97735595703125, 1.1456298828125, 1.31390380859375, 1.482177734375, 1.65045166015625, 1.8187255859375, 1.98699951171875, 2.1552734375, 2.32354736328125, 2.4918212890625, 2.66009521484375, 2.828369140625, 2.99664306640625, 3.1649169921875, 3.33319091796875, 3.50146484375, 3.66973876953125, 3.8380126953125, 4.00628662109375, 4.174560546875, 4.34283447265625, 4.5111083984375, 4.67938232421875, 4.84765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 11.0, 19.0, 24.0, 38.0, 58.0, 87.0, 140.0, 198.0, 320.0, 514.0, 797.0, 1278.0, 1938.0, 3111.0, 5043.0, 7889.0, 12931.0, 21252.0, 34087.0, 54560.0, 82729.0, 114839.0, 142178.0, 148811.0, 130963.0, 100213.0, 68474.0, 43783.0, 27505.0, 17061.0, 10393.0, 6432.0, 3965.0, 2477.0, 1620.0, 1020.0, 651.0, 393.0, 246.0, 158.0, 115.0, 83.0, 66.0, 14.0, 24.0, 14.0, 11.0, 8.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4375, -4.2908935546875, -4.144287109375, -3.9976806640625, -3.85107421875, -3.7044677734375, -3.557861328125, -3.4112548828125, -3.2646484375, -3.1180419921875, -2.971435546875, -2.8248291015625, -2.67822265625, -2.5316162109375, -2.385009765625, -2.2384033203125, -2.091796875, -1.9451904296875, -1.798583984375, -1.6519775390625, -1.50537109375, -1.3587646484375, -1.212158203125, -1.0655517578125, -0.9189453125, -0.7723388671875, -0.625732421875, -0.4791259765625, -0.33251953125, -0.1859130859375, -0.039306640625, 0.1072998046875, 0.25390625, 0.4005126953125, 0.547119140625, 0.6937255859375, 0.84033203125, 0.9869384765625, 1.133544921875, 1.2801513671875, 1.4267578125, 1.5733642578125, 1.719970703125, 1.8665771484375, 2.01318359375, 2.1597900390625, 2.306396484375, 2.4530029296875, 2.599609375, 2.7462158203125, 2.892822265625, 3.0394287109375, 3.18603515625, 3.3326416015625, 3.479248046875, 3.6258544921875, 3.7724609375, 3.9190673828125, 4.065673828125, 4.2122802734375, 4.35888671875, 4.5054931640625, 4.652099609375, 4.7987060546875, 4.9453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 10.0, 6.0, 12.0, 21.0, 16.0, 20.0, 20.0, 21.0, 25.0, 30.0, 25.0, 22.0, 28.0, 43.0, 32.0, 33.0, 40.0, 18.0, 35.0, 43.0, 34.0, 26.0, 39.0, 29.0, 39.0, 39.0, 29.0, 28.0, 23.0, 29.0, 28.0, 19.0, 22.0, 12.0, 15.0, 7.0, 13.0, 8.0, 7.0, 9.0, 5.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 4.0, 2.0], "bins": [-3.537109375, -3.43609619140625, -3.3350830078125, -3.23406982421875, -3.133056640625, -3.03204345703125, -2.9310302734375, -2.83001708984375, -2.72900390625, -2.62799072265625, -2.5269775390625, -2.42596435546875, -2.324951171875, -2.22393798828125, -2.1229248046875, -2.02191162109375, -1.9208984375, -1.81988525390625, -1.7188720703125, -1.61785888671875, -1.516845703125, -1.41583251953125, -1.3148193359375, -1.21380615234375, -1.11279296875, -1.01177978515625, -0.9107666015625, -0.80975341796875, -0.708740234375, -0.60772705078125, -0.5067138671875, -0.40570068359375, -0.3046875, -0.20367431640625, -0.1026611328125, -0.00164794921875, 0.099365234375, 0.20037841796875, 0.3013916015625, 0.40240478515625, 0.50341796875, 0.60443115234375, 0.7054443359375, 0.80645751953125, 0.907470703125, 1.00848388671875, 1.1094970703125, 1.21051025390625, 1.3115234375, 1.41253662109375, 1.5135498046875, 1.61456298828125, 1.715576171875, 1.81658935546875, 1.9176025390625, 2.01861572265625, 2.11962890625, 2.22064208984375, 2.3216552734375, 2.42266845703125, 2.523681640625, 2.62469482421875, 2.7257080078125, 2.82672119140625, 2.927734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 9.0, 6.0, 11.0, 22.0, 28.0, 38.0, 57.0, 84.0, 120.0, 201.0, 270.0, 394.0, 531.0, 837.0, 1217.0, 1853.0, 2886.0, 4491.0, 7193.0, 11599.0, 19138.0, 31725.0, 52232.0, 84824.0, 127227.0, 161799.0, 165716.0, 133735.0, 92367.0, 57605.0, 34775.0, 21095.0, 12735.0, 7770.0, 4892.0, 3041.0, 2015.0, 1281.0, 881.0, 579.0, 378.0, 282.0, 196.0, 113.0, 94.0, 63.0, 40.0, 43.0, 28.0, 6.0, 14.0, 6.0, 6.0, 3.0, 6.0, 1.0, 2.0], "bins": [-2.490234375, -2.41497802734375, -2.3397216796875, -2.26446533203125, -2.189208984375, -2.11395263671875, -2.0386962890625, -1.96343994140625, -1.88818359375, -1.81292724609375, -1.7376708984375, -1.66241455078125, -1.587158203125, -1.51190185546875, -1.4366455078125, -1.36138916015625, -1.2861328125, -1.21087646484375, -1.1356201171875, -1.06036376953125, -0.985107421875, -0.90985107421875, -0.8345947265625, -0.75933837890625, -0.68408203125, -0.60882568359375, -0.5335693359375, -0.45831298828125, -0.383056640625, -0.30780029296875, -0.2325439453125, -0.15728759765625, -0.08203125, -0.00677490234375, 0.0684814453125, 0.14373779296875, 0.218994140625, 0.29425048828125, 0.3695068359375, 0.44476318359375, 0.52001953125, 0.59527587890625, 0.6705322265625, 0.74578857421875, 0.821044921875, 0.89630126953125, 0.9715576171875, 1.04681396484375, 1.1220703125, 1.19732666015625, 1.2725830078125, 1.34783935546875, 1.423095703125, 1.49835205078125, 1.5736083984375, 1.64886474609375, 1.72412109375, 1.79937744140625, 1.8746337890625, 1.94989013671875, 2.025146484375, 2.10040283203125, 2.1756591796875, 2.25091552734375, 2.326171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 10.0, 7.0, 16.0, 25.0, 29.0, 41.0, 44.0, 36.0, 70.0, 50.0, 68.0, 61.0, 84.0, 47.0, 76.0, 70.0, 53.0, 44.0, 33.0, 23.0, 18.0, 21.0, 8.0, 9.0, 11.0, 5.0, 2.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022137165069580078, -0.00021263770759105682, -0.00020390376448631287, -0.0001951698213815689, -0.00018643587827682495, -0.000177701935172081, -0.00016896799206733704, -0.00016023404896259308, -0.00015150010585784912, -0.00014276616275310516, -0.0001340322196483612, -0.00012529827654361725, -0.00011656433343887329, -0.00010783039033412933, -9.909644722938538e-05, -9.036250412464142e-05, -8.162856101989746e-05, -7.28946179151535e-05, -6.416067481040955e-05, -5.542673170566559e-05, -4.669278860092163e-05, -3.795884549617767e-05, -2.9224902391433716e-05, -2.0490959286689758e-05, -1.17570161819458e-05, -3.0230730772018433e-06, 5.710870027542114e-06, 1.4444813132286072e-05, 2.317875623703003e-05, 3.191269934177399e-05, 4.0646642446517944e-05, 4.93805855512619e-05, 5.811452865600586e-05, 6.684847176074982e-05, 7.558241486549377e-05, 8.431635797023773e-05, 9.305030107498169e-05, 0.00010178424417972565, 0.0001105181872844696, 0.00011925213038921356, 0.00012798607349395752, 0.00013672001659870148, 0.00014545395970344543, 0.0001541879028081894, 0.00016292184591293335, 0.0001716557890176773, 0.00018038973212242126, 0.00018912367522716522, 0.00019785761833190918, 0.00020659156143665314, 0.0002153255045413971, 0.00022405944764614105, 0.000232793390750885, 0.00024152733385562897, 0.0002502612769603729, 0.0002589952200651169, 0.00026772916316986084, 0.0002764631062746048, 0.00028519704937934875, 0.0002939309924840927, 0.00030266493558883667, 0.00031139887869358063, 0.0003201328217983246, 0.00032886676490306854, 0.0003376007080078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 20.0, 20.0, 28.0, 49.0, 64.0, 90.0, 110.0, 210.0, 264.0, 400.0, 596.0, 792.0, 1312.0, 1909.0, 3200.0, 4898.0, 8251.0, 14057.0, 24484.0, 43174.0, 75640.0, 122797.0, 170361.0, 183632.0, 150835.0, 100409.0, 59201.0, 33599.0, 19008.0, 11047.0, 6599.0, 3956.0, 2558.0, 1594.0, 1121.0, 724.0, 514.0, 315.0, 214.0, 148.0, 101.0, 73.0, 57.0, 42.0, 24.0, 16.0, 4.0, 8.0, 5.0, 0.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.5234375, -2.440093994140625, -2.35675048828125, -2.273406982421875, -2.1900634765625, -2.106719970703125, -2.02337646484375, -1.940032958984375, -1.856689453125, -1.773345947265625, -1.69000244140625, -1.606658935546875, -1.5233154296875, -1.439971923828125, -1.35662841796875, -1.273284912109375, -1.18994140625, -1.106597900390625, -1.02325439453125, -0.939910888671875, -0.8565673828125, -0.773223876953125, -0.68988037109375, -0.606536865234375, -0.523193359375, -0.439849853515625, -0.35650634765625, -0.273162841796875, -0.1898193359375, -0.106475830078125, -0.02313232421875, 0.060211181640625, 0.1435546875, 0.226898193359375, 0.31024169921875, 0.393585205078125, 0.4769287109375, 0.560272216796875, 0.64361572265625, 0.726959228515625, 0.810302734375, 0.893646240234375, 0.97698974609375, 1.060333251953125, 1.1436767578125, 1.227020263671875, 1.31036376953125, 1.393707275390625, 1.47705078125, 1.560394287109375, 1.64373779296875, 1.727081298828125, 1.8104248046875, 1.893768310546875, 1.97711181640625, 2.060455322265625, 2.143798828125, 2.227142333984375, 2.31048583984375, 2.393829345703125, 2.4771728515625, 2.560516357421875, 2.64385986328125, 2.727203369140625, 2.810546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 7.0, 5.0, 5.0, 10.0, 10.0, 16.0, 14.0, 20.0, 20.0, 27.0, 21.0, 30.0, 44.0, 38.0, 37.0, 47.0, 43.0, 51.0, 41.0, 57.0, 58.0, 41.0, 35.0, 43.0, 43.0, 29.0, 34.0, 24.0, 28.0, 23.0, 20.0, 15.0, 8.0, 13.0, 9.0, 4.0, 7.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 3.0], "bins": [-1.0224609375, -0.9961700439453125, -0.969879150390625, -0.9435882568359375, -0.91729736328125, -0.8910064697265625, -0.864715576171875, -0.8384246826171875, -0.8121337890625, -0.7858428955078125, -0.759552001953125, -0.7332611083984375, -0.70697021484375, -0.6806793212890625, -0.654388427734375, -0.6280975341796875, -0.601806640625, -0.5755157470703125, -0.549224853515625, -0.5229339599609375, -0.49664306640625, -0.4703521728515625, -0.444061279296875, -0.4177703857421875, -0.3914794921875, -0.3651885986328125, -0.338897705078125, -0.3126068115234375, -0.28631591796875, -0.2600250244140625, -0.233734130859375, -0.2074432373046875, -0.18115234375, -0.1548614501953125, -0.128570556640625, -0.1022796630859375, -0.07598876953125, -0.0496978759765625, -0.023406982421875, 0.0028839111328125, 0.0291748046875, 0.0554656982421875, 0.081756591796875, 0.1080474853515625, 0.13433837890625, 0.1606292724609375, 0.186920166015625, 0.2132110595703125, 0.239501953125, 0.2657928466796875, 0.292083740234375, 0.3183746337890625, 0.34466552734375, 0.3709564208984375, 0.397247314453125, 0.4235382080078125, 0.4498291015625, 0.4761199951171875, 0.502410888671875, 0.5287017822265625, 0.55499267578125, 0.5812835693359375, 0.607574462890625, 0.6338653564453125, 0.66015625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 9.0, 10.0, 3.0, 6.0, 19.0, 15.0, 15.0, 24.0, 23.0, 26.0, 27.0, 30.0, 49.0, 42.0, 47.0, 42.0, 63.0, 54.0, 48.0, 47.0, 45.0, 51.0, 38.0, 37.0, 36.0, 26.0, 26.0, 30.0, 20.0, 23.0, 9.0, 13.0, 8.0, 7.0, 6.0, 2.0, 0.0, 2.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8198676109313965, -5.619709491729736, -5.419551372528076, -5.219393253326416, -5.019235134124756, -4.819077014923096, -4.618918418884277, -4.418760299682617, -4.218602180480957, -4.018444061279297, -3.8182859420776367, -3.6181278228759766, -3.4179697036743164, -3.2178115844726562, -3.017653226852417, -2.817495107650757, -2.617337226867676, -2.4171791076660156, -2.2170209884643555, -2.0168628692626953, -1.8167046308517456, -1.6165465116500854, -1.4163882732391357, -1.2162301540374756, -1.0160720348358154, -0.8159139156341553, -0.6157557368278503, -0.4155975580215454, -0.21543943881988525, -0.015281319618225098, 0.1848769187927246, 0.38503503799438477, 0.5851936340332031, 0.7853517532348633, 0.9855099320411682, 1.1856681108474731, 1.3858262300491333, 1.5859843492507935, 1.7861425876617432, 1.9863007068634033, 2.1864588260650635, 2.3866169452667236, 2.586775064468384, 2.786933422088623, 2.987091541290283, 3.1872496604919434, 3.3874077796936035, 3.5875658988952637, 3.787724018096924, 3.987882137298584, 4.188040256500244, 4.388198375701904, 4.5883564949035645, 4.788514614105225, 4.988673210144043, 5.188831329345703, 5.388989448547363, 5.589147567749023, 5.789305686950684, 5.989463806152344, 6.189621925354004, 6.389780044555664, 6.589938163757324, 6.790096282958984, 6.9902544021606445]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 12.0, 2.0, 11.0, 10.0, 15.0, 18.0, 15.0, 18.0, 22.0, 29.0, 24.0, 18.0, 28.0, 37.0, 34.0, 27.0, 37.0, 33.0, 42.0, 38.0, 46.0, 47.0, 29.0, 45.0, 28.0, 32.0, 43.0, 35.0, 29.0, 24.0, 20.0, 19.0, 24.0, 21.0, 9.0, 8.0, 12.0, 9.0, 8.0, 4.0, 3.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.675997257232666, -5.503960132598877, -5.331923484802246, -5.159886360168457, -4.987849712371826, -4.815812587738037, -4.643775939941406, -4.471738815307617, -4.299701690673828, -4.127664566040039, -3.955627918243408, -3.783590793609619, -3.6115541458129883, -3.439517021179199, -3.2674801349639893, -3.0954432487487793, -2.9234066009521484, -2.7513697147369385, -2.5793328285217285, -2.4072957038879395, -2.2352590560913086, -2.0632219314575195, -1.8911850452423096, -1.7191481590270996, -1.5471112728118896, -1.3750743865966797, -1.2030375003814697, -1.0310004949569702, -0.8589636087417603, -0.6869267225265503, -0.5148897171020508, -0.3428528308868408, -0.17081546783447266, 0.0012214481830596924, 0.17325836420059204, 0.3452953100204468, 0.5173321962356567, 0.6893690824508667, 0.8614060878753662, 1.0334429740905762, 1.2054798603057861, 1.377516746520996, 1.549553632736206, 1.7215906381607056, 1.8936275243759155, 2.065664291381836, 2.237701416015625, 2.409738302230835, 2.581775188446045, 2.753812074661255, 2.925848960876465, 3.097886085510254, 3.2699227333068848, 3.441959857940674, 3.613996744155884, 3.7860336303710938, 3.9580705165863037, 4.130107402801514, 4.302144527435303, 4.474181175231934, 4.646218299865723, 4.8182549476623535, 4.990292072296143, 5.162328720092773, 5.3343658447265625]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 3.0, 2.0, 9.0, 14.0, 21.0, 34.0, 29.0, 56.0, 62.0, 105.0, 130.0, 207.0, 281.0, 526.0, 791.0, 1204.0, 1920.0, 3423.0, 6235.0, 12662.0, 29322.0, 82279.0, 273805.0, 869118.0, 1495028.0, 954299.0, 311753.0, 91426.0, 31182.0, 13357.0, 6447.0, 3404.0, 2008.0, 1164.0, 704.0, 437.0, 260.0, 180.0, 117.0, 81.0, 66.0, 45.0, 29.0, 20.0, 15.0, 8.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.3125, -10.9942626953125, -10.676025390625, -10.3577880859375, -10.03955078125, -9.7213134765625, -9.403076171875, -9.0848388671875, -8.7666015625, -8.4483642578125, -8.130126953125, -7.8118896484375, -7.49365234375, -7.1754150390625, -6.857177734375, -6.5389404296875, -6.220703125, -5.9024658203125, -5.584228515625, -5.2659912109375, -4.94775390625, -4.6295166015625, -4.311279296875, -3.9930419921875, -3.6748046875, -3.3565673828125, -3.038330078125, -2.7200927734375, -2.40185546875, -2.0836181640625, -1.765380859375, -1.4471435546875, -1.12890625, -0.8106689453125, -0.492431640625, -0.1741943359375, 0.14404296875, 0.4622802734375, 0.780517578125, 1.0987548828125, 1.4169921875, 1.7352294921875, 2.053466796875, 2.3717041015625, 2.68994140625, 3.0081787109375, 3.326416015625, 3.6446533203125, 3.962890625, 4.2811279296875, 4.599365234375, 4.9176025390625, 5.23583984375, 5.5540771484375, 5.872314453125, 6.1905517578125, 6.5087890625, 6.8270263671875, 7.145263671875, 7.4635009765625, 7.78173828125, 8.0999755859375, 8.418212890625, 8.7364501953125, 9.0546875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 10.0, 5.0, 6.0, 7.0, 10.0, 10.0, 14.0, 18.0, 23.0, 16.0, 21.0, 27.0, 27.0, 29.0, 35.0, 25.0, 42.0, 34.0, 41.0, 31.0, 47.0, 36.0, 42.0, 36.0, 43.0, 51.0, 43.0, 29.0, 25.0, 30.0, 28.0, 29.0, 29.0, 19.0, 10.0, 12.0, 11.0, 14.0, 3.0, 6.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.01953125, -4.86383056640625, -4.7081298828125, -4.55242919921875, -4.396728515625, -4.24102783203125, -4.0853271484375, -3.92962646484375, -3.77392578125, -3.61822509765625, -3.4625244140625, -3.30682373046875, -3.151123046875, -2.99542236328125, -2.8397216796875, -2.68402099609375, -2.5283203125, -2.37261962890625, -2.2169189453125, -2.06121826171875, -1.905517578125, -1.74981689453125, -1.5941162109375, -1.43841552734375, -1.28271484375, -1.12701416015625, -0.9713134765625, -0.81561279296875, -0.659912109375, -0.50421142578125, -0.3485107421875, -0.19281005859375, -0.037109375, 0.11859130859375, 0.2742919921875, 0.42999267578125, 0.585693359375, 0.74139404296875, 0.8970947265625, 1.05279541015625, 1.20849609375, 1.36419677734375, 1.5198974609375, 1.67559814453125, 1.831298828125, 1.98699951171875, 2.1427001953125, 2.29840087890625, 2.4541015625, 2.60980224609375, 2.7655029296875, 2.92120361328125, 3.076904296875, 3.23260498046875, 3.3883056640625, 3.54400634765625, 3.69970703125, 3.85540771484375, 4.0111083984375, 4.16680908203125, 4.322509765625, 4.47821044921875, 4.6339111328125, 4.78961181640625, 4.9453125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 9.0, 10.0, 13.0, 13.0, 26.0, 36.0, 64.0, 77.0, 111.0, 202.0, 323.0, 477.0, 780.0, 1298.0, 2226.0, 3765.0, 6826.0, 12827.0, 26031.0, 58685.0, 153386.0, 439364.0, 1080803.0, 1323749.0, 680218.0, 241731.0, 87127.0, 36124.0, 17139.0, 9035.0, 4875.0, 2783.0, 1576.0, 978.0, 602.0, 350.0, 214.0, 152.0, 94.0, 68.0, 44.0, 22.0, 22.0, 12.0, 9.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.125, -9.7784423828125, -9.431884765625, -9.0853271484375, -8.73876953125, -8.3922119140625, -8.045654296875, -7.6990966796875, -7.3525390625, -7.0059814453125, -6.659423828125, -6.3128662109375, -5.96630859375, -5.6197509765625, -5.273193359375, -4.9266357421875, -4.580078125, -4.2335205078125, -3.886962890625, -3.5404052734375, -3.19384765625, -2.8472900390625, -2.500732421875, -2.1541748046875, -1.8076171875, -1.4610595703125, -1.114501953125, -0.7679443359375, -0.42138671875, -0.0748291015625, 0.271728515625, 0.6182861328125, 0.96484375, 1.3114013671875, 1.657958984375, 2.0045166015625, 2.35107421875, 2.6976318359375, 3.044189453125, 3.3907470703125, 3.7373046875, 4.0838623046875, 4.430419921875, 4.7769775390625, 5.12353515625, 5.4700927734375, 5.816650390625, 6.1632080078125, 6.509765625, 6.8563232421875, 7.202880859375, 7.5494384765625, 7.89599609375, 8.2425537109375, 8.589111328125, 8.9356689453125, 9.2822265625, 9.6287841796875, 9.975341796875, 10.3218994140625, 10.66845703125, 11.0150146484375, 11.361572265625, 11.7081298828125, 12.0546875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 10.0, 14.0, 19.0, 16.0, 21.0, 32.0, 31.0, 60.0, 59.0, 69.0, 110.0, 128.0, 165.0, 195.0, 236.0, 268.0, 274.0, 321.0, 280.0, 257.0, 280.0, 237.0, 189.0, 174.0, 165.0, 107.0, 82.0, 65.0, 44.0, 31.0, 22.0, 20.0, 18.0, 19.0, 15.0, 9.0, 6.0, 6.0, 6.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.619140625, -2.529571533203125, -2.44000244140625, -2.350433349609375, -2.2608642578125, -2.171295166015625, -2.08172607421875, -1.992156982421875, -1.902587890625, -1.813018798828125, -1.72344970703125, -1.633880615234375, -1.5443115234375, -1.454742431640625, -1.36517333984375, -1.275604248046875, -1.18603515625, -1.096466064453125, -1.00689697265625, -0.917327880859375, -0.8277587890625, -0.738189697265625, -0.64862060546875, -0.559051513671875, -0.469482421875, -0.379913330078125, -0.29034423828125, -0.200775146484375, -0.1112060546875, -0.021636962890625, 0.06793212890625, 0.157501220703125, 0.2470703125, 0.336639404296875, 0.42620849609375, 0.515777587890625, 0.6053466796875, 0.694915771484375, 0.78448486328125, 0.874053955078125, 0.963623046875, 1.053192138671875, 1.14276123046875, 1.232330322265625, 1.3218994140625, 1.411468505859375, 1.50103759765625, 1.590606689453125, 1.68017578125, 1.769744873046875, 1.85931396484375, 1.948883056640625, 2.0384521484375, 2.128021240234375, 2.21759033203125, 2.307159423828125, 2.396728515625, 2.486297607421875, 2.57586669921875, 2.665435791015625, 2.7550048828125, 2.844573974609375, 2.93414306640625, 3.023712158203125, 3.11328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 10.0, 10.0, 12.0, 20.0, 18.0, 26.0, 26.0, 27.0, 38.0, 44.0, 47.0, 60.0, 48.0, 69.0, 60.0, 54.0, 52.0, 37.0, 40.0, 35.0, 42.0, 35.0, 28.0, 27.0, 33.0, 16.0, 10.0, 9.0, 7.0, 10.0, 13.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.6698431968688965, -7.442725658416748, -7.215608596801758, -6.988491058349609, -6.761373996734619, -6.534256458282471, -6.3071393966674805, -6.080021858215332, -5.852904319763184, -5.625786781311035, -5.398669719696045, -5.1715521812438965, -4.944435119628906, -4.717317581176758, -4.490200042724609, -4.263082981109619, -4.035965919494629, -3.8088486194610596, -3.5817313194274902, -3.354613780975342, -3.1274964809417725, -2.900379180908203, -2.673261880874634, -2.4461445808410645, -2.219027042388916, -1.9919097423553467, -1.7647923231124878, -1.5376750230789185, -1.3105576038360596, -1.0834403038024902, -0.8563230037689209, -0.629205584526062, -0.4020881652832031, -0.1749708205461502, 0.05214652419090271, 0.27926385402679443, 0.5063812136650085, 0.7334985733032227, 0.960615873336792, 1.1877332925796509, 1.4148505926132202, 1.6419678926467896, 1.8690853118896484, 2.0962026119232178, 2.323319911956787, 2.5504374504089355, 2.777554512023926, 3.004672050476074, 3.2317893505096436, 3.458906650543213, 3.6860239505767822, 3.9131412506103516, 4.1402587890625, 4.367376327514648, 4.594493389129639, 4.821610927581787, 5.048727989196777, 5.275845527648926, 5.502962589263916, 5.7300801277160645, 5.957197189331055, 6.184314727783203, 6.411432266235352, 6.638549327850342, 6.86566686630249]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 6.0, 9.0, 10.0, 4.0, 15.0, 17.0, 21.0, 20.0, 14.0, 28.0, 26.0, 26.0, 33.0, 28.0, 30.0, 32.0, 36.0, 37.0, 39.0, 38.0, 47.0, 46.0, 27.0, 37.0, 28.0, 30.0, 35.0, 38.0, 39.0, 33.0, 21.0, 18.0, 19.0, 12.0, 14.0, 11.0, 15.0, 11.0, 8.0, 5.0, 7.0, 6.0, 1.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.9899001121521, -5.814560413360596, -5.639220714569092, -5.463881492614746, -5.288541793823242, -5.113202095031738, -4.937862396240234, -4.7625226974487305, -4.587183475494385, -4.411843776702881, -4.236504077911377, -4.061164855957031, -3.8858251571655273, -3.7104854583740234, -3.5351457595825195, -3.3598062992095947, -3.184466600418091, -3.009126901626587, -2.833787441253662, -2.658447742462158, -2.4831082820892334, -2.3077685832977295, -2.1324291229248047, -1.9570894241333008, -1.7817498445510864, -1.606410264968872, -1.4310706853866577, -1.2557311058044434, -1.0803914070129395, -0.9050518870353699, -0.7297122478485107, -0.5543726682662964, -0.37903308868408203, -0.20369349420070648, -0.028353899717330933, 0.1469857096672058, 0.32232528924942017, 0.4976648688316345, 0.6730045080184937, 0.848344087600708, 1.0236836671829224, 1.1990232467651367, 1.374362826347351, 1.5497024059295654, 1.7250421047210693, 1.9003815650939941, 2.075721263885498, 2.251060962677002, 2.4264004230499268, 2.6017401218414307, 2.7770795822143555, 2.9524192810058594, 3.127758741378784, 3.303098440170288, 3.478437900543213, 3.653777599334717, 3.8291172981262207, 4.004456996917725, 4.1797966957092285, 4.355135917663574, 4.530475616455078, 4.705815315246582, 4.881155014038086, 5.05649471282959, 5.2318339347839355]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 5.0, 10.0, 24.0, 14.0, 37.0, 62.0, 97.0, 120.0, 197.0, 337.0, 473.0, 703.0, 1044.0, 1719.0, 2632.0, 4162.0, 6813.0, 11048.0, 18500.0, 31303.0, 53404.0, 90278.0, 141426.0, 186011.0, 177469.0, 127067.0, 78156.0, 46399.0, 26974.0, 16138.0, 9786.0, 5850.0, 3661.0, 2274.0, 1426.0, 979.0, 635.0, 483.0, 298.0, 196.0, 120.0, 76.0, 48.0, 40.0, 21.0, 10.0, 7.0, 11.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.3525390625, -1.3087158203125, -1.264892578125, -1.2210693359375, -1.17724609375, -1.1334228515625, -1.089599609375, -1.0457763671875, -1.001953125, -0.9581298828125, -0.914306640625, -0.8704833984375, -0.82666015625, -0.7828369140625, -0.739013671875, -0.6951904296875, -0.6513671875, -0.6075439453125, -0.563720703125, -0.5198974609375, -0.47607421875, -0.4322509765625, -0.388427734375, -0.3446044921875, -0.30078125, -0.2569580078125, -0.213134765625, -0.1693115234375, -0.12548828125, -0.0816650390625, -0.037841796875, 0.0059814453125, 0.0498046875, 0.0936279296875, 0.137451171875, 0.1812744140625, 0.22509765625, 0.2689208984375, 0.312744140625, 0.3565673828125, 0.400390625, 0.4442138671875, 0.488037109375, 0.5318603515625, 0.57568359375, 0.6195068359375, 0.663330078125, 0.7071533203125, 0.7509765625, 0.7947998046875, 0.838623046875, 0.8824462890625, 0.92626953125, 0.9700927734375, 1.013916015625, 1.0577392578125, 1.1015625, 1.1453857421875, 1.189208984375, 1.2330322265625, 1.27685546875, 1.3206787109375, 1.364501953125, 1.4083251953125, 1.4521484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 11.0, 4.0, 5.0, 10.0, 6.0, 7.0, 12.0, 18.0, 20.0, 16.0, 23.0, 30.0, 31.0, 25.0, 24.0, 29.0, 32.0, 39.0, 45.0, 42.0, 33.0, 42.0, 40.0, 32.0, 37.0, 36.0, 44.0, 30.0, 33.0, 31.0, 27.0, 20.0, 32.0, 19.0, 19.0, 11.0, 14.0, 11.0, 6.0, 12.0, 8.0, 16.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.8203125, -5.63665771484375, -5.4530029296875, -5.26934814453125, -5.085693359375, -4.90203857421875, -4.7183837890625, -4.53472900390625, -4.35107421875, -4.16741943359375, -3.9837646484375, -3.80010986328125, -3.616455078125, -3.43280029296875, -3.2491455078125, -3.06549072265625, -2.8818359375, -2.69818115234375, -2.5145263671875, -2.33087158203125, -2.147216796875, -1.96356201171875, -1.7799072265625, -1.59625244140625, -1.41259765625, -1.22894287109375, -1.0452880859375, -0.86163330078125, -0.677978515625, -0.49432373046875, -0.3106689453125, -0.12701416015625, 0.056640625, 0.24029541015625, 0.4239501953125, 0.60760498046875, 0.791259765625, 0.97491455078125, 1.1585693359375, 1.34222412109375, 1.52587890625, 1.70953369140625, 1.8931884765625, 2.07684326171875, 2.260498046875, 2.44415283203125, 2.6278076171875, 2.81146240234375, 2.9951171875, 3.17877197265625, 3.3624267578125, 3.54608154296875, 3.729736328125, 3.91339111328125, 4.0970458984375, 4.28070068359375, 4.46435546875, 4.64801025390625, 4.8316650390625, 5.01531982421875, 5.198974609375, 5.38262939453125, 5.5662841796875, 5.74993896484375, 5.93359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 6.0, 10.0, 15.0, 12.0, 18.0, 36.0, 38.0, 48.0, 89.0, 98.0, 156.0, 207.0, 306.0, 455.0, 646.0, 1119.0, 1748.0, 2874.0, 4667.0, 8109.0, 14537.0, 27949.0, 162948.0, 729212.0, 46632.0, 19643.0, 10802.0, 6249.0, 3642.0, 2224.0, 1410.0, 883.0, 552.0, 351.0, 256.0, 166.0, 122.0, 99.0, 46.0, 40.0, 30.0, 19.0, 24.0, 12.0, 18.0, 6.0, 11.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0], "bins": [-4.06640625, -3.9403076171875, -3.814208984375, -3.6881103515625, -3.56201171875, -3.4359130859375, -3.309814453125, -3.1837158203125, -3.0576171875, -2.9315185546875, -2.805419921875, -2.6793212890625, -2.55322265625, -2.4271240234375, -2.301025390625, -2.1749267578125, -2.048828125, -1.9227294921875, -1.796630859375, -1.6705322265625, -1.54443359375, -1.4183349609375, -1.292236328125, -1.1661376953125, -1.0400390625, -0.9139404296875, -0.787841796875, -0.6617431640625, -0.53564453125, -0.4095458984375, -0.283447265625, -0.1573486328125, -0.03125, 0.0948486328125, 0.220947265625, 0.3470458984375, 0.47314453125, 0.5992431640625, 0.725341796875, 0.8514404296875, 0.9775390625, 1.1036376953125, 1.229736328125, 1.3558349609375, 1.48193359375, 1.6080322265625, 1.734130859375, 1.8602294921875, 1.986328125, 2.1124267578125, 2.238525390625, 2.3646240234375, 2.49072265625, 2.6168212890625, 2.742919921875, 2.8690185546875, 2.9951171875, 3.1212158203125, 3.247314453125, 3.3734130859375, 3.49951171875, 3.6256103515625, 3.751708984375, 3.8778076171875, 4.00390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 3.0, 12.0, 7.0, 3.0, 9.0, 16.0, 16.0, 21.0, 19.0, 15.0, 16.0, 21.0, 20.0, 20.0, 25.0, 39.0, 38.0, 32.0, 35.0, 35.0, 54.0, 32.0, 38.0, 40.0, 32.0, 34.0, 30.0, 38.0, 23.0, 37.0, 17.0, 24.0, 20.0, 22.0, 28.0, 19.0, 19.0, 16.0, 17.0, 14.0, 7.0, 10.0, 6.0, 5.0, 6.0, 3.0, 7.0, 1.0, 0.0, 4.0, 1.0], "bins": [-4.62890625, -4.497650146484375, -4.36639404296875, -4.235137939453125, -4.1038818359375, -3.972625732421875, -3.84136962890625, -3.710113525390625, -3.578857421875, -3.447601318359375, -3.31634521484375, -3.185089111328125, -3.0538330078125, -2.922576904296875, -2.79132080078125, -2.660064697265625, -2.52880859375, -2.397552490234375, -2.26629638671875, -2.135040283203125, -2.0037841796875, -1.872528076171875, -1.74127197265625, -1.610015869140625, -1.478759765625, -1.347503662109375, -1.21624755859375, -1.084991455078125, -0.9537353515625, -0.822479248046875, -0.69122314453125, -0.559967041015625, -0.4287109375, -0.297454833984375, -0.16619873046875, -0.034942626953125, 0.0963134765625, 0.227569580078125, 0.35882568359375, 0.490081787109375, 0.621337890625, 0.752593994140625, 0.88385009765625, 1.015106201171875, 1.1463623046875, 1.277618408203125, 1.40887451171875, 1.540130615234375, 1.67138671875, 1.802642822265625, 1.93389892578125, 2.065155029296875, 2.1964111328125, 2.327667236328125, 2.45892333984375, 2.590179443359375, 2.721435546875, 2.852691650390625, 2.98394775390625, 3.115203857421875, 3.2464599609375, 3.377716064453125, 3.50897216796875, 3.640228271484375, 3.771484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 11.0, 13.0, 27.0, 26.0, 48.0, 71.0, 111.0, 180.0, 287.0, 504.0, 861.0, 1474.0, 3011.0, 6382.0, 15036.0, 56888.0, 879667.0, 56049.0, 15041.0, 6306.0, 2933.0, 1526.0, 827.0, 454.0, 285.0, 195.0, 124.0, 61.0, 38.0, 31.0, 19.0, 19.0, 8.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83447265625, -0.806182861328125, -0.77789306640625, -0.749603271484375, -0.7213134765625, -0.693023681640625, -0.66473388671875, -0.636444091796875, -0.608154296875, -0.579864501953125, -0.55157470703125, -0.523284912109375, -0.4949951171875, -0.466705322265625, -0.43841552734375, -0.410125732421875, -0.3818359375, -0.353546142578125, -0.32525634765625, -0.296966552734375, -0.2686767578125, -0.240386962890625, -0.21209716796875, -0.183807373046875, -0.155517578125, -0.127227783203125, -0.09893798828125, -0.070648193359375, -0.0423583984375, -0.014068603515625, 0.01422119140625, 0.042510986328125, 0.07080078125, 0.099090576171875, 0.12738037109375, 0.155670166015625, 0.1839599609375, 0.212249755859375, 0.24053955078125, 0.268829345703125, 0.297119140625, 0.325408935546875, 0.35369873046875, 0.381988525390625, 0.4102783203125, 0.438568115234375, 0.46685791015625, 0.495147705078125, 0.5234375, 0.551727294921875, 0.58001708984375, 0.608306884765625, 0.6365966796875, 0.664886474609375, 0.69317626953125, 0.721466064453125, 0.749755859375, 0.778045654296875, 0.80633544921875, 0.834625244140625, 0.8629150390625, 0.891204833984375, 0.91949462890625, 0.947784423828125, 0.97607421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 13.0, 12.0, 16.0, 32.0, 42.0, 47.0, 64.0, 94.0, 79.0, 110.0, 94.0, 108.0, 67.0, 58.0, 37.0, 30.0, 25.0, 17.0, 8.0, 8.0, 7.0, 10.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3272972106933594e-05, -4.1816383600234985e-05, -4.035979509353638e-05, -3.890320658683777e-05, -3.744661808013916e-05, -3.599002957344055e-05, -3.453344106674194e-05, -3.3076852560043335e-05, -3.1620264053344727e-05, -3.0163675546646118e-05, -2.870708703994751e-05, -2.72504985332489e-05, -2.5793910026550293e-05, -2.4337321519851685e-05, -2.2880733013153076e-05, -2.1424144506454468e-05, -1.996755599975586e-05, -1.851096749305725e-05, -1.7054378986358643e-05, -1.5597790479660034e-05, -1.4141201972961426e-05, -1.2684613466262817e-05, -1.1228024959564209e-05, -9.7714364528656e-06, -8.314847946166992e-06, -6.858259439468384e-06, -5.401670932769775e-06, -3.945082426071167e-06, -2.4884939193725586e-06, -1.0319054126739502e-06, 4.246830940246582e-07, 1.8812716007232666e-06, 3.337860107421875e-06, 4.794448614120483e-06, 6.251037120819092e-06, 7.7076256275177e-06, 9.164214134216309e-06, 1.0620802640914917e-05, 1.2077391147613525e-05, 1.3533979654312134e-05, 1.4990568161010742e-05, 1.644715666770935e-05, 1.790374517440796e-05, 1.9360333681106567e-05, 2.0816922187805176e-05, 2.2273510694503784e-05, 2.3730099201202393e-05, 2.5186687707901e-05, 2.664327621459961e-05, 2.8099864721298218e-05, 2.9556453227996826e-05, 3.1013041734695435e-05, 3.246963024139404e-05, 3.392621874809265e-05, 3.538280725479126e-05, 3.683939576148987e-05, 3.8295984268188477e-05, 3.9752572774887085e-05, 4.120916128158569e-05, 4.26657497882843e-05, 4.412233829498291e-05, 4.557892680168152e-05, 4.703551530838013e-05, 4.8492103815078735e-05, 4.9948692321777344e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 3.0, 4.0, 15.0, 13.0, 25.0, 27.0, 42.0, 82.0, 93.0, 121.0, 193.0, 272.0, 394.0, 522.0, 876.0, 1236.0, 1871.0, 2833.0, 4375.0, 6864.0, 11063.0, 18409.0, 30821.0, 53687.0, 96891.0, 166410.0, 219211.0, 179336.0, 106132.0, 59523.0, 34169.0, 19933.0, 11912.0, 7446.0, 4663.0, 2873.0, 1984.0, 1401.0, 860.0, 594.0, 418.0, 299.0, 201.0, 132.0, 79.0, 82.0, 51.0, 33.0, 22.0, 21.0, 12.0, 11.0, 6.0, 4.0, 5.0, 2.0], "bins": [-0.55908203125, -0.5429153442382812, -0.5267486572265625, -0.5105819702148438, -0.494415283203125, -0.47824859619140625, -0.4620819091796875, -0.44591522216796875, -0.42974853515625, -0.41358184814453125, -0.3974151611328125, -0.38124847412109375, -0.365081787109375, -0.34891510009765625, -0.3327484130859375, -0.31658172607421875, -0.3004150390625, -0.28424835205078125, -0.2680816650390625, -0.25191497802734375, -0.235748291015625, -0.21958160400390625, -0.2034149169921875, -0.18724822998046875, -0.17108154296875, -0.15491485595703125, -0.1387481689453125, -0.12258148193359375, -0.106414794921875, -0.09024810791015625, -0.0740814208984375, -0.05791473388671875, -0.041748046875, -0.02558135986328125, -0.0094146728515625, 0.00675201416015625, 0.022918701171875, 0.03908538818359375, 0.0552520751953125, 0.07141876220703125, 0.08758544921875, 0.10375213623046875, 0.1199188232421875, 0.13608551025390625, 0.152252197265625, 0.16841888427734375, 0.1845855712890625, 0.20075225830078125, 0.2169189453125, 0.23308563232421875, 0.2492523193359375, 0.26541900634765625, 0.281585693359375, 0.29775238037109375, 0.3139190673828125, 0.33008575439453125, 0.34625244140625, 0.36241912841796875, 0.3785858154296875, 0.39475250244140625, 0.410919189453125, 0.42708587646484375, 0.4432525634765625, 0.45941925048828125, 0.4755859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 8.0, 7.0, 6.0, 10.0, 10.0, 5.0, 11.0, 16.0, 29.0, 30.0, 22.0, 31.0, 25.0, 31.0, 36.0, 48.0, 50.0, 68.0, 86.0, 68.0, 61.0, 49.0, 31.0, 28.0, 34.0, 30.0, 18.0, 17.0, 23.0, 15.0, 7.0, 19.0, 13.0, 9.0, 12.0, 10.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1951904296875, -0.1892566680908203, -0.18332290649414062, -0.17738914489746094, -0.17145538330078125, -0.16552162170410156, -0.15958786010742188, -0.1536540985107422, -0.1477203369140625, -0.1417865753173828, -0.13585281372070312, -0.12991905212402344, -0.12398529052734375, -0.11805152893066406, -0.11211776733398438, -0.10618400573730469, -0.100250244140625, -0.09431648254394531, -0.08838272094726562, -0.08244895935058594, -0.07651519775390625, -0.07058143615722656, -0.06464767456054688, -0.05871391296386719, -0.0527801513671875, -0.04684638977050781, -0.040912628173828125, -0.03497886657714844, -0.02904510498046875, -0.023111343383789062, -0.017177581787109375, -0.011243820190429688, -0.00531005859375, 0.0006237030029296875, 0.006557464599609375, 0.012491226196289062, 0.01842498779296875, 0.024358749389648438, 0.030292510986328125, 0.03622627258300781, 0.0421600341796875, 0.04809379577636719, 0.054027557373046875, 0.05996131896972656, 0.06589508056640625, 0.07182884216308594, 0.07776260375976562, 0.08369636535644531, 0.089630126953125, 0.09556388854980469, 0.10149765014648438, 0.10743141174316406, 0.11336517333984375, 0.11929893493652344, 0.12523269653320312, 0.1311664581298828, 0.1371002197265625, 0.1430339813232422, 0.14896774291992188, 0.15490150451660156, 0.16083526611328125, 0.16676902770996094, 0.17270278930664062, 0.1786365509033203, 0.1845703125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 10.0, 15.0, 8.0, 13.0, 21.0, 14.0, 27.0, 24.0, 35.0, 33.0, 42.0, 44.0, 54.0, 62.0, 61.0, 67.0, 47.0, 50.0, 40.0, 39.0, 35.0, 41.0, 29.0, 42.0, 21.0, 24.0, 24.0, 14.0, 4.0, 8.0, 11.0, 15.0, 5.0, 4.0, 8.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.505505084991455, -7.2827467918396, -7.059988021850586, -6.8372297286987305, -6.614471435546875, -6.3917131423950195, -6.168954849243164, -5.94619607925415, -5.723437786102295, -5.5006794929504395, -5.277920722961426, -5.05516242980957, -4.832404136657715, -4.609645843505859, -4.386887550354004, -4.16412878036499, -3.9413704872131348, -3.7186121940612793, -3.4958536624908447, -3.27309513092041, -3.0503368377685547, -2.827578544616699, -2.6048200130462646, -2.38206148147583, -2.1593031883239746, -1.9365447759628296, -1.7137863636016846, -1.4910279512405396, -1.2682695388793945, -1.0455111265182495, -0.8227527141571045, -0.5999943017959595, -0.37723636627197266, -0.15447795391082764, 0.06828045845031738, 0.2910388708114624, 0.5137972831726074, 0.7365556955337524, 0.9593141078948975, 1.1820725202560425, 1.4048309326171875, 1.6275893449783325, 1.8503477573394775, 2.073106288909912, 2.2958645820617676, 2.518622875213623, 2.7413814067840576, 2.964139938354492, 3.1868982315063477, 3.409656524658203, 3.6324150562286377, 3.8551735877990723, 4.077931880950928, 4.300690174102783, 4.523448944091797, 4.746207237243652, 4.968965530395508, 5.191723823547363, 5.414482116699219, 5.637240886688232, 5.859999179840088, 6.082757472991943, 6.305516242980957, 6.5282745361328125, 6.751032829284668]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 8.0, 4.0, 8.0, 10.0, 7.0, 11.0, 7.0, 14.0, 19.0, 26.0, 20.0, 24.0, 26.0, 23.0, 33.0, 28.0, 28.0, 35.0, 32.0, 44.0, 30.0, 54.0, 40.0, 39.0, 37.0, 37.0, 28.0, 25.0, 37.0, 40.0, 49.0, 23.0, 24.0, 18.0, 16.0, 15.0, 12.0, 12.0, 16.0, 7.0, 9.0, 8.0, 6.0, 2.0, 2.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.041230201721191, -5.864303112030029, -5.687376022338867, -5.510448932647705, -5.333521842956543, -5.156594753265381, -4.979667663574219, -4.802740573883057, -4.6258134841918945, -4.448886394500732, -4.27195930480957, -4.095032215118408, -3.918105125427246, -3.741178035736084, -3.564250946044922, -3.3873238563537598, -3.2103965282440186, -3.0334694385528564, -2.8565423488616943, -2.6796152591705322, -2.50268816947937, -2.325761079788208, -2.148833751678467, -1.9719067811965942, -1.7949796915054321, -1.61805260181427, -1.441125512123108, -1.2641983032226562, -1.0872712135314941, -0.9103441834449768, -0.7334170341491699, -0.5564899444580078, -0.3795628547668457, -0.2026357501745224, -0.025708645582199097, 0.1512184739112854, 0.3281455636024475, 0.5050726532936096, 0.6819998025894165, 0.8589268922805786, 1.0358539819717407, 1.2127810716629028, 1.389708161354065, 1.5666353702545166, 1.7435624599456787, 1.9204895496368408, 2.097416639328003, 2.274343729019165, 2.451270818710327, 2.6281979084014893, 2.8051249980926514, 2.9820520877838135, 3.1589791774749756, 3.3359062671661377, 3.512833595275879, 3.689760684967041, 3.866687774658203, 4.043614864349365, 4.220541954040527, 4.3974690437316895, 4.574396133422852, 4.751323223114014, 4.928250312805176, 5.105177402496338, 5.2821044921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 6.0, 16.0, 16.0, 25.0, 32.0, 49.0, 66.0, 74.0, 117.0, 182.0, 241.0, 375.0, 612.0, 969.0, 1575.0, 2541.0, 4536.0, 8171.0, 14665.0, 27813.0, 53460.0, 98587.0, 160321.0, 203209.0, 186584.0, 127538.0, 72858.0, 38196.0, 20204.0, 10576.0, 6090.0, 3435.0, 2037.0, 1139.0, 791.0, 498.0, 281.0, 195.0, 115.0, 95.0, 59.0, 51.0, 34.0, 37.0, 21.0, 30.0, 5.0, 5.0, 7.0, 9.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.77734375, -5.5953369140625, -5.413330078125, -5.2313232421875, -5.04931640625, -4.8673095703125, -4.685302734375, -4.5032958984375, -4.3212890625, -4.1392822265625, -3.957275390625, -3.7752685546875, -3.59326171875, -3.4112548828125, -3.229248046875, -3.0472412109375, -2.865234375, -2.6832275390625, -2.501220703125, -2.3192138671875, -2.13720703125, -1.9552001953125, -1.773193359375, -1.5911865234375, -1.4091796875, -1.2271728515625, -1.045166015625, -0.8631591796875, -0.68115234375, -0.4991455078125, -0.317138671875, -0.1351318359375, 0.046875, 0.2288818359375, 0.410888671875, 0.5928955078125, 0.77490234375, 0.9569091796875, 1.138916015625, 1.3209228515625, 1.5029296875, 1.6849365234375, 1.866943359375, 2.0489501953125, 2.23095703125, 2.4129638671875, 2.594970703125, 2.7769775390625, 2.958984375, 3.1409912109375, 3.322998046875, 3.5050048828125, 3.68701171875, 3.8690185546875, 4.051025390625, 4.2330322265625, 4.4150390625, 4.5970458984375, 4.779052734375, 4.9610595703125, 5.14306640625, 5.3250732421875, 5.507080078125, 5.6890869140625, 5.87109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 6.0, 7.0, 6.0, 4.0, 7.0, 20.0, 13.0, 20.0, 20.0, 21.0, 30.0, 26.0, 34.0, 25.0, 34.0, 44.0, 44.0, 32.0, 30.0, 45.0, 60.0, 41.0, 37.0, 43.0, 33.0, 36.0, 30.0, 41.0, 32.0, 27.0, 31.0, 11.0, 14.0, 14.0, 20.0, 8.0, 8.0, 10.0, 9.0, 4.0, 4.0, 1.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.61328125, -6.41900634765625, -6.2247314453125, -6.03045654296875, -5.836181640625, -5.64190673828125, -5.4476318359375, -5.25335693359375, -5.05908203125, -4.86480712890625, -4.6705322265625, -4.47625732421875, -4.281982421875, -4.08770751953125, -3.8934326171875, -3.69915771484375, -3.5048828125, -3.31060791015625, -3.1163330078125, -2.92205810546875, -2.727783203125, -2.53350830078125, -2.3392333984375, -2.14495849609375, -1.95068359375, -1.75640869140625, -1.5621337890625, -1.36785888671875, -1.173583984375, -0.97930908203125, -0.7850341796875, -0.59075927734375, -0.396484375, -0.20220947265625, -0.0079345703125, 0.18634033203125, 0.380615234375, 0.57489013671875, 0.7691650390625, 0.96343994140625, 1.15771484375, 1.35198974609375, 1.5462646484375, 1.74053955078125, 1.934814453125, 2.12908935546875, 2.3233642578125, 2.51763916015625, 2.7119140625, 2.90618896484375, 3.1004638671875, 3.29473876953125, 3.489013671875, 3.68328857421875, 3.8775634765625, 4.07183837890625, 4.26611328125, 4.46038818359375, 4.6546630859375, 4.84893798828125, 5.043212890625, 5.23748779296875, 5.4317626953125, 5.62603759765625, 5.8203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 8.0, 8.0, 12.0, 22.0, 46.0, 58.0, 106.0, 110.0, 211.0, 296.0, 504.0, 765.0, 1207.0, 1967.0, 3113.0, 5143.0, 8369.0, 13863.0, 24095.0, 40986.0, 68929.0, 107520.0, 147612.0, 168314.0, 154315.0, 114964.0, 74616.0, 45241.0, 26744.0, 15595.0, 9045.0, 5599.0, 3374.0, 2103.0, 1307.0, 794.0, 554.0, 344.0, 211.0, 152.0, 124.0, 78.0, 38.0, 39.0, 20.0, 14.0, 9.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-5.359375, -5.1998291015625, -5.040283203125, -4.8807373046875, -4.72119140625, -4.5616455078125, -4.402099609375, -4.2425537109375, -4.0830078125, -3.9234619140625, -3.763916015625, -3.6043701171875, -3.44482421875, -3.2852783203125, -3.125732421875, -2.9661865234375, -2.806640625, -2.6470947265625, -2.487548828125, -2.3280029296875, -2.16845703125, -2.0089111328125, -1.849365234375, -1.6898193359375, -1.5302734375, -1.3707275390625, -1.211181640625, -1.0516357421875, -0.89208984375, -0.7325439453125, -0.572998046875, -0.4134521484375, -0.25390625, -0.0943603515625, 0.065185546875, 0.2247314453125, 0.38427734375, 0.5438232421875, 0.703369140625, 0.8629150390625, 1.0224609375, 1.1820068359375, 1.341552734375, 1.5010986328125, 1.66064453125, 1.8201904296875, 1.979736328125, 2.1392822265625, 2.298828125, 2.4583740234375, 2.617919921875, 2.7774658203125, 2.93701171875, 3.0965576171875, 3.256103515625, 3.4156494140625, 3.5751953125, 3.7347412109375, 3.894287109375, 4.0538330078125, 4.21337890625, 4.3729248046875, 4.532470703125, 4.6920166015625, 4.8515625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 6.0, 2.0, 6.0, 6.0, 8.0, 6.0, 3.0, 11.0, 16.0, 18.0, 20.0, 25.0, 38.0, 21.0, 25.0, 29.0, 31.0, 35.0, 37.0, 45.0, 35.0, 34.0, 53.0, 46.0, 30.0, 42.0, 30.0, 35.0, 28.0, 37.0, 32.0, 32.0, 19.0, 26.0, 27.0, 21.0, 15.0, 9.0, 16.0, 8.0, 7.0, 6.0, 6.0, 7.0, 8.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.130859375, -3.015350341796875, -2.89984130859375, -2.784332275390625, -2.6688232421875, -2.553314208984375, -2.43780517578125, -2.322296142578125, -2.206787109375, -2.091278076171875, -1.97576904296875, -1.860260009765625, -1.7447509765625, -1.629241943359375, -1.51373291015625, -1.398223876953125, -1.28271484375, -1.167205810546875, -1.05169677734375, -0.936187744140625, -0.8206787109375, -0.705169677734375, -0.58966064453125, -0.474151611328125, -0.358642578125, -0.243133544921875, -0.12762451171875, -0.012115478515625, 0.1033935546875, 0.218902587890625, 0.33441162109375, 0.449920654296875, 0.5654296875, 0.680938720703125, 0.79644775390625, 0.911956787109375, 1.0274658203125, 1.142974853515625, 1.25848388671875, 1.373992919921875, 1.489501953125, 1.605010986328125, 1.72052001953125, 1.836029052734375, 1.9515380859375, 2.067047119140625, 2.18255615234375, 2.298065185546875, 2.41357421875, 2.529083251953125, 2.64459228515625, 2.760101318359375, 2.8756103515625, 2.991119384765625, 3.10662841796875, 3.222137451171875, 3.337646484375, 3.453155517578125, 3.56866455078125, 3.684173583984375, 3.7996826171875, 3.915191650390625, 4.03070068359375, 4.146209716796875, 4.26171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 4.0, 6.0, 3.0, 7.0, 18.0, 29.0, 30.0, 37.0, 77.0, 84.0, 138.0, 201.0, 267.0, 455.0, 593.0, 931.0, 1370.0, 2187.0, 3549.0, 5657.0, 9288.0, 15108.0, 25666.0, 43300.0, 71046.0, 107998.0, 147224.0, 164532.0, 148316.0, 112144.0, 74088.0, 45502.0, 26919.0, 15960.0, 9598.0, 5842.0, 3635.0, 2368.0, 1450.0, 973.0, 610.0, 428.0, 262.0, 219.0, 131.0, 90.0, 59.0, 45.0, 32.0, 22.0, 18.0, 16.0, 13.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0], "bins": [-2.095703125, -2.029266357421875, -1.96282958984375, -1.896392822265625, -1.8299560546875, -1.763519287109375, -1.69708251953125, -1.630645751953125, -1.564208984375, -1.497772216796875, -1.43133544921875, -1.364898681640625, -1.2984619140625, -1.232025146484375, -1.16558837890625, -1.099151611328125, -1.03271484375, -0.966278076171875, -0.89984130859375, -0.833404541015625, -0.7669677734375, -0.700531005859375, -0.63409423828125, -0.567657470703125, -0.501220703125, -0.434783935546875, -0.36834716796875, -0.301910400390625, -0.2354736328125, -0.169036865234375, -0.10260009765625, -0.036163330078125, 0.0302734375, 0.096710205078125, 0.16314697265625, 0.229583740234375, 0.2960205078125, 0.362457275390625, 0.42889404296875, 0.495330810546875, 0.561767578125, 0.628204345703125, 0.69464111328125, 0.761077880859375, 0.8275146484375, 0.893951416015625, 0.96038818359375, 1.026824951171875, 1.09326171875, 1.159698486328125, 1.22613525390625, 1.292572021484375, 1.3590087890625, 1.425445556640625, 1.49188232421875, 1.558319091796875, 1.624755859375, 1.691192626953125, 1.75762939453125, 1.824066162109375, 1.8905029296875, 1.956939697265625, 2.02337646484375, 2.089813232421875, 2.15625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 7.0, 17.0, 22.0, 35.0, 37.0, 44.0, 71.0, 78.0, 93.0, 116.0, 110.0, 88.0, 74.0, 63.0, 39.0, 37.0, 26.0, 19.0, 6.0, 11.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003795623779296875, -0.00036829710006713867, -0.00035703182220458984, -0.000345766544342041, -0.0003345012664794922, -0.00032323598861694336, -0.00031197071075439453, -0.0003007054328918457, -0.0002894401550292969, -0.00027817487716674805, -0.0002669095993041992, -0.0002556443214416504, -0.00024437904357910156, -0.00023311376571655273, -0.0002218484878540039, -0.00021058320999145508, -0.00019931793212890625, -0.00018805265426635742, -0.0001767873764038086, -0.00016552209854125977, -0.00015425682067871094, -0.0001429915428161621, -0.00013172626495361328, -0.00012046098709106445, -0.00010919570922851562, -9.79304313659668e-05, -8.666515350341797e-05, -7.539987564086914e-05, -6.413459777832031e-05, -5.2869319915771484e-05, -4.1604042053222656e-05, -3.0338764190673828e-05, -1.9073486328125e-05, -7.808208465576172e-06, 3.4570693969726562e-06, 1.4722347259521484e-05, 2.5987625122070312e-05, 3.725290298461914e-05, 4.851818084716797e-05, 5.97834587097168e-05, 7.104873657226562e-05, 8.231401443481445e-05, 9.357929229736328e-05, 0.00010484457015991211, 0.00011610984802246094, 0.00012737512588500977, 0.0001386404037475586, 0.00014990568161010742, 0.00016117095947265625, 0.00017243623733520508, 0.0001837015151977539, 0.00019496679306030273, 0.00020623207092285156, 0.0002174973487854004, 0.00022876262664794922, 0.00024002790451049805, 0.0002512931823730469, 0.0002625584602355957, 0.00027382373809814453, 0.00028508901596069336, 0.0002963542938232422, 0.000307619571685791, 0.00031888484954833984, 0.00033015012741088867, 0.0003414154052734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 15.0, 14.0, 16.0, 41.0, 42.0, 60.0, 97.0, 124.0, 207.0, 285.0, 453.0, 698.0, 1080.0, 1761.0, 2960.0, 5150.0, 8304.0, 14685.0, 26056.0, 44809.0, 76025.0, 119590.0, 162360.0, 176843.0, 149230.0, 104197.0, 63767.0, 37899.0, 21641.0, 12155.0, 7119.0, 4078.0, 2510.0, 1466.0, 945.0, 659.0, 383.0, 271.0, 168.0, 111.0, 72.0, 67.0, 40.0, 28.0, 20.0, 11.0, 11.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.310546875, -2.234375, -2.158203125, -2.08203125, -2.005859375, -1.9296875, -1.853515625, -1.77734375, -1.701171875, -1.625, -1.548828125, -1.47265625, -1.396484375, -1.3203125, -1.244140625, -1.16796875, -1.091796875, -1.015625, -0.939453125, -0.86328125, -0.787109375, -0.7109375, -0.634765625, -0.55859375, -0.482421875, -0.40625, -0.330078125, -0.25390625, -0.177734375, -0.1015625, -0.025390625, 0.05078125, 0.126953125, 0.203125, 0.279296875, 0.35546875, 0.431640625, 0.5078125, 0.583984375, 0.66015625, 0.736328125, 0.8125, 0.888671875, 0.96484375, 1.041015625, 1.1171875, 1.193359375, 1.26953125, 1.345703125, 1.421875, 1.498046875, 1.57421875, 1.650390625, 1.7265625, 1.802734375, 1.87890625, 1.955078125, 2.03125, 2.107421875, 2.18359375, 2.259765625, 2.3359375, 2.412109375, 2.48828125, 2.564453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 5.0, 9.0, 9.0, 13.0, 14.0, 18.0, 26.0, 33.0, 31.0, 31.0, 38.0, 49.0, 40.0, 33.0, 44.0, 37.0, 53.0, 52.0, 49.0, 53.0, 40.0, 41.0, 35.0, 29.0, 25.0, 34.0, 23.0, 16.0, 28.0, 17.0, 20.0, 10.0, 8.0, 8.0, 2.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7392578125, -0.717437744140625, -0.69561767578125, -0.673797607421875, -0.6519775390625, -0.630157470703125, -0.60833740234375, -0.586517333984375, -0.564697265625, -0.542877197265625, -0.52105712890625, -0.499237060546875, -0.4774169921875, -0.455596923828125, -0.43377685546875, -0.411956787109375, -0.39013671875, -0.368316650390625, -0.34649658203125, -0.324676513671875, -0.3028564453125, -0.281036376953125, -0.25921630859375, -0.237396240234375, -0.215576171875, -0.193756103515625, -0.17193603515625, -0.150115966796875, -0.1282958984375, -0.106475830078125, -0.08465576171875, -0.062835693359375, -0.041015625, -0.019195556640625, 0.00262451171875, 0.024444580078125, 0.0462646484375, 0.068084716796875, 0.08990478515625, 0.111724853515625, 0.133544921875, 0.155364990234375, 0.17718505859375, 0.199005126953125, 0.2208251953125, 0.242645263671875, 0.26446533203125, 0.286285400390625, 0.30810546875, 0.329925537109375, 0.35174560546875, 0.373565673828125, 0.3953857421875, 0.417205810546875, 0.43902587890625, 0.460845947265625, 0.482666015625, 0.504486083984375, 0.52630615234375, 0.548126220703125, 0.5699462890625, 0.591766357421875, 0.61358642578125, 0.635406494140625, 0.6572265625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 4.0, 10.0, 12.0, 21.0, 10.0, 29.0, 24.0, 21.0, 33.0, 32.0, 51.0, 46.0, 63.0, 63.0, 49.0, 64.0, 59.0, 64.0, 48.0, 40.0, 39.0, 32.0, 33.0, 31.0, 22.0, 15.0, 15.0, 16.0, 10.0, 10.0, 9.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.004897117614746, -7.771902561187744, -7.538908004760742, -7.305913925170898, -7.0729193687438965, -6.8399248123168945, -6.606930255889893, -6.373935699462891, -6.140941619873047, -5.907947063446045, -5.674952507019043, -5.441958427429199, -5.208963871002197, -4.975969314575195, -4.742974758148193, -4.509980201721191, -4.276986122131348, -4.043991565704346, -3.810997247695923, -3.578002691268921, -3.345008373260498, -3.112013816833496, -2.879019260406494, -2.6460249423980713, -2.4130301475524902, -2.1800355911254883, -1.9470412731170654, -1.7140467166900635, -1.4810523986816406, -1.2480578422546387, -1.0150634050369263, -0.7820689678192139, -0.549074649810791, -0.3160802125930786, -0.08308574557304382, 0.14990872144699097, 0.38290315866470337, 0.6158976554870605, 0.848892092704773, 1.0818865299224854, 1.3148809671401978, 1.5478754043579102, 1.7808698415756226, 2.013864278793335, 2.246858835220337, 2.4798531532287598, 2.7128477096557617, 2.9458422660827637, 3.1788365840911865, 3.4118311405181885, 3.6448254585266113, 3.8778200149536133, 4.110814571380615, 4.343809127807617, 4.576803207397461, 4.809797763824463, 5.042792320251465, 5.275786876678467, 5.508781433105469, 5.7417755126953125, 5.9747700691223145, 6.207764625549316, 6.440759181976318, 6.67375373840332, 6.906747817993164]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 9.0, 7.0, 4.0, 8.0, 10.0, 9.0, 11.0, 21.0, 26.0, 11.0, 25.0, 30.0, 14.0, 36.0, 40.0, 26.0, 32.0, 40.0, 45.0, 44.0, 46.0, 40.0, 42.0, 37.0, 37.0, 38.0, 34.0, 32.0, 30.0, 29.0, 27.0, 21.0, 25.0, 20.0, 17.0, 11.0, 14.0, 12.0, 8.0, 7.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.913154125213623, -5.722644329071045, -5.532134532928467, -5.341624736785889, -5.1511149406433105, -4.960605144500732, -4.7700958251953125, -4.579586029052734, -4.389076232910156, -4.198566436767578, -4.008056640625, -3.817546844482422, -3.6270370483398438, -3.4365272521972656, -3.2460176944732666, -3.0555078983306885, -2.8649978637695312, -2.674488067626953, -2.483978271484375, -2.293468475341797, -2.1029586791992188, -1.9124490022659302, -1.7219393253326416, -1.5314295291900635, -1.3409197330474854, -1.1504099369049072, -0.9599002003669739, -0.7693904638290405, -0.5788806676864624, -0.3883708715438843, -0.1978611946105957, -0.007351398468017578, 0.18315839767456055, 0.3736681640148163, 0.564177930355072, 0.7546876668930054, 0.9451974630355835, 1.1357072591781616, 1.3262169361114502, 1.5167267322540283, 1.7072365283966064, 1.8977463245391846, 2.0882561206817627, 2.2787656784057617, 2.46927547454834, 2.659785270690918, 2.850295066833496, 3.040804862976074, 3.2313146591186523, 3.4218244552612305, 3.6123342514038086, 3.8028440475463867, 3.993353843688965, 4.183863639831543, 4.374373435974121, 4.564883232116699, 4.755393028259277, 4.9459028244018555, 5.136412620544434, 5.326922416687012, 5.51743221282959, 5.707942008972168, 5.898451805114746, 6.088961601257324, 6.279470920562744]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 10.0, 7.0, 13.0, 22.0, 27.0, 43.0, 52.0, 73.0, 130.0, 210.0, 277.0, 441.0, 651.0, 986.0, 1597.0, 2471.0, 4355.0, 7503.0, 14542.0, 31165.0, 82729.0, 258456.0, 791670.0, 1425750.0, 1015722.0, 363904.0, 112274.0, 40093.0, 17417.0, 8874.0, 4949.0, 2906.0, 1742.0, 1085.0, 770.0, 455.0, 307.0, 190.0, 130.0, 92.0, 64.0, 45.0, 27.0, 20.0, 10.0, 9.0, 9.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3125, -9.986572265625, -9.66064453125, -9.334716796875, -9.0087890625, -8.682861328125, -8.35693359375, -8.031005859375, -7.705078125, -7.379150390625, -7.05322265625, -6.727294921875, -6.4013671875, -6.075439453125, -5.74951171875, -5.423583984375, -5.09765625, -4.771728515625, -4.44580078125, -4.119873046875, -3.7939453125, -3.468017578125, -3.14208984375, -2.816162109375, -2.490234375, -2.164306640625, -1.83837890625, -1.512451171875, -1.1865234375, -0.860595703125, -0.53466796875, -0.208740234375, 0.1171875, 0.443115234375, 0.76904296875, 1.094970703125, 1.4208984375, 1.746826171875, 2.07275390625, 2.398681640625, 2.724609375, 3.050537109375, 3.37646484375, 3.702392578125, 4.0283203125, 4.354248046875, 4.68017578125, 5.006103515625, 5.33203125, 5.657958984375, 5.98388671875, 6.309814453125, 6.6357421875, 6.961669921875, 7.28759765625, 7.613525390625, 7.939453125, 8.265380859375, 8.59130859375, 8.917236328125, 9.2431640625, 9.569091796875, 9.89501953125, 10.220947265625, 10.546875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 7.0, 3.0, 7.0, 8.0, 3.0, 14.0, 10.0, 17.0, 18.0, 17.0, 28.0, 25.0, 19.0, 27.0, 30.0, 33.0, 32.0, 35.0, 36.0, 39.0, 43.0, 39.0, 47.0, 48.0, 36.0, 34.0, 35.0, 36.0, 35.0, 36.0, 23.0, 27.0, 29.0, 15.0, 23.0, 16.0, 9.0, 12.0, 11.0, 7.0, 9.0, 2.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.16796875, -5.00006103515625, -4.8321533203125, -4.66424560546875, -4.496337890625, -4.32843017578125, -4.1605224609375, -3.99261474609375, -3.82470703125, -3.65679931640625, -3.4888916015625, -3.32098388671875, -3.153076171875, -2.98516845703125, -2.8172607421875, -2.64935302734375, -2.4814453125, -2.31353759765625, -2.1456298828125, -1.97772216796875, -1.809814453125, -1.64190673828125, -1.4739990234375, -1.30609130859375, -1.13818359375, -0.97027587890625, -0.8023681640625, -0.63446044921875, -0.466552734375, -0.29864501953125, -0.1307373046875, 0.03717041015625, 0.205078125, 0.37298583984375, 0.5408935546875, 0.70880126953125, 0.876708984375, 1.04461669921875, 1.2125244140625, 1.38043212890625, 1.54833984375, 1.71624755859375, 1.8841552734375, 2.05206298828125, 2.219970703125, 2.38787841796875, 2.5557861328125, 2.72369384765625, 2.8916015625, 3.05950927734375, 3.2274169921875, 3.39532470703125, 3.563232421875, 3.73114013671875, 3.8990478515625, 4.06695556640625, 4.23486328125, 4.40277099609375, 4.5706787109375, 4.73858642578125, 4.906494140625, 5.07440185546875, 5.2423095703125, 5.41021728515625, 5.578125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 4.0, 6.0, 5.0, 9.0, 14.0, 21.0, 36.0, 51.0, 68.0, 113.0, 151.0, 205.0, 352.0, 520.0, 779.0, 1213.0, 1895.0, 2962.0, 5102.0, 8538.0, 15261.0, 28259.0, 58779.0, 136226.0, 342935.0, 798477.0, 1210369.0, 888020.0, 397845.0, 157793.0, 66443.0, 31550.0, 16445.0, 9405.0, 5364.0, 3346.0, 2053.0, 1311.0, 881.0, 525.0, 341.0, 212.0, 136.0, 97.0, 58.0, 36.0, 25.0, 24.0, 8.0, 12.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5546875, -10.230712890625, -9.90673828125, -9.582763671875, -9.2587890625, -8.934814453125, -8.61083984375, -8.286865234375, -7.962890625, -7.638916015625, -7.31494140625, -6.990966796875, -6.6669921875, -6.343017578125, -6.01904296875, -5.695068359375, -5.37109375, -5.047119140625, -4.72314453125, -4.399169921875, -4.0751953125, -3.751220703125, -3.42724609375, -3.103271484375, -2.779296875, -2.455322265625, -2.13134765625, -1.807373046875, -1.4833984375, -1.159423828125, -0.83544921875, -0.511474609375, -0.1875, 0.136474609375, 0.46044921875, 0.784423828125, 1.1083984375, 1.432373046875, 1.75634765625, 2.080322265625, 2.404296875, 2.728271484375, 3.05224609375, 3.376220703125, 3.7001953125, 4.024169921875, 4.34814453125, 4.672119140625, 4.99609375, 5.320068359375, 5.64404296875, 5.968017578125, 6.2919921875, 6.615966796875, 6.93994140625, 7.263916015625, 7.587890625, 7.911865234375, 8.23583984375, 8.559814453125, 8.8837890625, 9.207763671875, 9.53173828125, 9.855712890625, 10.1796875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 8.0, 4.0, 5.0, 7.0, 4.0, 7.0, 16.0, 26.0, 31.0, 39.0, 34.0, 55.0, 72.0, 68.0, 95.0, 116.0, 124.0, 166.0, 195.0, 251.0, 222.0, 247.0, 270.0, 262.0, 278.0, 255.0, 202.0, 189.0, 172.0, 132.0, 102.0, 89.0, 80.0, 51.0, 37.0, 35.0, 24.0, 21.0, 25.0, 13.0, 12.0, 9.0, 7.0, 5.0, 2.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.955078125, -2.86834716796875, -2.7816162109375, -2.69488525390625, -2.608154296875, -2.52142333984375, -2.4346923828125, -2.34796142578125, -2.26123046875, -2.17449951171875, -2.0877685546875, -2.00103759765625, -1.914306640625, -1.82757568359375, -1.7408447265625, -1.65411376953125, -1.5673828125, -1.48065185546875, -1.3939208984375, -1.30718994140625, -1.220458984375, -1.13372802734375, -1.0469970703125, -0.96026611328125, -0.87353515625, -0.78680419921875, -0.7000732421875, -0.61334228515625, -0.526611328125, -0.43988037109375, -0.3531494140625, -0.26641845703125, -0.1796875, -0.09295654296875, -0.0062255859375, 0.08050537109375, 0.167236328125, 0.25396728515625, 0.3406982421875, 0.42742919921875, 0.51416015625, 0.60089111328125, 0.6876220703125, 0.77435302734375, 0.861083984375, 0.94781494140625, 1.0345458984375, 1.12127685546875, 1.2080078125, 1.29473876953125, 1.3814697265625, 1.46820068359375, 1.554931640625, 1.64166259765625, 1.7283935546875, 1.81512451171875, 1.90185546875, 1.98858642578125, 2.0753173828125, 2.16204833984375, 2.248779296875, 2.33551025390625, 2.4222412109375, 2.50897216796875, 2.595703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 5.0, 7.0, 12.0, 10.0, 18.0, 12.0, 16.0, 28.0, 29.0, 37.0, 36.0, 44.0, 34.0, 67.0, 43.0, 58.0, 50.0, 48.0, 54.0, 55.0, 46.0, 44.0, 42.0, 28.0, 38.0, 23.0, 27.0, 11.0, 14.0, 11.0, 13.0, 3.0, 8.0, 2.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.565197944641113, -7.3334784507751465, -7.1017584800720215, -6.870038986206055, -6.638319492340088, -6.406599998474121, -6.174880027770996, -5.943160533905029, -5.7114410400390625, -5.479721546173096, -5.248001575469971, -5.016282081604004, -4.784562587738037, -4.55284309387207, -4.321123123168945, -4.0894036293029785, -3.8576836585998535, -3.6259639263153076, -3.394244432449341, -3.162524700164795, -2.930805206298828, -2.6990854740142822, -2.4673657417297363, -2.2356462478637695, -2.0039265155792236, -1.7722069025039673, -1.540487289428711, -1.308767557144165, -1.0770479440689087, -0.8453283309936523, -0.6136085987091064, -0.3818889856338501, -0.15016937255859375, 0.08155027031898499, 0.3132699131965637, 0.5449895858764648, 0.7767091989517212, 1.0084288120269775, 1.2401485443115234, 1.4718681573867798, 1.7035877704620361, 1.9353073835372925, 2.167026996612549, 2.3987467288970947, 2.6304664611816406, 2.8621859550476074, 3.0939056873321533, 3.325625419616699, 3.557344913482666, 3.789064645767212, 4.020784378051758, 4.252503871917725, 4.484223365783691, 4.715943336486816, 4.947662830352783, 5.17938232421875, 5.411102294921875, 5.642821788787842, 5.874541759490967, 6.106261253356934, 6.3379807472229, 6.569700241088867, 6.801420211791992, 7.033139705657959, 7.264859199523926]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 2.0, 10.0, 7.0, 14.0, 10.0, 14.0, 18.0, 18.0, 17.0, 23.0, 32.0, 23.0, 27.0, 39.0, 37.0, 45.0, 27.0, 46.0, 39.0, 48.0, 37.0, 39.0, 36.0, 39.0, 33.0, 43.0, 35.0, 29.0, 21.0, 26.0, 32.0, 18.0, 22.0, 17.0, 12.0, 13.0, 13.0, 9.0, 4.0, 6.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.340610504150391, -6.140810966491699, -5.941011905670166, -5.741212844848633, -5.541413307189941, -5.34161376953125, -5.141814708709717, -4.942015647888184, -4.742216110229492, -4.542416572570801, -4.342617511749268, -4.142818450927734, -3.943018913269043, -3.7432196140289307, -3.5434203147888184, -3.343621015548706, -3.1438217163085938, -2.9440224170684814, -2.744223117828369, -2.544423818588257, -2.3446245193481445, -2.1448252201080322, -1.94502592086792, -1.7452266216278076, -1.5454273223876953, -1.345628023147583, -1.1458287239074707, -0.9460294246673584, -0.7462301254272461, -0.5464308261871338, -0.3466315269470215, -0.14683222770690918, 0.05296659469604492, 0.2527658939361572, 0.45256519317626953, 0.6523644924163818, 0.8521637916564941, 1.0519630908966064, 1.2517623901367188, 1.451561689376831, 1.6513609886169434, 1.8511602878570557, 2.050959587097168, 2.2507588863372803, 2.4505581855773926, 2.650357484817505, 2.850156784057617, 3.0499560832977295, 3.249755382537842, 3.449554681777954, 3.6493539810180664, 3.8491532802581787, 4.048952579498291, 4.248751640319824, 4.448551177978516, 4.648350715637207, 4.84814977645874, 5.047948837280273, 5.247748374938965, 5.447547912597656, 5.6473469734191895, 5.847146034240723, 6.046945571899414, 6.2467451095581055, 6.446544170379639]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 6.0, 25.0, 27.0, 55.0, 66.0, 127.0, 182.0, 309.0, 471.0, 732.0, 1168.0, 2015.0, 3378.0, 5728.0, 9673.0, 16685.0, 30199.0, 54894.0, 98248.0, 160751.0, 209136.0, 182845.0, 117994.0, 66978.0, 37209.0, 20693.0, 11693.0, 6771.0, 4116.0, 2433.0, 1477.0, 905.0, 559.0, 343.0, 216.0, 158.0, 99.0, 63.0, 32.0, 27.0, 18.0, 11.0, 10.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.2294921875, -1.191864013671875, -1.15423583984375, -1.116607666015625, -1.0789794921875, -1.041351318359375, -1.00372314453125, -0.966094970703125, -0.928466796875, -0.890838623046875, -0.85321044921875, -0.815582275390625, -0.7779541015625, -0.740325927734375, -0.70269775390625, -0.665069580078125, -0.62744140625, -0.589813232421875, -0.55218505859375, -0.514556884765625, -0.4769287109375, -0.439300537109375, -0.40167236328125, -0.364044189453125, -0.326416015625, -0.288787841796875, -0.25115966796875, -0.213531494140625, -0.1759033203125, -0.138275146484375, -0.10064697265625, -0.063018798828125, -0.025390625, 0.012237548828125, 0.04986572265625, 0.087493896484375, 0.1251220703125, 0.162750244140625, 0.20037841796875, 0.238006591796875, 0.275634765625, 0.313262939453125, 0.35089111328125, 0.388519287109375, 0.4261474609375, 0.463775634765625, 0.50140380859375, 0.539031982421875, 0.57666015625, 0.614288330078125, 0.65191650390625, 0.689544677734375, 0.7271728515625, 0.764801025390625, 0.80242919921875, 0.840057373046875, 0.877685546875, 0.915313720703125, 0.95294189453125, 0.990570068359375, 1.0281982421875, 1.065826416015625, 1.10345458984375, 1.141082763671875, 1.1787109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 9.0, 11.0, 8.0, 11.0, 13.0, 25.0, 25.0, 22.0, 25.0, 30.0, 33.0, 36.0, 40.0, 36.0, 36.0, 36.0, 46.0, 42.0, 43.0, 43.0, 31.0, 50.0, 44.0, 48.0, 25.0, 24.0, 31.0, 25.0, 28.0, 26.0, 18.0, 14.0, 12.0, 9.0, 8.0, 9.0, 12.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4453125, -7.22003173828125, -6.9947509765625, -6.76947021484375, -6.544189453125, -6.31890869140625, -6.0936279296875, -5.86834716796875, -5.64306640625, -5.41778564453125, -5.1925048828125, -4.96722412109375, -4.741943359375, -4.51666259765625, -4.2913818359375, -4.06610107421875, -3.8408203125, -3.61553955078125, -3.3902587890625, -3.16497802734375, -2.939697265625, -2.71441650390625, -2.4891357421875, -2.26385498046875, -2.03857421875, -1.81329345703125, -1.5880126953125, -1.36273193359375, -1.137451171875, -0.91217041015625, -0.6868896484375, -0.46160888671875, -0.236328125, -0.01104736328125, 0.2142333984375, 0.43951416015625, 0.664794921875, 0.89007568359375, 1.1153564453125, 1.34063720703125, 1.56591796875, 1.79119873046875, 2.0164794921875, 2.24176025390625, 2.467041015625, 2.69232177734375, 2.9176025390625, 3.14288330078125, 3.3681640625, 3.59344482421875, 3.8187255859375, 4.04400634765625, 4.269287109375, 4.49456787109375, 4.7198486328125, 4.94512939453125, 5.17041015625, 5.39569091796875, 5.6209716796875, 5.84625244140625, 6.071533203125, 6.29681396484375, 6.5220947265625, 6.74737548828125, 6.97265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 8.0, 10.0, 10.0, 11.0, 20.0, 30.0, 67.0, 57.0, 115.0, 156.0, 293.0, 541.0, 987.0, 2007.0, 4414.0, 10706.0, 29323.0, 484606.0, 466766.0, 29128.0, 10668.0, 4479.0, 1936.0, 980.0, 515.0, 255.0, 152.0, 91.0, 70.0, 42.0, 34.0, 15.0, 12.0, 9.0, 12.0, 12.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-5.26953125, -5.11895751953125, -4.9683837890625, -4.81781005859375, -4.667236328125, -4.51666259765625, -4.3660888671875, -4.21551513671875, -4.06494140625, -3.91436767578125, -3.7637939453125, -3.61322021484375, -3.462646484375, -3.31207275390625, -3.1614990234375, -3.01092529296875, -2.8603515625, -2.70977783203125, -2.5592041015625, -2.40863037109375, -2.258056640625, -2.10748291015625, -1.9569091796875, -1.80633544921875, -1.65576171875, -1.50518798828125, -1.3546142578125, -1.20404052734375, -1.053466796875, -0.90289306640625, -0.7523193359375, -0.60174560546875, -0.451171875, -0.30059814453125, -0.1500244140625, 0.00054931640625, 0.151123046875, 0.30169677734375, 0.4522705078125, 0.60284423828125, 0.75341796875, 0.90399169921875, 1.0545654296875, 1.20513916015625, 1.355712890625, 1.50628662109375, 1.6568603515625, 1.80743408203125, 1.9580078125, 2.10858154296875, 2.2591552734375, 2.40972900390625, 2.560302734375, 2.71087646484375, 2.8614501953125, 3.01202392578125, 3.16259765625, 3.31317138671875, 3.4637451171875, 3.61431884765625, 3.764892578125, 3.91546630859375, 4.0660400390625, 4.21661376953125, 4.3671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 11.0, 16.0, 10.0, 11.0, 8.0, 12.0, 14.0, 24.0, 23.0, 20.0, 33.0, 27.0, 31.0, 32.0, 36.0, 29.0, 37.0, 49.0, 44.0, 38.0, 47.0, 34.0, 46.0, 41.0, 31.0, 32.0, 37.0, 26.0, 23.0, 19.0, 16.0, 26.0, 17.0, 12.0, 16.0, 11.0, 11.0, 5.0, 9.0, 10.0, 6.0, 3.0, 1.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.489990234375, -4.34326171875, -4.196533203125, -4.0498046875, -3.903076171875, -3.75634765625, -3.609619140625, -3.462890625, -3.316162109375, -3.16943359375, -3.022705078125, -2.8759765625, -2.729248046875, -2.58251953125, -2.435791015625, -2.2890625, -2.142333984375, -1.99560546875, -1.848876953125, -1.7021484375, -1.555419921875, -1.40869140625, -1.261962890625, -1.115234375, -0.968505859375, -0.82177734375, -0.675048828125, -0.5283203125, -0.381591796875, -0.23486328125, -0.088134765625, 0.05859375, 0.205322265625, 0.35205078125, 0.498779296875, 0.6455078125, 0.792236328125, 0.93896484375, 1.085693359375, 1.232421875, 1.379150390625, 1.52587890625, 1.672607421875, 1.8193359375, 1.966064453125, 2.11279296875, 2.259521484375, 2.40625, 2.552978515625, 2.69970703125, 2.846435546875, 2.9931640625, 3.139892578125, 3.28662109375, 3.433349609375, 3.580078125, 3.726806640625, 3.87353515625, 4.020263671875, 4.1669921875, 4.313720703125, 4.46044921875, 4.607177734375, 4.75390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 12.0, 14.0, 14.0, 17.0, 35.0, 42.0, 45.0, 69.0, 100.0, 142.0, 240.0, 302.0, 510.0, 702.0, 1011.0, 1617.0, 2620.0, 4207.0, 7038.0, 12612.0, 24124.0, 92428.0, 795075.0, 57054.0, 20586.0, 10877.0, 6332.0, 3812.0, 2390.0, 1472.0, 1007.0, 632.0, 404.0, 267.0, 232.0, 152.0, 98.0, 72.0, 58.0, 35.0, 32.0, 17.0, 18.0, 12.0, 8.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34912109375, -0.3368263244628906, -0.32453155517578125, -0.3122367858886719, -0.2999420166015625, -0.2876472473144531, -0.27535247802734375, -0.2630577087402344, -0.250762939453125, -0.23846817016601562, -0.22617340087890625, -0.21387863159179688, -0.2015838623046875, -0.18928909301757812, -0.17699432373046875, -0.16469955444335938, -0.15240478515625, -0.14011001586914062, -0.12781524658203125, -0.11552047729492188, -0.1032257080078125, -0.09093093872070312, -0.07863616943359375, -0.06634140014648438, -0.054046630859375, -0.041751861572265625, -0.02945709228515625, -0.017162322998046875, -0.0048675537109375, 0.007427215576171875, 0.01972198486328125, 0.032016754150390625, 0.0443115234375, 0.056606292724609375, 0.06890106201171875, 0.08119583129882812, 0.0934906005859375, 0.10578536987304688, 0.11808013916015625, 0.13037490844726562, 0.142669677734375, 0.15496444702148438, 0.16725921630859375, 0.17955398559570312, 0.1918487548828125, 0.20414352416992188, 0.21643829345703125, 0.22873306274414062, 0.24102783203125, 0.2533226013183594, 0.26561737060546875, 0.2779121398925781, 0.2902069091796875, 0.3025016784667969, 0.31479644775390625, 0.3270912170410156, 0.339385986328125, 0.3516807556152344, 0.36397552490234375, 0.3762702941894531, 0.3885650634765625, 0.4008598327636719, 0.41315460205078125, 0.4254493713378906, 0.437744140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 9.0, 9.0, 12.0, 19.0, 18.0, 35.0, 34.0, 49.0, 56.0, 56.0, 59.0, 77.0, 66.0, 72.0, 74.0, 55.0, 42.0, 53.0, 41.0, 34.0, 25.0, 21.0, 23.0, 12.0, 7.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0325183868408203e-05, -1.965463161468506e-05, -1.8984079360961914e-05, -1.831352710723877e-05, -1.7642974853515625e-05, -1.697242259979248e-05, -1.6301870346069336e-05, -1.563131809234619e-05, -1.4960765838623047e-05, -1.4290213584899902e-05, -1.3619661331176758e-05, -1.2949109077453613e-05, -1.2278556823730469e-05, -1.1608004570007324e-05, -1.093745231628418e-05, -1.0266900062561035e-05, -9.59634780883789e-06, -8.925795555114746e-06, -8.255243301391602e-06, -7.584691047668457e-06, -6.9141387939453125e-06, -6.243586540222168e-06, -5.5730342864990234e-06, -4.902482032775879e-06, -4.231929779052734e-06, -3.56137752532959e-06, -2.8908252716064453e-06, -2.2202730178833008e-06, -1.5497207641601562e-06, -8.791685104370117e-07, -2.086162567138672e-07, 4.6193599700927734e-07, 1.1324882507324219e-06, 1.8030405044555664e-06, 2.473592758178711e-06, 3.1441450119018555e-06, 3.814697265625e-06, 4.4852495193481445e-06, 5.155801773071289e-06, 5.826354026794434e-06, 6.496906280517578e-06, 7.167458534240723e-06, 7.838010787963867e-06, 8.508563041687012e-06, 9.179115295410156e-06, 9.8496675491333e-06, 1.0520219802856445e-05, 1.119077205657959e-05, 1.1861324310302734e-05, 1.2531876564025879e-05, 1.3202428817749023e-05, 1.3872981071472168e-05, 1.4543533325195312e-05, 1.5214085578918457e-05, 1.58846378326416e-05, 1.6555190086364746e-05, 1.722574234008789e-05, 1.7896294593811035e-05, 1.856684684753418e-05, 1.9237399101257324e-05, 1.990795135498047e-05, 2.0578503608703613e-05, 2.1249055862426758e-05, 2.1919608116149902e-05, 2.2590160369873047e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 10.0, 16.0, 31.0, 34.0, 45.0, 78.0, 101.0, 134.0, 220.0, 307.0, 514.0, 821.0, 1201.0, 1976.0, 3138.0, 5280.0, 9168.0, 16091.0, 28984.0, 52087.0, 93472.0, 159221.0, 220473.0, 188386.0, 116617.0, 64806.0, 36158.0, 20554.0, 11619.0, 6626.0, 3970.0, 2284.0, 1447.0, 926.0, 590.0, 368.0, 260.0, 160.0, 116.0, 75.0, 61.0, 44.0, 17.0, 27.0, 10.0, 6.0, 3.0, 5.0, 3.0, 1.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0], "bins": [-0.42822265625, -0.4142723083496094, -0.40032196044921875, -0.3863716125488281, -0.3724212646484375, -0.3584709167480469, -0.34452056884765625, -0.3305702209472656, -0.316619873046875, -0.3026695251464844, -0.28871917724609375, -0.2747688293457031, -0.2608184814453125, -0.24686813354492188, -0.23291778564453125, -0.21896743774414062, -0.20501708984375, -0.19106674194335938, -0.17711639404296875, -0.16316604614257812, -0.1492156982421875, -0.13526535034179688, -0.12131500244140625, -0.10736465454101562, -0.093414306640625, -0.07946395874023438, -0.06551361083984375, -0.051563262939453125, -0.0376129150390625, -0.023662567138671875, -0.00971221923828125, 0.004238128662109375, 0.0181884765625, 0.032138824462890625, 0.04608917236328125, 0.060039520263671875, 0.0739898681640625, 0.08794021606445312, 0.10189056396484375, 0.11584091186523438, 0.129791259765625, 0.14374160766601562, 0.15769195556640625, 0.17164230346679688, 0.1855926513671875, 0.19954299926757812, 0.21349334716796875, 0.22744369506835938, 0.24139404296875, 0.2553443908691406, 0.26929473876953125, 0.2832450866699219, 0.2971954345703125, 0.3111457824707031, 0.32509613037109375, 0.3390464782714844, 0.352996826171875, 0.3669471740722656, 0.38089752197265625, 0.3948478698730469, 0.4087982177734375, 0.4227485656738281, 0.43669891357421875, 0.4506492614746094, 0.464599609375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 8.0, 11.0, 17.0, 15.0, 13.0, 18.0, 24.0, 27.0, 34.0, 29.0, 33.0, 48.0, 38.0, 48.0, 45.0, 50.0, 71.0, 46.0, 55.0, 44.0, 42.0, 24.0, 43.0, 33.0, 31.0, 19.0, 16.0, 20.0, 12.0, 17.0, 15.0, 10.0, 14.0, 7.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.14478683471679688, -0.13979339599609375, -0.13479995727539062, -0.1298065185546875, -0.12481307983398438, -0.11981964111328125, -0.11482620239257812, -0.109832763671875, -0.10483932495117188, -0.09984588623046875, -0.09485244750976562, -0.0898590087890625, -0.08486557006835938, -0.07987213134765625, -0.07487869262695312, -0.06988525390625, -0.06489181518554688, -0.05989837646484375, -0.054904937744140625, -0.0499114990234375, -0.044918060302734375, -0.03992462158203125, -0.034931182861328125, -0.029937744140625, -0.024944305419921875, -0.01995086669921875, -0.014957427978515625, -0.0099639892578125, -0.004970550537109375, 2.288818359375e-05, 0.005016326904296875, 0.010009765625, 0.015003204345703125, 0.01999664306640625, 0.024990081787109375, 0.0299835205078125, 0.034976959228515625, 0.03997039794921875, 0.044963836669921875, 0.049957275390625, 0.054950714111328125, 0.05994415283203125, 0.06493759155273438, 0.0699310302734375, 0.07492446899414062, 0.07991790771484375, 0.08491134643554688, 0.08990478515625, 0.09489822387695312, 0.09989166259765625, 0.10488510131835938, 0.1098785400390625, 0.11487197875976562, 0.11986541748046875, 0.12485885620117188, 0.129852294921875, 0.13484573364257812, 0.13983917236328125, 0.14483261108398438, 0.1498260498046875, 0.15481948852539062, 0.15981292724609375, 0.16480636596679688, 0.1697998046875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 9.0, 8.0, 10.0, 15.0, 14.0, 21.0, 19.0, 30.0, 33.0, 37.0, 44.0, 45.0, 51.0, 61.0, 46.0, 58.0, 46.0, 58.0, 56.0, 37.0, 50.0, 41.0, 31.0, 39.0, 18.0, 31.0, 13.0, 13.0, 11.0, 13.0, 7.0, 6.0, 2.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.655972957611084, -7.4220356941223145, -7.188097953796387, -6.954160690307617, -6.720223426818848, -6.486286163330078, -6.252348899841309, -6.018411159515381, -5.784473896026611, -5.550536632537842, -5.316598892211914, -5.0826616287231445, -4.848724365234375, -4.6147871017456055, -4.380849838256836, -4.146912097930908, -3.9129748344421387, -3.679037570953369, -3.4451000690460205, -3.211162567138672, -2.9772253036499023, -2.743288040161133, -2.509350538253784, -2.2754130363464355, -2.041475772857666, -1.807538390159607, -1.5736010074615479, -1.3396636247634888, -1.1057262420654297, -0.8717888593673706, -0.6378514766693115, -0.40391409397125244, -0.16997671127319336, 0.06396067142486572, 0.2978980541229248, 0.5318354368209839, 0.765772819519043, 0.999710202217102, 1.2336475849151611, 1.4675849676132202, 1.7015223503112793, 1.9354597330093384, 2.1693971157073975, 2.403334617614746, 2.6372718811035156, 2.871209144592285, 3.105146646499634, 3.3390841484069824, 3.573021411895752, 3.8069586753845215, 4.040896415710449, 4.274833679199219, 4.508770942687988, 4.742708206176758, 4.976645469665527, 5.210583209991455, 5.444520473480225, 5.678457736968994, 5.912395477294922, 6.146332740783691, 6.380270004272461, 6.6142072677612305, 6.84814453125, 7.082082271575928, 7.316019535064697]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 2.0, 9.0, 8.0, 12.0, 11.0, 16.0, 19.0, 18.0, 19.0, 18.0, 37.0, 23.0, 25.0, 40.0, 43.0, 38.0, 30.0, 47.0, 38.0, 44.0, 41.0, 35.0, 44.0, 35.0, 33.0, 43.0, 36.0, 21.0, 28.0, 28.0, 27.0, 18.0, 23.0, 14.0, 14.0, 14.0, 14.0, 6.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.365640640258789, -6.165650844573975, -5.96566104888916, -5.765671730041504, -5.5656819343566895, -5.365692138671875, -5.165702819824219, -4.965713024139404, -4.76572322845459, -4.565733432769775, -4.365743637084961, -4.165754318237305, -3.9657645225524902, -3.765774726867676, -3.5657851696014404, -3.365795612335205, -3.1658058166503906, -2.965816020965576, -2.765826463699341, -2.5658369064331055, -2.365847110748291, -2.1658573150634766, -1.9658677577972412, -1.7658780813217163, -1.5658884048461914, -1.3658987283706665, -1.1659090518951416, -0.9659193754196167, -0.7659296989440918, -0.5659400224685669, -0.365950345993042, -0.1659606695175171, 0.034029483795166016, 0.23401916027069092, 0.4340088367462158, 0.6339985132217407, 0.8339881896972656, 1.0339778661727905, 1.2339675426483154, 1.4339572191238403, 1.6339468955993652, 1.8339365720748901, 2.033926248550415, 2.2339158058166504, 2.433905601501465, 2.6338953971862793, 2.8338849544525146, 3.03387451171875, 3.2338643074035645, 3.433854103088379, 3.6338436603546143, 3.8338332176208496, 4.033823013305664, 4.2338128089904785, 4.433802604675293, 4.633791923522949, 4.833781719207764, 5.033771514892578, 5.233760833740234, 5.433750629425049, 5.633740425109863, 5.833730220794678, 6.033720016479492, 6.233709335327148, 6.433699131011963]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 9.0, 14.0, 23.0, 41.0, 48.0, 83.0, 121.0, 197.0, 333.0, 499.0, 803.0, 1470.0, 2439.0, 4220.0, 7282.0, 12858.0, 22810.0, 40422.0, 71306.0, 114391.0, 160266.0, 179872.0, 158261.0, 111238.0, 68506.0, 39452.0, 22150.0, 12323.0, 7143.0, 4049.0, 2328.0, 1388.0, 843.0, 509.0, 316.0, 207.0, 124.0, 75.0, 47.0, 32.0, 13.0, 14.0, 11.0, 4.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.2890625, -5.13104248046875, -4.9730224609375, -4.81500244140625, -4.656982421875, -4.49896240234375, -4.3409423828125, -4.18292236328125, -4.02490234375, -3.86688232421875, -3.7088623046875, -3.55084228515625, -3.392822265625, -3.23480224609375, -3.0767822265625, -2.91876220703125, -2.7607421875, -2.60272216796875, -2.4447021484375, -2.28668212890625, -2.128662109375, -1.97064208984375, -1.8126220703125, -1.65460205078125, -1.49658203125, -1.33856201171875, -1.1805419921875, -1.02252197265625, -0.864501953125, -0.70648193359375, -0.5484619140625, -0.39044189453125, -0.232421875, -0.07440185546875, 0.0836181640625, 0.24163818359375, 0.399658203125, 0.55767822265625, 0.7156982421875, 0.87371826171875, 1.03173828125, 1.18975830078125, 1.3477783203125, 1.50579833984375, 1.663818359375, 1.82183837890625, 1.9798583984375, 2.13787841796875, 2.2958984375, 2.45391845703125, 2.6119384765625, 2.76995849609375, 2.927978515625, 3.08599853515625, 3.2440185546875, 3.40203857421875, 3.56005859375, 3.71807861328125, 3.8760986328125, 4.03411865234375, 4.192138671875, 4.35015869140625, 4.5081787109375, 4.66619873046875, 4.82421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 7.0, 3.0, 11.0, 3.0, 8.0, 5.0, 11.0, 14.0, 20.0, 14.0, 20.0, 17.0, 30.0, 20.0, 26.0, 26.0, 34.0, 34.0, 35.0, 39.0, 42.0, 45.0, 39.0, 46.0, 33.0, 38.0, 39.0, 41.0, 35.0, 30.0, 32.0, 20.0, 27.0, 25.0, 24.0, 15.0, 17.0, 16.0, 10.0, 8.0, 11.0, 11.0, 13.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.3046875, -6.10711669921875, -5.9095458984375, -5.71197509765625, -5.514404296875, -5.31683349609375, -5.1192626953125, -4.92169189453125, -4.72412109375, -4.52655029296875, -4.3289794921875, -4.13140869140625, -3.933837890625, -3.73626708984375, -3.5386962890625, -3.34112548828125, -3.1435546875, -2.94598388671875, -2.7484130859375, -2.55084228515625, -2.353271484375, -2.15570068359375, -1.9581298828125, -1.76055908203125, -1.56298828125, -1.36541748046875, -1.1678466796875, -0.97027587890625, -0.772705078125, -0.57513427734375, -0.3775634765625, -0.17999267578125, 0.017578125, 0.21514892578125, 0.4127197265625, 0.61029052734375, 0.807861328125, 1.00543212890625, 1.2030029296875, 1.40057373046875, 1.59814453125, 1.79571533203125, 1.9932861328125, 2.19085693359375, 2.388427734375, 2.58599853515625, 2.7835693359375, 2.98114013671875, 3.1787109375, 3.37628173828125, 3.5738525390625, 3.77142333984375, 3.968994140625, 4.16656494140625, 4.3641357421875, 4.56170654296875, 4.75927734375, 4.95684814453125, 5.1544189453125, 5.35198974609375, 5.549560546875, 5.74713134765625, 5.9447021484375, 6.14227294921875, 6.33984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 15.0, 17.0, 30.0, 50.0, 66.0, 140.0, 191.0, 372.0, 594.0, 1006.0, 1677.0, 2784.0, 4845.0, 8309.0, 13921.0, 24614.0, 41416.0, 68573.0, 108437.0, 148394.0, 168742.0, 153599.0, 115258.0, 75415.0, 45669.0, 26632.0, 15659.0, 9015.0, 5318.0, 3108.0, 1907.0, 1129.0, 655.0, 415.0, 223.0, 145.0, 93.0, 53.0, 35.0, 14.0, 10.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.34478759765625, -5.1856689453125, -5.02655029296875, -4.867431640625, -4.70831298828125, -4.5491943359375, -4.39007568359375, -4.23095703125, -4.07183837890625, -3.9127197265625, -3.75360107421875, -3.594482421875, -3.43536376953125, -3.2762451171875, -3.11712646484375, -2.9580078125, -2.79888916015625, -2.6397705078125, -2.48065185546875, -2.321533203125, -2.16241455078125, -2.0032958984375, -1.84417724609375, -1.68505859375, -1.52593994140625, -1.3668212890625, -1.20770263671875, -1.048583984375, -0.88946533203125, -0.7303466796875, -0.57122802734375, -0.412109375, -0.25299072265625, -0.0938720703125, 0.06524658203125, 0.224365234375, 0.38348388671875, 0.5426025390625, 0.70172119140625, 0.86083984375, 1.01995849609375, 1.1790771484375, 1.33819580078125, 1.497314453125, 1.65643310546875, 1.8155517578125, 1.97467041015625, 2.1337890625, 2.29290771484375, 2.4520263671875, 2.61114501953125, 2.770263671875, 2.92938232421875, 3.0885009765625, 3.24761962890625, 3.40673828125, 3.56585693359375, 3.7249755859375, 3.88409423828125, 4.043212890625, 4.20233154296875, 4.3614501953125, 4.52056884765625, 4.6796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 3.0, 3.0, 11.0, 5.0, 10.0, 12.0, 16.0, 13.0, 17.0, 25.0, 17.0, 14.0, 31.0, 22.0, 37.0, 32.0, 31.0, 36.0, 33.0, 28.0, 37.0, 32.0, 39.0, 36.0, 39.0, 41.0, 44.0, 32.0, 31.0, 30.0, 27.0, 33.0, 18.0, 27.0, 17.0, 22.0, 20.0, 14.0, 10.0, 6.0, 8.0, 6.0, 9.0, 8.0, 5.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.9921875, -3.873291015625, -3.75439453125, -3.635498046875, -3.5166015625, -3.397705078125, -3.27880859375, -3.159912109375, -3.041015625, -2.922119140625, -2.80322265625, -2.684326171875, -2.5654296875, -2.446533203125, -2.32763671875, -2.208740234375, -2.08984375, -1.970947265625, -1.85205078125, -1.733154296875, -1.6142578125, -1.495361328125, -1.37646484375, -1.257568359375, -1.138671875, -1.019775390625, -0.90087890625, -0.781982421875, -0.6630859375, -0.544189453125, -0.42529296875, -0.306396484375, -0.1875, -0.068603515625, 0.05029296875, 0.169189453125, 0.2880859375, 0.406982421875, 0.52587890625, 0.644775390625, 0.763671875, 0.882568359375, 1.00146484375, 1.120361328125, 1.2392578125, 1.358154296875, 1.47705078125, 1.595947265625, 1.71484375, 1.833740234375, 1.95263671875, 2.071533203125, 2.1904296875, 2.309326171875, 2.42822265625, 2.547119140625, 2.666015625, 2.784912109375, 2.90380859375, 3.022705078125, 3.1416015625, 3.260498046875, 3.37939453125, 3.498291015625, 3.6171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 6.0, 1.0, 4.0, 14.0, 10.0, 15.0, 31.0, 41.0, 63.0, 98.0, 170.0, 234.0, 372.0, 629.0, 939.0, 1512.0, 2559.0, 4146.0, 7033.0, 12262.0, 21458.0, 39028.0, 68911.0, 114609.0, 164027.0, 187061.0, 160997.0, 110347.0, 65887.0, 36575.0, 20676.0, 11754.0, 6735.0, 3996.0, 2443.0, 1421.0, 887.0, 592.0, 352.0, 216.0, 150.0, 103.0, 80.0, 31.0, 30.0, 21.0, 14.0, 11.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.240234375, -2.1641845703125, -2.088134765625, -2.0120849609375, -1.93603515625, -1.8599853515625, -1.783935546875, -1.7078857421875, -1.6318359375, -1.5557861328125, -1.479736328125, -1.4036865234375, -1.32763671875, -1.2515869140625, -1.175537109375, -1.0994873046875, -1.0234375, -0.9473876953125, -0.871337890625, -0.7952880859375, -0.71923828125, -0.6431884765625, -0.567138671875, -0.4910888671875, -0.4150390625, -0.3389892578125, -0.262939453125, -0.1868896484375, -0.11083984375, -0.0347900390625, 0.041259765625, 0.1173095703125, 0.193359375, 0.2694091796875, 0.345458984375, 0.4215087890625, 0.49755859375, 0.5736083984375, 0.649658203125, 0.7257080078125, 0.8017578125, 0.8778076171875, 0.953857421875, 1.0299072265625, 1.10595703125, 1.1820068359375, 1.258056640625, 1.3341064453125, 1.41015625, 1.4862060546875, 1.562255859375, 1.6383056640625, 1.71435546875, 1.7904052734375, 1.866455078125, 1.9425048828125, 2.0185546875, 2.0946044921875, 2.170654296875, 2.2467041015625, 2.32275390625, 2.3988037109375, 2.474853515625, 2.5509033203125, 2.626953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 11.0, 11.0, 7.0, 21.0, 15.0, 29.0, 30.0, 44.0, 35.0, 63.0, 65.0, 68.0, 70.0, 64.0, 76.0, 64.0, 50.0, 49.0, 43.0, 38.0, 25.0, 32.0, 16.0, 19.0, 12.0, 15.0, 6.0, 5.0, 7.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002079010009765625, -0.00019998103380203247, -0.00019206106662750244, -0.0001841410994529724, -0.00017622113227844238, -0.00016830116510391235, -0.00016038119792938232, -0.0001524612307548523, -0.00014454126358032227, -0.00013662129640579224, -0.0001287013292312622, -0.00012078136205673218, -0.00011286139488220215, -0.00010494142770767212, -9.702146053314209e-05, -8.910149335861206e-05, -8.118152618408203e-05, -7.3261559009552e-05, -6.534159183502197e-05, -5.742162466049194e-05, -4.9501657485961914e-05, -4.1581690311431885e-05, -3.3661723136901855e-05, -2.5741755962371826e-05, -1.7821788787841797e-05, -9.901821613311768e-06, -1.9818544387817383e-06, 5.938112735748291e-06, 1.385807991027832e-05, 2.177804708480835e-05, 2.969801425933838e-05, 3.761798143386841e-05, 4.553794860839844e-05, 5.345791578292847e-05, 6.13778829574585e-05, 6.929785013198853e-05, 7.721781730651855e-05, 8.513778448104858e-05, 9.305775165557861e-05, 0.00010097771883010864, 0.00010889768600463867, 0.0001168176531791687, 0.00012473762035369873, 0.00013265758752822876, 0.0001405775547027588, 0.00014849752187728882, 0.00015641748905181885, 0.00016433745622634888, 0.0001722574234008789, 0.00018017739057540894, 0.00018809735774993896, 0.000196017324924469, 0.00020393729209899902, 0.00021185725927352905, 0.00021977722644805908, 0.0002276971936225891, 0.00023561716079711914, 0.00024353712797164917, 0.0002514570951461792, 0.00025937706232070923, 0.00026729702949523926, 0.0002752169966697693, 0.0002831369638442993, 0.00029105693101882935, 0.0002989768981933594]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 9.0, 16.0, 36.0, 46.0, 46.0, 83.0, 102.0, 155.0, 222.0, 355.0, 491.0, 720.0, 1044.0, 1752.0, 2666.0, 4272.0, 6886.0, 11089.0, 18265.0, 30077.0, 49073.0, 76809.0, 112723.0, 144954.0, 156147.0, 140001.0, 105078.0, 70663.0, 44162.0, 26931.0, 16361.0, 10088.0, 6280.0, 3901.0, 2406.0, 1569.0, 988.0, 673.0, 459.0, 287.0, 215.0, 138.0, 100.0, 61.0, 47.0, 45.0, 22.0, 15.0, 5.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0], "bins": [-2.291015625, -2.222412109375, -2.15380859375, -2.085205078125, -2.0166015625, -1.947998046875, -1.87939453125, -1.810791015625, -1.7421875, -1.673583984375, -1.60498046875, -1.536376953125, -1.4677734375, -1.399169921875, -1.33056640625, -1.261962890625, -1.193359375, -1.124755859375, -1.05615234375, -0.987548828125, -0.9189453125, -0.850341796875, -0.78173828125, -0.713134765625, -0.64453125, -0.575927734375, -0.50732421875, -0.438720703125, -0.3701171875, -0.301513671875, -0.23291015625, -0.164306640625, -0.095703125, -0.027099609375, 0.04150390625, 0.110107421875, 0.1787109375, 0.247314453125, 0.31591796875, 0.384521484375, 0.453125, 0.521728515625, 0.59033203125, 0.658935546875, 0.7275390625, 0.796142578125, 0.86474609375, 0.933349609375, 1.001953125, 1.070556640625, 1.13916015625, 1.207763671875, 1.2763671875, 1.344970703125, 1.41357421875, 1.482177734375, 1.55078125, 1.619384765625, 1.68798828125, 1.756591796875, 1.8251953125, 1.893798828125, 1.96240234375, 2.031005859375, 2.099609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 14.0, 9.0, 15.0, 16.0, 21.0, 21.0, 20.0, 25.0, 34.0, 30.0, 51.0, 32.0, 43.0, 45.0, 44.0, 39.0, 52.0, 43.0, 44.0, 46.0, 35.0, 46.0, 35.0, 27.0, 29.0, 23.0, 28.0, 22.0, 22.0, 15.0, 13.0, 16.0, 6.0, 8.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.72216796875, -0.7002487182617188, -0.6783294677734375, -0.6564102172851562, -0.634490966796875, -0.6125717163085938, -0.5906524658203125, -0.5687332153320312, -0.54681396484375, -0.5248947143554688, -0.5029754638671875, -0.48105621337890625, -0.459136962890625, -0.43721771240234375, -0.4152984619140625, -0.39337921142578125, -0.3714599609375, -0.34954071044921875, -0.3276214599609375, -0.30570220947265625, -0.283782958984375, -0.26186370849609375, -0.2399444580078125, -0.21802520751953125, -0.19610595703125, -0.17418670654296875, -0.1522674560546875, -0.13034820556640625, -0.108428955078125, -0.08650970458984375, -0.0645904541015625, -0.04267120361328125, -0.020751953125, 0.00116729736328125, 0.0230865478515625, 0.04500579833984375, 0.066925048828125, 0.08884429931640625, 0.1107635498046875, 0.13268280029296875, 0.15460205078125, 0.17652130126953125, 0.1984405517578125, 0.22035980224609375, 0.242279052734375, 0.26419830322265625, 0.2861175537109375, 0.30803680419921875, 0.3299560546875, 0.35187530517578125, 0.3737945556640625, 0.39571380615234375, 0.417633056640625, 0.43955230712890625, 0.4614715576171875, 0.48339080810546875, 0.50531005859375, 0.5272293090820312, 0.5491485595703125, 0.5710678100585938, 0.592987060546875, 0.6149063110351562, 0.6368255615234375, 0.6587448120117188, 0.6806640625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 4.0, 14.0, 11.0, 14.0, 13.0, 15.0, 25.0, 26.0, 31.0, 39.0, 47.0, 41.0, 56.0, 61.0, 60.0, 56.0, 52.0, 37.0, 58.0, 55.0, 36.0, 34.0, 33.0, 36.0, 20.0, 27.0, 18.0, 9.0, 16.0, 8.0, 8.0, 7.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.165626525878906, -7.929124355316162, -7.69262170791626, -7.456119537353516, -7.2196173667907715, -6.983115196228027, -6.746612548828125, -6.510110378265381, -6.273608207702637, -6.037106037139893, -5.80060338973999, -5.564101219177246, -5.327599048614502, -5.091096878051758, -4.8545942306518555, -4.618092060089111, -4.381589889526367, -4.145087718963623, -3.9085853099823, -3.6720829010009766, -3.4355807304382324, -3.199078321456909, -2.962575912475586, -2.726073741912842, -2.4895710945129395, -2.253068685531616, -2.016566514968872, -1.7800641059875488, -1.5435619354248047, -1.3070595264434814, -1.0705572366714478, -0.8340549468994141, -0.5975527763366699, -0.36105048656463623, -0.12454816699028015, 0.11195415258407593, 0.3484564423561096, 0.5849587917327881, 0.8214610815048218, 1.0579633712768555, 1.2944656610488892, 1.5309679508209229, 1.7674702405929565, 2.0039725303649902, 2.2404749393463135, 2.4769773483276367, 2.713479518890381, 2.949981689453125, 3.1864840984344482, 3.4229865074157715, 3.6594886779785156, 3.895991086959839, 4.132493495941162, 4.368995666503906, 4.60549783706665, 4.8420000076293945, 5.078502655029297, 5.315004825592041, 5.551507472991943, 5.7880096435546875, 6.024511814117432, 6.261013984680176, 6.497516632080078, 6.734018802642822, 6.970520973205566]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 7.0, 6.0, 4.0, 10.0, 9.0, 9.0, 17.0, 22.0, 15.0, 19.0, 27.0, 24.0, 31.0, 41.0, 41.0, 34.0, 33.0, 25.0, 33.0, 39.0, 50.0, 41.0, 35.0, 28.0, 42.0, 34.0, 31.0, 32.0, 22.0, 28.0, 28.0, 25.0, 23.0, 17.0, 17.0, 19.0, 14.0, 10.0, 13.0, 8.0, 7.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-6.9623284339904785, -6.7615437507629395, -6.5607590675354, -6.359974384307861, -6.159189701080322, -5.958405017852783, -5.757620334625244, -5.556835651397705, -5.356050968170166, -5.155266284942627, -4.954481601715088, -4.753696918487549, -4.55291223526001, -4.352127552032471, -4.151342868804932, -3.9505581855773926, -3.7497737407684326, -3.5489890575408936, -3.3482043743133545, -3.1474196910858154, -2.9466350078582764, -2.7458505630493164, -2.5450658798217773, -2.3442811965942383, -2.143496513366699, -1.9427118301391602, -1.741927146911621, -1.541142463684082, -1.340357780456543, -1.1395732164382935, -0.9387885332107544, -0.7380038499832153, -0.5372190475463867, -0.33643436431884766, -0.13564971089363098, 0.0651349425315857, 0.26591962575912476, 0.46670424938201904, 0.6674889326095581, 0.8682736158370972, 1.0690582990646362, 1.2698429822921753, 1.4706276655197144, 1.6714122295379639, 1.872196912765503, 2.072981595993042, 2.273766279220581, 2.47455096244812, 2.675335645675659, 2.8761203289031982, 3.0769050121307373, 3.2776896953582764, 3.4784743785858154, 3.6792588233947754, 3.8800435066223145, 4.0808281898498535, 4.281612873077393, 4.482397556304932, 4.683182239532471, 4.88396692276001, 5.084751605987549, 5.285536289215088, 5.486320972442627, 5.687105655670166, 5.887890338897705]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 10.0, 12.0, 15.0, 19.0, 29.0, 32.0, 34.0, 55.0, 75.0, 96.0, 155.0, 212.0, 339.0, 416.0, 669.0, 920.0, 1348.0, 1923.0, 3034.0, 4794.0, 8023.0, 13997.0, 27450.0, 62939.0, 165008.0, 451803.0, 990353.0, 1222439.0, 742163.0, 292305.0, 106685.0, 43991.0, 21117.0, 11993.0, 7207.0, 4341.0, 2804.0, 1767.0, 1170.0, 811.0, 567.0, 348.0, 237.0, 173.0, 129.0, 95.0, 62.0, 30.0, 31.0, 17.0, 24.0, 12.0, 7.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-9.40625, -9.1055908203125, -8.804931640625, -8.5042724609375, -8.20361328125, -7.9029541015625, -7.602294921875, -7.3016357421875, -7.0009765625, -6.7003173828125, -6.399658203125, -6.0989990234375, -5.79833984375, -5.4976806640625, -5.197021484375, -4.8963623046875, -4.595703125, -4.2950439453125, -3.994384765625, -3.6937255859375, -3.39306640625, -3.0924072265625, -2.791748046875, -2.4910888671875, -2.1904296875, -1.8897705078125, -1.589111328125, -1.2884521484375, -0.98779296875, -0.6871337890625, -0.386474609375, -0.0858154296875, 0.21484375, 0.5155029296875, 0.816162109375, 1.1168212890625, 1.41748046875, 1.7181396484375, 2.018798828125, 2.3194580078125, 2.6201171875, 2.9207763671875, 3.221435546875, 3.5220947265625, 3.82275390625, 4.1234130859375, 4.424072265625, 4.7247314453125, 5.025390625, 5.3260498046875, 5.626708984375, 5.9273681640625, 6.22802734375, 6.5286865234375, 6.829345703125, 7.1300048828125, 7.4306640625, 7.7313232421875, 8.031982421875, 8.3326416015625, 8.63330078125, 8.9339599609375, 9.234619140625, 9.5352783203125, 9.8359375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 5.0, 0.0, 6.0, 6.0, 8.0, 13.0, 13.0, 12.0, 11.0, 20.0, 31.0, 24.0, 32.0, 35.0, 34.0, 37.0, 30.0, 38.0, 34.0, 47.0, 46.0, 45.0, 42.0, 42.0, 36.0, 45.0, 27.0, 30.0, 38.0, 28.0, 31.0, 24.0, 17.0, 16.0, 21.0, 16.0, 9.0, 11.0, 8.0, 11.0, 4.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.4229736328125, -6.228759765625, -6.0345458984375, -5.84033203125, -5.6461181640625, -5.451904296875, -5.2576904296875, -5.0634765625, -4.8692626953125, -4.675048828125, -4.4808349609375, -4.28662109375, -4.0924072265625, -3.898193359375, -3.7039794921875, -3.509765625, -3.3155517578125, -3.121337890625, -2.9271240234375, -2.73291015625, -2.5386962890625, -2.344482421875, -2.1502685546875, -1.9560546875, -1.7618408203125, -1.567626953125, -1.3734130859375, -1.17919921875, -0.9849853515625, -0.790771484375, -0.5965576171875, -0.40234375, -0.2081298828125, -0.013916015625, 0.1802978515625, 0.37451171875, 0.5687255859375, 0.762939453125, 0.9571533203125, 1.1513671875, 1.3455810546875, 1.539794921875, 1.7340087890625, 1.92822265625, 2.1224365234375, 2.316650390625, 2.5108642578125, 2.705078125, 2.8992919921875, 3.093505859375, 3.2877197265625, 3.48193359375, 3.6761474609375, 3.870361328125, 4.0645751953125, 4.2587890625, 4.4530029296875, 4.647216796875, 4.8414306640625, 5.03564453125, 5.2298583984375, 5.424072265625, 5.6182861328125, 5.8125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 14.0, 12.0, 15.0, 17.0, 22.0, 40.0, 46.0, 70.0, 109.0, 164.0, 231.0, 279.0, 403.0, 589.0, 831.0, 1245.0, 1780.0, 2640.0, 3962.0, 6100.0, 9425.0, 15588.0, 27111.0, 49923.0, 100740.0, 220542.0, 484764.0, 886319.0, 1033330.0, 695347.0, 336815.0, 151359.0, 71692.0, 37113.0, 20661.0, 12230.0, 7685.0, 4973.0, 3201.0, 2072.0, 1498.0, 1026.0, 726.0, 463.0, 324.0, 245.0, 148.0, 127.0, 78.0, 70.0, 44.0, 21.0, 20.0, 15.0, 16.0, 9.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.453125, -9.1507568359375, -8.848388671875, -8.5460205078125, -8.24365234375, -7.9412841796875, -7.638916015625, -7.3365478515625, -7.0341796875, -6.7318115234375, -6.429443359375, -6.1270751953125, -5.82470703125, -5.5223388671875, -5.219970703125, -4.9176025390625, -4.615234375, -4.3128662109375, -4.010498046875, -3.7081298828125, -3.40576171875, -3.1033935546875, -2.801025390625, -2.4986572265625, -2.1962890625, -1.8939208984375, -1.591552734375, -1.2891845703125, -0.98681640625, -0.6844482421875, -0.382080078125, -0.0797119140625, 0.22265625, 0.5250244140625, 0.827392578125, 1.1297607421875, 1.43212890625, 1.7344970703125, 2.036865234375, 2.3392333984375, 2.6416015625, 2.9439697265625, 3.246337890625, 3.5487060546875, 3.85107421875, 4.1534423828125, 4.455810546875, 4.7581787109375, 5.060546875, 5.3629150390625, 5.665283203125, 5.9676513671875, 6.27001953125, 6.5723876953125, 6.874755859375, 7.1771240234375, 7.4794921875, 7.7818603515625, 8.084228515625, 8.3865966796875, 8.68896484375, 8.9913330078125, 9.293701171875, 9.5960693359375, 9.8984375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 7.0, 8.0, 11.0, 12.0, 24.0, 21.0, 33.0, 36.0, 47.0, 50.0, 69.0, 98.0, 113.0, 161.0, 208.0, 207.0, 248.0, 244.0, 278.0, 270.0, 243.0, 279.0, 252.0, 200.0, 199.0, 150.0, 124.0, 105.0, 79.0, 68.0, 43.0, 43.0, 37.0, 22.0, 14.0, 15.0, 14.0, 12.0, 7.0, 7.0, 8.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.87890625, -2.77825927734375, -2.6776123046875, -2.57696533203125, -2.476318359375, -2.37567138671875, -2.2750244140625, -2.17437744140625, -2.07373046875, -1.97308349609375, -1.8724365234375, -1.77178955078125, -1.671142578125, -1.57049560546875, -1.4698486328125, -1.36920166015625, -1.2685546875, -1.16790771484375, -1.0672607421875, -0.96661376953125, -0.865966796875, -0.76531982421875, -0.6646728515625, -0.56402587890625, -0.46337890625, -0.36273193359375, -0.2620849609375, -0.16143798828125, -0.060791015625, 0.03985595703125, 0.1405029296875, 0.24114990234375, 0.341796875, 0.44244384765625, 0.5430908203125, 0.64373779296875, 0.744384765625, 0.84503173828125, 0.9456787109375, 1.04632568359375, 1.14697265625, 1.24761962890625, 1.3482666015625, 1.44891357421875, 1.549560546875, 1.65020751953125, 1.7508544921875, 1.85150146484375, 1.9521484375, 2.05279541015625, 2.1534423828125, 2.25408935546875, 2.354736328125, 2.45538330078125, 2.5560302734375, 2.65667724609375, 2.75732421875, 2.85797119140625, 2.9586181640625, 3.05926513671875, 3.159912109375, 3.26055908203125, 3.3612060546875, 3.46185302734375, 3.5625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 10.0, 11.0, 21.0, 21.0, 24.0, 28.0, 39.0, 41.0, 45.0, 56.0, 66.0, 62.0, 59.0, 63.0, 56.0, 58.0, 61.0, 48.0, 26.0, 31.0, 37.0, 22.0, 21.0, 13.0, 12.0, 14.0, 11.0, 6.0, 5.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.120320320129395, -10.825846672058105, -10.531373023986816, -10.236900329589844, -9.942426681518555, -9.647953033447266, -9.353479385375977, -9.059005737304688, -8.764532089233398, -8.47005844116211, -8.17558479309082, -7.8811116218566895, -7.586638450622559, -7.2921648025512695, -6.9976911544799805, -6.703217506408691, -6.408744812011719, -6.11427116394043, -5.819797992706299, -5.52532434463501, -5.230851173400879, -4.93637752532959, -4.641903877258301, -4.347430229187012, -4.052957057952881, -3.758483648300171, -3.464010238647461, -3.169536590576172, -2.875063180923462, -2.580589771270752, -2.286116123199463, -1.991642713546753, -1.6971683502197266, -1.4026949405670166, -1.108221411705017, -0.8137479424476624, -0.5192744731903076, -0.22480106353759766, 0.06967246532440186, 0.36414599418640137, 0.6586194038391113, 0.9530928730964661, 1.2475663423538208, 1.5420398712158203, 1.8365132808685303, 2.1309866905212402, 2.4254603385925293, 2.7199337482452393, 3.014407157897949, 3.308880567550659, 3.603353977203369, 3.897827625274658, 4.192300796508789, 4.486774444580078, 4.781248092651367, 5.075721740722656, 5.370194911956787, 5.664668560028076, 5.959141731262207, 6.253615379333496, 6.548089027404785, 6.842562198638916, 7.137035846710205, 7.431509017944336, 7.725982666015625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 4.0, 5.0, 6.0, 7.0, 9.0, 9.0, 19.0, 17.0, 18.0, 22.0, 21.0, 23.0, 32.0, 34.0, 48.0, 35.0, 51.0, 51.0, 36.0, 43.0, 33.0, 46.0, 43.0, 51.0, 41.0, 41.0, 38.0, 30.0, 22.0, 29.0, 28.0, 15.0, 13.0, 19.0, 10.0, 9.0, 9.0, 8.0, 6.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.298409461975098, -8.056815147399902, -7.815220355987549, -7.573625564575195, -7.33203125, -7.0904364585876465, -6.848841667175293, -6.607247352600098, -6.365652561187744, -6.124057769775391, -5.882463455200195, -5.640868663787842, -5.399273872375488, -5.157679557800293, -4.9160847663879395, -4.674489974975586, -4.432895660400391, -4.191300868988037, -3.949706554412842, -3.7081117630004883, -3.466517210006714, -3.2249226570129395, -2.983327865600586, -2.7417333126068115, -2.500138759613037, -2.2585442066192627, -2.0169496536254883, -1.7753548622131348, -1.5337603092193604, -1.292165756225586, -1.050571084022522, -0.808976411819458, -0.5673823356628418, -0.3257877230644226, -0.08419311046600342, 0.15740150213241577, 0.39899611473083496, 0.6405906677246094, 0.8821853399276733, 1.1237800121307373, 1.3653745651245117, 1.6069691181182861, 1.84856379032135, 2.090158462524414, 2.3317530155181885, 2.573347568511963, 2.8149423599243164, 3.056536912918091, 3.2981314659118652, 3.5397260189056396, 3.781320571899414, 4.022915363311768, 4.264510154724121, 4.506104469299316, 4.74769926071167, 4.989294052124023, 5.230888366699219, 5.472483158111572, 5.714077472686768, 5.955672264099121, 6.197266578674316, 6.43886137008667, 6.680456161499023, 6.922050476074219, 7.163645267486572]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 15.0, 19.0, 18.0, 35.0, 38.0, 60.0, 105.0, 131.0, 219.0, 322.0, 514.0, 868.0, 1379.0, 2214.0, 3886.0, 6692.0, 11340.0, 19888.0, 35769.0, 64919.0, 117329.0, 189870.0, 219115.0, 161492.0, 93708.0, 51624.0, 28584.0, 15742.0, 9203.0, 5379.0, 3110.0, 1827.0, 1135.0, 730.0, 424.0, 293.0, 177.0, 125.0, 65.0, 46.0, 58.0, 28.0, 16.0, 17.0, 5.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.109375, -1.0727691650390625, -1.036163330078125, -0.9995574951171875, -0.96295166015625, -0.9263458251953125, -0.889739990234375, -0.8531341552734375, -0.8165283203125, -0.7799224853515625, -0.743316650390625, -0.7067108154296875, -0.67010498046875, -0.6334991455078125, -0.596893310546875, -0.5602874755859375, -0.523681640625, -0.4870758056640625, -0.450469970703125, -0.4138641357421875, -0.37725830078125, -0.3406524658203125, -0.304046630859375, -0.2674407958984375, -0.2308349609375, -0.1942291259765625, -0.157623291015625, -0.1210174560546875, -0.08441162109375, -0.0478057861328125, -0.011199951171875, 0.0254058837890625, 0.06201171875, 0.0986175537109375, 0.135223388671875, 0.1718292236328125, 0.20843505859375, 0.2450408935546875, 0.281646728515625, 0.3182525634765625, 0.3548583984375, 0.3914642333984375, 0.428070068359375, 0.4646759033203125, 0.50128173828125, 0.5378875732421875, 0.574493408203125, 0.6110992431640625, 0.647705078125, 0.6843109130859375, 0.720916748046875, 0.7575225830078125, 0.79412841796875, 0.8307342529296875, 0.867340087890625, 0.9039459228515625, 0.9405517578125, 0.9771575927734375, 1.013763427734375, 1.0503692626953125, 1.08697509765625, 1.1235809326171875, 1.160186767578125, 1.1967926025390625, 1.2333984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 2.0, 6.0, 8.0, 9.0, 11.0, 6.0, 17.0, 17.0, 23.0, 17.0, 18.0, 36.0, 28.0, 41.0, 42.0, 51.0, 55.0, 33.0, 44.0, 41.0, 49.0, 44.0, 42.0, 34.0, 52.0, 33.0, 43.0, 29.0, 31.0, 23.0, 17.0, 19.0, 11.0, 14.0, 10.0, 14.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.3984375, -9.13726806640625, -8.8760986328125, -8.61492919921875, -8.353759765625, -8.09259033203125, -7.8314208984375, -7.57025146484375, -7.30908203125, -7.04791259765625, -6.7867431640625, -6.52557373046875, -6.264404296875, -6.00323486328125, -5.7420654296875, -5.48089599609375, -5.2197265625, -4.95855712890625, -4.6973876953125, -4.43621826171875, -4.175048828125, -3.91387939453125, -3.6527099609375, -3.39154052734375, -3.13037109375, -2.86920166015625, -2.6080322265625, -2.34686279296875, -2.085693359375, -1.82452392578125, -1.5633544921875, -1.30218505859375, -1.041015625, -0.77984619140625, -0.5186767578125, -0.25750732421875, 0.003662109375, 0.26483154296875, 0.5260009765625, 0.78717041015625, 1.04833984375, 1.30950927734375, 1.5706787109375, 1.83184814453125, 2.093017578125, 2.35418701171875, 2.6153564453125, 2.87652587890625, 3.1376953125, 3.39886474609375, 3.6600341796875, 3.92120361328125, 4.182373046875, 4.44354248046875, 4.7047119140625, 4.96588134765625, 5.22705078125, 5.48822021484375, 5.7493896484375, 6.01055908203125, 6.271728515625, 6.53289794921875, 6.7940673828125, 7.05523681640625, 7.31640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 6.0, 10.0, 16.0, 11.0, 22.0, 29.0, 55.0, 58.0, 107.0, 191.0, 305.0, 496.0, 701.0, 1244.0, 2195.0, 3766.0, 6989.0, 13289.0, 29698.0, 205186.0, 696975.0, 49126.0, 17699.0, 8896.0, 4804.0, 2696.0, 1546.0, 919.0, 574.0, 312.0, 198.0, 157.0, 85.0, 63.0, 45.0, 28.0, 19.0, 9.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587890625, -2.496124267578125, -2.40435791015625, -2.312591552734375, -2.2208251953125, -2.129058837890625, -2.03729248046875, -1.945526123046875, -1.853759765625, -1.761993408203125, -1.67022705078125, -1.578460693359375, -1.4866943359375, -1.394927978515625, -1.30316162109375, -1.211395263671875, -1.11962890625, -1.027862548828125, -0.93609619140625, -0.844329833984375, -0.7525634765625, -0.660797119140625, -0.56903076171875, -0.477264404296875, -0.385498046875, -0.293731689453125, -0.20196533203125, -0.110198974609375, -0.0184326171875, 0.073333740234375, 0.16510009765625, 0.256866455078125, 0.3486328125, 0.440399169921875, 0.53216552734375, 0.623931884765625, 0.7156982421875, 0.807464599609375, 0.89923095703125, 0.990997314453125, 1.082763671875, 1.174530029296875, 1.26629638671875, 1.358062744140625, 1.4498291015625, 1.541595458984375, 1.63336181640625, 1.725128173828125, 1.81689453125, 1.908660888671875, 2.00042724609375, 2.092193603515625, 2.1839599609375, 2.275726318359375, 2.36749267578125, 2.459259033203125, 2.551025390625, 2.642791748046875, 2.73455810546875, 2.826324462890625, 2.9180908203125, 3.009857177734375, 3.10162353515625, 3.193389892578125, 3.28515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 8.0, 4.0, 5.0, 10.0, 8.0, 14.0, 20.0, 16.0, 15.0, 17.0, 19.0, 23.0, 25.0, 27.0, 27.0, 29.0, 33.0, 33.0, 41.0, 44.0, 51.0, 39.0, 36.0, 37.0, 39.0, 29.0, 43.0, 35.0, 30.0, 21.0, 35.0, 26.0, 29.0, 13.0, 16.0, 15.0, 15.0, 15.0, 13.0, 5.0, 5.0, 5.0, 11.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-5.44140625, -5.275390625, -5.109375, -4.943359375, -4.77734375, -4.611328125, -4.4453125, -4.279296875, -4.11328125, -3.947265625, -3.78125, -3.615234375, -3.44921875, -3.283203125, -3.1171875, -2.951171875, -2.78515625, -2.619140625, -2.453125, -2.287109375, -2.12109375, -1.955078125, -1.7890625, -1.623046875, -1.45703125, -1.291015625, -1.125, -0.958984375, -0.79296875, -0.626953125, -0.4609375, -0.294921875, -0.12890625, 0.037109375, 0.203125, 0.369140625, 0.53515625, 0.701171875, 0.8671875, 1.033203125, 1.19921875, 1.365234375, 1.53125, 1.697265625, 1.86328125, 2.029296875, 2.1953125, 2.361328125, 2.52734375, 2.693359375, 2.859375, 3.025390625, 3.19140625, 3.357421875, 3.5234375, 3.689453125, 3.85546875, 4.021484375, 4.1875, 4.353515625, 4.51953125, 4.685546875, 4.8515625, 5.017578125, 5.18359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 8.0, 7.0, 11.0, 9.0, 15.0, 34.0, 56.0, 83.0, 118.0, 248.0, 379.0, 658.0, 1068.0, 2168.0, 3872.0, 7700.0, 15607.0, 36282.0, 721603.0, 204569.0, 27543.0, 12577.0, 6298.0, 3383.0, 1824.0, 973.0, 612.0, 333.0, 200.0, 120.0, 71.0, 50.0, 18.0, 13.0, 7.0, 9.0, 5.0, 8.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.54638671875, -0.52923583984375, -0.5120849609375, -0.49493408203125, -0.477783203125, -0.46063232421875, -0.4434814453125, -0.42633056640625, -0.4091796875, -0.39202880859375, -0.3748779296875, -0.35772705078125, -0.340576171875, -0.32342529296875, -0.3062744140625, -0.28912353515625, -0.27197265625, -0.25482177734375, -0.2376708984375, -0.22052001953125, -0.203369140625, -0.18621826171875, -0.1690673828125, -0.15191650390625, -0.134765625, -0.11761474609375, -0.1004638671875, -0.08331298828125, -0.066162109375, -0.04901123046875, -0.0318603515625, -0.01470947265625, 0.00244140625, 0.01959228515625, 0.0367431640625, 0.05389404296875, 0.071044921875, 0.08819580078125, 0.1053466796875, 0.12249755859375, 0.1396484375, 0.15679931640625, 0.1739501953125, 0.19110107421875, 0.208251953125, 0.22540283203125, 0.2425537109375, 0.25970458984375, 0.27685546875, 0.29400634765625, 0.3111572265625, 0.32830810546875, 0.345458984375, 0.36260986328125, 0.3797607421875, 0.39691162109375, 0.4140625, 0.43121337890625, 0.4483642578125, 0.46551513671875, 0.482666015625, 0.49981689453125, 0.5169677734375, 0.53411865234375, 0.55126953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 7.0, 7.0, 5.0, 12.0, 3.0, 14.0, 24.0, 16.0, 20.0, 16.0, 34.0, 43.0, 43.0, 40.0, 61.0, 76.0, 53.0, 79.0, 53.0, 69.0, 53.0, 50.0, 42.0, 32.0, 26.0, 28.0, 13.0, 16.0, 12.0, 7.0, 11.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4603137969970703e-05, -1.4078803360462189e-05, -1.3554468750953674e-05, -1.303013414144516e-05, -1.2505799531936646e-05, -1.1981464922428131e-05, -1.1457130312919617e-05, -1.0932795703411102e-05, -1.0408461093902588e-05, -9.884126484394073e-06, -9.359791874885559e-06, -8.835457265377045e-06, -8.31112265586853e-06, -7.786788046360016e-06, -7.2624534368515015e-06, -6.738118827342987e-06, -6.213784217834473e-06, -5.689449608325958e-06, -5.165114998817444e-06, -4.6407803893089294e-06, -4.116445779800415e-06, -3.5921111702919006e-06, -3.0677765607833862e-06, -2.543441951274872e-06, -2.0191073417663574e-06, -1.494772732257843e-06, -9.704381227493286e-07, -4.461035132408142e-07, 7.82310962677002e-08, 6.025657057762146e-07, 1.126900315284729e-06, 1.6512349247932434e-06, 2.175569534301758e-06, 2.6999041438102722e-06, 3.2242387533187866e-06, 3.748573362827301e-06, 4.2729079723358154e-06, 4.79724258184433e-06, 5.321577191352844e-06, 5.845911800861359e-06, 6.370246410369873e-06, 6.8945810198783875e-06, 7.418915629386902e-06, 7.943250238895416e-06, 8.46758484840393e-06, 8.991919457912445e-06, 9.51625406742096e-06, 1.0040588676929474e-05, 1.0564923286437988e-05, 1.1089257895946503e-05, 1.1613592505455017e-05, 1.2137927114963531e-05, 1.2662261724472046e-05, 1.318659633398056e-05, 1.3710930943489075e-05, 1.4235265552997589e-05, 1.4759600162506104e-05, 1.5283934772014618e-05, 1.5808269381523132e-05, 1.6332603991031647e-05, 1.685693860054016e-05, 1.7381273210048676e-05, 1.790560781955719e-05, 1.8429942429065704e-05, 1.895427703857422e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 0.0, 3.0, 8.0, 6.0, 9.0, 10.0, 18.0, 25.0, 38.0, 51.0, 66.0, 94.0, 116.0, 177.0, 234.0, 336.0, 477.0, 731.0, 998.0, 1550.0, 2239.0, 3528.0, 5450.0, 8820.0, 14547.0, 25170.0, 44959.0, 83135.0, 148531.0, 225331.0, 202886.0, 121384.0, 66583.0, 36726.0, 20693.0, 12249.0, 7506.0, 4708.0, 2919.0, 1976.0, 1258.0, 909.0, 647.0, 453.0, 299.0, 196.0, 146.0, 97.0, 75.0, 66.0, 45.0, 22.0, 22.0, 11.0, 9.0, 6.0, 6.0, 7.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.395263671875, -0.382843017578125, -0.37042236328125, -0.358001708984375, -0.3455810546875, -0.333160400390625, -0.32073974609375, -0.308319091796875, -0.2958984375, -0.283477783203125, -0.27105712890625, -0.258636474609375, -0.2462158203125, -0.233795166015625, -0.22137451171875, -0.208953857421875, -0.196533203125, -0.184112548828125, -0.17169189453125, -0.159271240234375, -0.1468505859375, -0.134429931640625, -0.12200927734375, -0.109588623046875, -0.09716796875, -0.084747314453125, -0.07232666015625, -0.059906005859375, -0.0474853515625, -0.035064697265625, -0.02264404296875, -0.010223388671875, 0.002197265625, 0.014617919921875, 0.02703857421875, 0.039459228515625, 0.0518798828125, 0.064300537109375, 0.07672119140625, 0.089141845703125, 0.1015625, 0.113983154296875, 0.12640380859375, 0.138824462890625, 0.1512451171875, 0.163665771484375, 0.17608642578125, 0.188507080078125, 0.200927734375, 0.213348388671875, 0.22576904296875, 0.238189697265625, 0.2506103515625, 0.263031005859375, 0.27545166015625, 0.287872314453125, 0.30029296875, 0.312713623046875, 0.32513427734375, 0.337554931640625, 0.3499755859375, 0.362396240234375, 0.37481689453125, 0.387237548828125, 0.399658203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 5.0, 5.0, 6.0, 7.0, 14.0, 11.0, 11.0, 12.0, 20.0, 22.0, 26.0, 19.0, 30.0, 52.0, 43.0, 38.0, 40.0, 49.0, 40.0, 37.0, 46.0, 51.0, 44.0, 53.0, 47.0, 32.0, 35.0, 33.0, 30.0, 30.0, 20.0, 11.0, 11.0, 8.0, 13.0, 8.0, 7.0, 8.0, 3.0, 7.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13916015625, -0.1347332000732422, -0.13030624389648438, -0.12587928771972656, -0.12145233154296875, -0.11702537536621094, -0.11259841918945312, -0.10817146301269531, -0.1037445068359375, -0.09931755065917969, -0.09489059448242188, -0.09046363830566406, -0.08603668212890625, -0.08160972595214844, -0.07718276977539062, -0.07275581359863281, -0.068328857421875, -0.06390190124511719, -0.059474945068359375, -0.05504798889160156, -0.05062103271484375, -0.04619407653808594, -0.041767120361328125, -0.03734016418457031, -0.0329132080078125, -0.028486251831054688, -0.024059295654296875, -0.019632339477539062, -0.01520538330078125, -0.010778427124023438, -0.006351470947265625, -0.0019245147705078125, 0.00250244140625, 0.0069293975830078125, 0.011356353759765625, 0.015783309936523438, 0.02021026611328125, 0.024637222290039062, 0.029064178466796875, 0.03349113464355469, 0.0379180908203125, 0.04234504699707031, 0.046772003173828125, 0.05119895935058594, 0.05562591552734375, 0.06005287170410156, 0.06447982788085938, 0.06890678405761719, 0.073333740234375, 0.07776069641113281, 0.08218765258789062, 0.08661460876464844, 0.09104156494140625, 0.09546852111816406, 0.09989547729492188, 0.10432243347167969, 0.1087493896484375, 0.11317634582519531, 0.11760330200195312, 0.12203025817871094, 0.12645721435546875, 0.13088417053222656, 0.13531112670898438, 0.1397380828857422, 0.1441650390625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 7.0, 3.0, 7.0, 9.0, 11.0, 19.0, 23.0, 22.0, 27.0, 36.0, 34.0, 48.0, 57.0, 63.0, 60.0, 58.0, 65.0, 61.0, 65.0, 51.0, 53.0, 30.0, 30.0, 28.0, 34.0, 25.0, 11.0, 14.0, 9.0, 12.0, 12.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.944527626037598, -10.64915657043457, -10.353785514831543, -10.058414459228516, -9.763044357299805, -9.467673301696777, -9.17230224609375, -8.876931190490723, -8.581560134887695, -8.286189079284668, -7.990818500518799, -7.6954474449157715, -7.400076389312744, -7.104705810546875, -6.809334754943848, -6.51396369934082, -6.218593120574951, -5.923222064971924, -5.627851486206055, -5.332480430603027, -5.037109375, -4.741738319396973, -4.4463677406311035, -4.150996685028076, -3.855625867843628, -3.5602550506591797, -3.2648839950561523, -2.969513177871704, -2.674142360687256, -2.3787713050842285, -2.0834004878997803, -1.788029432296753, -1.4926586151123047, -1.197287678718567, -0.9019168019294739, -0.6065459251403809, -0.31117498874664307, -0.015804052352905273, 0.27956676483154297, 0.5749378204345703, 0.8703086376190186, 1.1656795740127563, 1.4610505104064941, 1.7564213275909424, 2.0517921447753906, 2.347163200378418, 2.642534017562866, 2.9379050731658936, 3.233275890350342, 3.52864670753479, 3.8240177631378174, 4.119388580322266, 4.414759635925293, 4.71013069152832, 5.0055012702941895, 5.300872325897217, 5.596242904663086, 5.891613960266113, 6.186984539031982, 6.48235559463501, 6.777726650238037, 7.073097229003906, 7.368468284606934, 7.663839340209961, 7.959210395812988]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 7.0, 6.0, 6.0, 11.0, 17.0, 12.0, 22.0, 21.0, 22.0, 17.0, 28.0, 43.0, 35.0, 46.0, 44.0, 44.0, 50.0, 35.0, 40.0, 35.0, 53.0, 44.0, 47.0, 30.0, 39.0, 44.0, 21.0, 23.0, 32.0, 20.0, 16.0, 12.0, 16.0, 8.0, 9.0, 11.0, 4.0, 7.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.275310516357422, -8.036246299743652, -7.797182083129883, -7.558117866516113, -7.3190531730651855, -7.079988956451416, -6.8409247398376465, -6.601860523223877, -6.362795829772949, -6.12373161315918, -5.88466739654541, -5.645603179931641, -5.406538486480713, -5.167474269866943, -4.928410053253174, -4.689345836639404, -4.450281620025635, -4.211217403411865, -3.9721529483795166, -3.733088731765747, -3.4940242767333984, -3.254960060119629, -3.0158958435058594, -2.77683162689209, -2.537767171859741, -2.2987029552459717, -2.059638500213623, -1.8205742835998535, -1.5815099477767944, -1.3424456119537354, -1.1033813953399658, -0.8643170595169067, -0.6252522468566895, -0.38618794083595276, -0.14712363481521606, 0.09194064140319824, 0.3310049772262573, 0.5700693130493164, 0.8091335296630859, 1.048197865486145, 1.287262201309204, 1.5263265371322632, 1.7653908729553223, 2.004455089569092, 2.2435193061828613, 2.48258376121521, 2.7216479778289795, 2.960712432861328, 3.1997766494750977, 3.438840866088867, 3.677905321121216, 3.9169695377349854, 4.156033992767334, 4.3950982093811035, 4.634162425994873, 4.873226642608643, 5.11229133605957, 5.35135555267334, 5.590419769287109, 5.829483985900879, 6.068548679351807, 6.307612895965576, 6.546677112579346, 6.785741329193115, 7.024805545806885]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 11.0, 8.0, 12.0, 30.0, 45.0, 62.0, 91.0, 147.0, 171.0, 251.0, 379.0, 576.0, 881.0, 1365.0, 2114.0, 3061.0, 5026.0, 7707.0, 12098.0, 18561.0, 29072.0, 44768.0, 65510.0, 92048.0, 116632.0, 132980.0, 130819.0, 113510.0, 88154.0, 62960.0, 42281.0, 27621.0, 17702.0, 11178.0, 7295.0, 4636.0, 2945.0, 1965.0, 1276.0, 863.0, 551.0, 372.0, 275.0, 198.0, 115.0, 85.0, 58.0, 30.0, 22.0, 19.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0], "bins": [-4.02734375, -3.905059814453125, -3.78277587890625, -3.660491943359375, -3.5382080078125, -3.415924072265625, -3.29364013671875, -3.171356201171875, -3.049072265625, -2.926788330078125, -2.80450439453125, -2.682220458984375, -2.5599365234375, -2.437652587890625, -2.31536865234375, -2.193084716796875, -2.07080078125, -1.948516845703125, -1.82623291015625, -1.703948974609375, -1.5816650390625, -1.459381103515625, -1.33709716796875, -1.214813232421875, -1.092529296875, -0.970245361328125, -0.84796142578125, -0.725677490234375, -0.6033935546875, -0.481109619140625, -0.35882568359375, -0.236541748046875, -0.1142578125, 0.008026123046875, 0.13031005859375, 0.252593994140625, 0.3748779296875, 0.497161865234375, 0.61944580078125, 0.741729736328125, 0.864013671875, 0.986297607421875, 1.10858154296875, 1.230865478515625, 1.3531494140625, 1.475433349609375, 1.59771728515625, 1.720001220703125, 1.84228515625, 1.964569091796875, 2.08685302734375, 2.209136962890625, 2.3314208984375, 2.453704833984375, 2.57598876953125, 2.698272705078125, 2.820556640625, 2.942840576171875, 3.06512451171875, 3.187408447265625, 3.3096923828125, 3.431976318359375, 3.55426025390625, 3.676544189453125, 3.798828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 9.0, 3.0, 7.0, 10.0, 10.0, 19.0, 11.0, 15.0, 24.0, 24.0, 25.0, 28.0, 28.0, 45.0, 30.0, 34.0, 42.0, 34.0, 36.0, 33.0, 37.0, 40.0, 35.0, 34.0, 46.0, 40.0, 31.0, 31.0, 21.0, 25.0, 15.0, 35.0, 21.0, 14.0, 10.0, 10.0, 13.0, 17.0, 7.0, 7.0, 5.0, 5.0, 5.0, 4.0, 7.0, 6.0, 2.0, 0.0, 1.0, 3.0, 2.0], "bins": [-7.19140625, -6.97711181640625, -6.7628173828125, -6.54852294921875, -6.334228515625, -6.11993408203125, -5.9056396484375, -5.69134521484375, -5.47705078125, -5.26275634765625, -5.0484619140625, -4.83416748046875, -4.619873046875, -4.40557861328125, -4.1912841796875, -3.97698974609375, -3.7626953125, -3.54840087890625, -3.3341064453125, -3.11981201171875, -2.905517578125, -2.69122314453125, -2.4769287109375, -2.26263427734375, -2.04833984375, -1.83404541015625, -1.6197509765625, -1.40545654296875, -1.191162109375, -0.97686767578125, -0.7625732421875, -0.54827880859375, -0.333984375, -0.11968994140625, 0.0946044921875, 0.30889892578125, 0.523193359375, 0.73748779296875, 0.9517822265625, 1.16607666015625, 1.38037109375, 1.59466552734375, 1.8089599609375, 2.02325439453125, 2.237548828125, 2.45184326171875, 2.6661376953125, 2.88043212890625, 3.0947265625, 3.30902099609375, 3.5233154296875, 3.73760986328125, 3.951904296875, 4.16619873046875, 4.3804931640625, 4.59478759765625, 4.80908203125, 5.02337646484375, 5.2376708984375, 5.45196533203125, 5.666259765625, 5.88055419921875, 6.0948486328125, 6.30914306640625, 6.5234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 9.0, 10.0, 12.0, 14.0, 15.0, 37.0, 43.0, 62.0, 81.0, 137.0, 194.0, 292.0, 487.0, 669.0, 1022.0, 1536.0, 2477.0, 3726.0, 6342.0, 9769.0, 15552.0, 25304.0, 39750.0, 60954.0, 89444.0, 119477.0, 140894.0, 141053.0, 121658.0, 92068.0, 63536.0, 41649.0, 25987.0, 16428.0, 10064.0, 6311.0, 4031.0, 2541.0, 1581.0, 1113.0, 742.0, 495.0, 309.0, 214.0, 154.0, 93.0, 77.0, 47.0, 33.0, 22.0, 10.0, 16.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.23046875, -4.08966064453125, -3.9488525390625, -3.80804443359375, -3.667236328125, -3.52642822265625, -3.3856201171875, -3.24481201171875, -3.10400390625, -2.96319580078125, -2.8223876953125, -2.68157958984375, -2.540771484375, -2.39996337890625, -2.2591552734375, -2.11834716796875, -1.9775390625, -1.83673095703125, -1.6959228515625, -1.55511474609375, -1.414306640625, -1.27349853515625, -1.1326904296875, -0.99188232421875, -0.85107421875, -0.71026611328125, -0.5694580078125, -0.42864990234375, -0.287841796875, -0.14703369140625, -0.0062255859375, 0.13458251953125, 0.275390625, 0.41619873046875, 0.5570068359375, 0.69781494140625, 0.838623046875, 0.97943115234375, 1.1202392578125, 1.26104736328125, 1.40185546875, 1.54266357421875, 1.6834716796875, 1.82427978515625, 1.965087890625, 2.10589599609375, 2.2467041015625, 2.38751220703125, 2.5283203125, 2.66912841796875, 2.8099365234375, 2.95074462890625, 3.091552734375, 3.23236083984375, 3.3731689453125, 3.51397705078125, 3.65478515625, 3.79559326171875, 3.9364013671875, 4.07720947265625, 4.218017578125, 4.35882568359375, 4.4996337890625, 4.64044189453125, 4.78125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 4.0, 5.0, 5.0, 7.0, 12.0, 10.0, 18.0, 20.0, 17.0, 22.0, 28.0, 36.0, 30.0, 38.0, 44.0, 45.0, 48.0, 27.0, 39.0, 51.0, 39.0, 35.0, 38.0, 40.0, 41.0, 33.0, 43.0, 29.0, 31.0, 24.0, 25.0, 24.0, 17.0, 20.0, 7.0, 10.0, 8.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.817138671875, -4.66162109375, -4.506103515625, -4.3505859375, -4.195068359375, -4.03955078125, -3.884033203125, -3.728515625, -3.572998046875, -3.41748046875, -3.261962890625, -3.1064453125, -2.950927734375, -2.79541015625, -2.639892578125, -2.484375, -2.328857421875, -2.17333984375, -2.017822265625, -1.8623046875, -1.706787109375, -1.55126953125, -1.395751953125, -1.240234375, -1.084716796875, -0.92919921875, -0.773681640625, -0.6181640625, -0.462646484375, -0.30712890625, -0.151611328125, 0.00390625, 0.159423828125, 0.31494140625, 0.470458984375, 0.6259765625, 0.781494140625, 0.93701171875, 1.092529296875, 1.248046875, 1.403564453125, 1.55908203125, 1.714599609375, 1.8701171875, 2.025634765625, 2.18115234375, 2.336669921875, 2.4921875, 2.647705078125, 2.80322265625, 2.958740234375, 3.1142578125, 3.269775390625, 3.42529296875, 3.580810546875, 3.736328125, 3.891845703125, 4.04736328125, 4.202880859375, 4.3583984375, 4.513916015625, 4.66943359375, 4.824951171875, 4.98046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 7.0, 11.0, 28.0, 36.0, 47.0, 69.0, 131.0, 225.0, 378.0, 677.0, 1137.0, 2061.0, 3989.0, 7531.0, 15450.0, 31953.0, 65300.0, 123829.0, 193606.0, 220035.0, 173617.0, 103827.0, 52640.0, 26024.0, 12299.0, 6357.0, 3166.0, 1808.0, 955.0, 564.0, 311.0, 165.0, 120.0, 74.0, 43.0, 30.0, 18.0, 17.0, 8.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.556640625, -2.466461181640625, -2.37628173828125, -2.286102294921875, -2.1959228515625, -2.105743408203125, -2.01556396484375, -1.925384521484375, -1.835205078125, -1.745025634765625, -1.65484619140625, -1.564666748046875, -1.4744873046875, -1.384307861328125, -1.29412841796875, -1.203948974609375, -1.11376953125, -1.023590087890625, -0.93341064453125, -0.843231201171875, -0.7530517578125, -0.662872314453125, -0.57269287109375, -0.482513427734375, -0.392333984375, -0.302154541015625, -0.21197509765625, -0.121795654296875, -0.0316162109375, 0.058563232421875, 0.14874267578125, 0.238922119140625, 0.3291015625, 0.419281005859375, 0.50946044921875, 0.599639892578125, 0.6898193359375, 0.779998779296875, 0.87017822265625, 0.960357666015625, 1.050537109375, 1.140716552734375, 1.23089599609375, 1.321075439453125, 1.4112548828125, 1.501434326171875, 1.59161376953125, 1.681793212890625, 1.77197265625, 1.862152099609375, 1.95233154296875, 2.042510986328125, 2.1326904296875, 2.222869873046875, 2.31304931640625, 2.403228759765625, 2.493408203125, 2.583587646484375, 2.67376708984375, 2.763946533203125, 2.8541259765625, 2.944305419921875, 3.03448486328125, 3.124664306640625, 3.21484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 2.0, 8.0, 3.0, 5.0, 21.0, 16.0, 21.0, 26.0, 37.0, 35.0, 62.0, 70.0, 64.0, 72.0, 79.0, 65.0, 65.0, 65.0, 58.0, 49.0, 41.0, 40.0, 15.0, 23.0, 14.0, 6.0, 8.0, 6.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.00036907196044921875, -0.0003600269556045532, -0.0003509819507598877, -0.00034193694591522217, -0.00033289194107055664, -0.0003238469362258911, -0.0003148019313812256, -0.00030575692653656006, -0.00029671192169189453, -0.000287666916847229, -0.0002786219120025635, -0.00026957690715789795, -0.0002605319023132324, -0.0002514868974685669, -0.00024244189262390137, -0.00023339688777923584, -0.0002243518829345703, -0.00021530687808990479, -0.00020626187324523926, -0.00019721686840057373, -0.0001881718635559082, -0.00017912685871124268, -0.00017008185386657715, -0.00016103684902191162, -0.0001519918441772461, -0.00014294683933258057, -0.00013390183448791504, -0.0001248568296432495, -0.00011581182479858398, -0.00010676681995391846, -9.772181510925293e-05, -8.86768102645874e-05, -7.963180541992188e-05, -7.058680057525635e-05, -6.154179573059082e-05, -5.249679088592529e-05, -4.3451786041259766e-05, -3.440678119659424e-05, -2.536177635192871e-05, -1.6316771507263184e-05, -7.271766662597656e-06, 1.773238182067871e-06, 1.0818243026733398e-05, 1.9863247871398926e-05, 2.8908252716064453e-05, 3.795325756072998e-05, 4.699826240539551e-05, 5.6043267250061035e-05, 6.508827209472656e-05, 7.413327693939209e-05, 8.317828178405762e-05, 9.222328662872314e-05, 0.00010126829147338867, 0.0001103132963180542, 0.00011935830116271973, 0.00012840330600738525, 0.00013744831085205078, 0.0001464933156967163, 0.00015553832054138184, 0.00016458332538604736, 0.0001736283302307129, 0.00018267333507537842, 0.00019171833992004395, 0.00020076334476470947, 0.000209808349609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 6.0, 10.0, 7.0, 18.0, 21.0, 41.0, 64.0, 78.0, 119.0, 186.0, 237.0, 395.0, 595.0, 823.0, 1369.0, 2052.0, 3268.0, 5544.0, 9619.0, 16276.0, 29419.0, 52562.0, 88484.0, 135717.0, 172672.0, 174389.0, 137966.0, 90934.0, 53495.0, 30469.0, 16947.0, 9774.0, 5674.0, 3428.0, 2098.0, 1316.0, 830.0, 520.0, 382.0, 228.0, 162.0, 123.0, 71.0, 50.0, 29.0, 19.0, 27.0, 16.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-2.619140625, -2.539825439453125, -2.46051025390625, -2.381195068359375, -2.3018798828125, -2.222564697265625, -2.14324951171875, -2.063934326171875, -1.984619140625, -1.905303955078125, -1.82598876953125, -1.746673583984375, -1.6673583984375, -1.588043212890625, -1.50872802734375, -1.429412841796875, -1.35009765625, -1.270782470703125, -1.19146728515625, -1.112152099609375, -1.0328369140625, -0.953521728515625, -0.87420654296875, -0.794891357421875, -0.715576171875, -0.636260986328125, -0.55694580078125, -0.477630615234375, -0.3983154296875, -0.319000244140625, -0.23968505859375, -0.160369873046875, -0.0810546875, -0.001739501953125, 0.07757568359375, 0.156890869140625, 0.2362060546875, 0.315521240234375, 0.39483642578125, 0.474151611328125, 0.553466796875, 0.632781982421875, 0.71209716796875, 0.791412353515625, 0.8707275390625, 0.950042724609375, 1.02935791015625, 1.108673095703125, 1.18798828125, 1.267303466796875, 1.34661865234375, 1.425933837890625, 1.5052490234375, 1.584564208984375, 1.66387939453125, 1.743194580078125, 1.822509765625, 1.901824951171875, 1.98114013671875, 2.060455322265625, 2.1397705078125, 2.219085693359375, 2.29840087890625, 2.377716064453125, 2.45703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 12.0, 6.0, 3.0, 8.0, 11.0, 16.0, 18.0, 16.0, 26.0, 32.0, 42.0, 38.0, 41.0, 50.0, 45.0, 46.0, 47.0, 44.0, 54.0, 56.0, 63.0, 46.0, 39.0, 39.0, 42.0, 30.0, 22.0, 25.0, 19.0, 17.0, 9.0, 8.0, 9.0, 8.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9013671875, -0.8745269775390625, -0.847686767578125, -0.8208465576171875, -0.79400634765625, -0.7671661376953125, -0.740325927734375, -0.7134857177734375, -0.6866455078125, -0.6598052978515625, -0.632965087890625, -0.6061248779296875, -0.57928466796875, -0.5524444580078125, -0.525604248046875, -0.4987640380859375, -0.471923828125, -0.4450836181640625, -0.418243408203125, -0.3914031982421875, -0.36456298828125, -0.3377227783203125, -0.310882568359375, -0.2840423583984375, -0.2572021484375, -0.2303619384765625, -0.203521728515625, -0.1766815185546875, -0.14984130859375, -0.1230010986328125, -0.096160888671875, -0.0693206787109375, -0.04248046875, -0.0156402587890625, 0.011199951171875, 0.0380401611328125, 0.06488037109375, 0.0917205810546875, 0.118560791015625, 0.1454010009765625, 0.1722412109375, 0.1990814208984375, 0.225921630859375, 0.2527618408203125, 0.27960205078125, 0.3064422607421875, 0.333282470703125, 0.3601226806640625, 0.386962890625, 0.4138031005859375, 0.440643310546875, 0.4674835205078125, 0.49432373046875, 0.5211639404296875, 0.548004150390625, 0.5748443603515625, 0.6016845703125, 0.6285247802734375, 0.655364990234375, 0.6822052001953125, 0.70904541015625, 0.7358856201171875, 0.762725830078125, 0.7895660400390625, 0.81640625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 15.0, 7.0, 16.0, 14.0, 28.0, 27.0, 31.0, 31.0, 47.0, 61.0, 57.0, 54.0, 69.0, 76.0, 69.0, 67.0, 54.0, 40.0, 43.0, 39.0, 34.0, 21.0, 22.0, 19.0, 13.0, 11.0, 7.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.125446319580078, -10.81046199798584, -10.495477676391602, -10.180493354797363, -9.865509033203125, -9.550524711608887, -9.235540390014648, -8.920555114746094, -8.605571746826172, -8.290587425231934, -7.975603103637695, -7.660618782043457, -7.345634460449219, -7.0306501388549805, -6.715665340423584, -6.400681018829346, -6.085696220397949, -5.770711898803711, -5.455727577209473, -5.140743255615234, -4.825758934020996, -4.510774612426758, -4.195789813995361, -3.880805492401123, -3.5658211708068848, -3.2508368492126465, -2.935852527618408, -2.620867967605591, -2.3058836460113525, -1.9908993244171143, -1.6759148836135864, -1.3609304428100586, -1.045945167541504, -0.7309607863426208, -0.4159764051437378, -0.10099202394485474, 0.21399235725402832, 0.5289766788482666, 0.8439611196517944, 1.1589455604553223, 1.4739298820495605, 1.7889142036437988, 2.103898525238037, 2.4188830852508545, 2.7338674068450928, 3.048851728439331, 3.3638362884521484, 3.6788206100463867, 3.993804931640625, 4.308789253234863, 4.623773574829102, 4.93875789642334, 5.253742218017578, 5.568726539611816, 5.883711338043213, 6.198695659637451, 6.5136799812316895, 6.828664302825928, 7.143648624420166, 7.458632946014404, 7.773617744445801, 8.088602066040039, 8.403586387634277, 8.718570709228516, 9.033555030822754]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 9.0, 7.0, 6.0, 9.0, 10.0, 16.0, 20.0, 22.0, 23.0, 25.0, 32.0, 32.0, 30.0, 32.0, 39.0, 49.0, 53.0, 52.0, 40.0, 48.0, 48.0, 55.0, 34.0, 42.0, 34.0, 37.0, 41.0, 29.0, 30.0, 20.0, 15.0, 11.0, 12.0, 6.0, 9.0, 7.0, 10.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.45913028717041, -10.176031112670898, -9.892932891845703, -9.609833717346191, -9.32673454284668, -9.043636322021484, -8.760537147521973, -8.477437973022461, -8.194339752197266, -7.911241054534912, -7.6281418800354, -7.345043182373047, -7.061944007873535, -6.778845310211182, -6.495746612548828, -6.212647438049316, -5.929548263549805, -5.646449565887451, -5.3633503913879395, -5.080251693725586, -4.797152519226074, -4.514053821563721, -4.230955123901367, -3.9478561878204346, -3.664757251739502, -3.3816583156585693, -3.0985593795776367, -2.815460681915283, -2.5323617458343506, -2.249262809753418, -1.966163992881775, -1.6830651760101318, -1.3999652862548828, -1.1168663501739502, -0.8337675333023071, -0.5506686568260193, -0.26756978034973145, 0.015529155731201172, 0.29862797260284424, 0.5817267894744873, 0.8648257255554199, 1.1479246616363525, 1.4310234785079956, 1.7141222953796387, 1.9972212314605713, 2.280320167541504, 2.5634188652038574, 2.84651780128479, 3.1296167373657227, 3.4127156734466553, 3.695814609527588, 3.9789133071899414, 4.262012481689453, 4.545111179351807, 4.82820987701416, 5.111309051513672, 5.394407749176025, 5.677506446838379, 5.960605621337891, 6.243704319000244, 6.526803016662598, 6.809902191162109, 7.093000888824463, 7.376099586486816, 7.659198760986328]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 5.0, 8.0, 12.0, 15.0, 10.0, 23.0, 28.0, 36.0, 54.0, 76.0, 107.0, 168.0, 234.0, 272.0, 413.0, 546.0, 862.0, 1252.0, 1772.0, 2810.0, 4282.0, 6457.0, 10547.0, 18630.0, 35090.0, 75368.0, 189024.0, 504500.0, 1066500.0, 1191142.0, 644324.0, 246337.0, 94199.0, 42651.0, 22444.0, 12514.0, 7520.0, 4834.0, 3039.0, 1873.0, 1307.0, 898.0, 627.0, 435.0, 291.0, 223.0, 152.0, 105.0, 85.0, 55.0, 36.0, 22.0, 20.0, 8.0, 12.0, 11.0, 6.0, 9.0, 7.0, 2.0, 4.0], "bins": [-11.90625, -11.5357666015625, -11.165283203125, -10.7947998046875, -10.42431640625, -10.0538330078125, -9.683349609375, -9.3128662109375, -8.9423828125, -8.5718994140625, -8.201416015625, -7.8309326171875, -7.46044921875, -7.0899658203125, -6.719482421875, -6.3489990234375, -5.978515625, -5.6080322265625, -5.237548828125, -4.8670654296875, -4.49658203125, -4.1260986328125, -3.755615234375, -3.3851318359375, -3.0146484375, -2.6441650390625, -2.273681640625, -1.9031982421875, -1.53271484375, -1.1622314453125, -0.791748046875, -0.4212646484375, -0.05078125, 0.3197021484375, 0.690185546875, 1.0606689453125, 1.43115234375, 1.8016357421875, 2.172119140625, 2.5426025390625, 2.9130859375, 3.2835693359375, 3.654052734375, 4.0245361328125, 4.39501953125, 4.7655029296875, 5.135986328125, 5.5064697265625, 5.876953125, 6.2474365234375, 6.617919921875, 6.9884033203125, 7.35888671875, 7.7293701171875, 8.099853515625, 8.4703369140625, 8.8408203125, 9.2113037109375, 9.581787109375, 9.9522705078125, 10.32275390625, 10.6932373046875, 11.063720703125, 11.4342041015625, 11.8046875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 2.0, 7.0, 2.0, 11.0, 16.0, 12.0, 22.0, 11.0, 32.0, 43.0, 28.0, 31.0, 25.0, 39.0, 46.0, 40.0, 47.0, 51.0, 56.0, 39.0, 45.0, 58.0, 49.0, 41.0, 32.0, 31.0, 37.0, 29.0, 23.0, 16.0, 8.0, 12.0, 14.0, 11.0, 5.0, 12.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.32275390625, -9.0595703125, -8.79638671875, -8.533203125, -8.27001953125, -8.0068359375, -7.74365234375, -7.48046875, -7.21728515625, -6.9541015625, -6.69091796875, -6.427734375, -6.16455078125, -5.9013671875, -5.63818359375, -5.375, -5.11181640625, -4.8486328125, -4.58544921875, -4.322265625, -4.05908203125, -3.7958984375, -3.53271484375, -3.26953125, -3.00634765625, -2.7431640625, -2.47998046875, -2.216796875, -1.95361328125, -1.6904296875, -1.42724609375, -1.1640625, -0.90087890625, -0.6376953125, -0.37451171875, -0.111328125, 0.15185546875, 0.4150390625, 0.67822265625, 0.94140625, 1.20458984375, 1.4677734375, 1.73095703125, 1.994140625, 2.25732421875, 2.5205078125, 2.78369140625, 3.046875, 3.31005859375, 3.5732421875, 3.83642578125, 4.099609375, 4.36279296875, 4.6259765625, 4.88916015625, 5.15234375, 5.41552734375, 5.6787109375, 5.94189453125, 6.205078125, 6.46826171875, 6.7314453125, 6.99462890625, 7.2578125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 8.0, 9.0, 14.0, 15.0, 16.0, 39.0, 69.0, 89.0, 121.0, 175.0, 242.0, 364.0, 538.0, 896.0, 1297.0, 1826.0, 2771.0, 4235.0, 6239.0, 10028.0, 16407.0, 28726.0, 53989.0, 113963.0, 271265.0, 656415.0, 1152626.0, 1004377.0, 481788.0, 195660.0, 85821.0, 42344.0, 23450.0, 13757.0, 8618.0, 5458.0, 3535.0, 2262.0, 1591.0, 1064.0, 719.0, 472.0, 326.0, 239.0, 152.0, 107.0, 55.0, 34.0, 27.0, 19.0, 14.0, 11.0, 1.0, 3.0, 4.0, 2.0, 2.0], "bins": [-14.171875, -13.7528076171875, -13.333740234375, -12.9146728515625, -12.49560546875, -12.0765380859375, -11.657470703125, -11.2384033203125, -10.8193359375, -10.4002685546875, -9.981201171875, -9.5621337890625, -9.14306640625, -8.7239990234375, -8.304931640625, -7.8858642578125, -7.466796875, -7.0477294921875, -6.628662109375, -6.2095947265625, -5.79052734375, -5.3714599609375, -4.952392578125, -4.5333251953125, -4.1142578125, -3.6951904296875, -3.276123046875, -2.8570556640625, -2.43798828125, -2.0189208984375, -1.599853515625, -1.1807861328125, -0.76171875, -0.3426513671875, 0.076416015625, 0.4954833984375, 0.91455078125, 1.3336181640625, 1.752685546875, 2.1717529296875, 2.5908203125, 3.0098876953125, 3.428955078125, 3.8480224609375, 4.26708984375, 4.6861572265625, 5.105224609375, 5.5242919921875, 5.943359375, 6.3624267578125, 6.781494140625, 7.2005615234375, 7.61962890625, 8.0386962890625, 8.457763671875, 8.8768310546875, 9.2958984375, 9.7149658203125, 10.134033203125, 10.5531005859375, 10.97216796875, 11.3912353515625, 11.810302734375, 12.2293701171875, 12.6484375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 4.0, 6.0, 6.0, 10.0, 14.0, 10.0, 11.0, 22.0, 36.0, 19.0, 32.0, 37.0, 62.0, 71.0, 94.0, 96.0, 120.0, 157.0, 193.0, 197.0, 207.0, 233.0, 232.0, 240.0, 271.0, 244.0, 226.0, 213.0, 194.0, 160.0, 126.0, 97.0, 90.0, 57.0, 52.0, 47.0, 33.0, 31.0, 24.0, 20.0, 25.0, 12.0, 11.0, 10.0, 7.0, 3.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0], "bins": [-3.9921875, -3.87774658203125, -3.7633056640625, -3.64886474609375, -3.534423828125, -3.41998291015625, -3.3055419921875, -3.19110107421875, -3.07666015625, -2.96221923828125, -2.8477783203125, -2.73333740234375, -2.618896484375, -2.50445556640625, -2.3900146484375, -2.27557373046875, -2.1611328125, -2.04669189453125, -1.9322509765625, -1.81781005859375, -1.703369140625, -1.58892822265625, -1.4744873046875, -1.36004638671875, -1.24560546875, -1.13116455078125, -1.0167236328125, -0.90228271484375, -0.787841796875, -0.67340087890625, -0.5589599609375, -0.44451904296875, -0.330078125, -0.21563720703125, -0.1011962890625, 0.01324462890625, 0.127685546875, 0.24212646484375, 0.3565673828125, 0.47100830078125, 0.58544921875, 0.69989013671875, 0.8143310546875, 0.92877197265625, 1.043212890625, 1.15765380859375, 1.2720947265625, 1.38653564453125, 1.5009765625, 1.61541748046875, 1.7298583984375, 1.84429931640625, 1.958740234375, 2.07318115234375, 2.1876220703125, 2.30206298828125, 2.41650390625, 2.53094482421875, 2.6453857421875, 2.75982666015625, 2.874267578125, 2.98870849609375, 3.1031494140625, 3.21759033203125, 3.33203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 11.0, 8.0, 11.0, 15.0, 15.0, 23.0, 20.0, 47.0, 55.0, 60.0, 76.0, 83.0, 97.0, 82.0, 89.0, 74.0, 56.0, 47.0, 30.0, 28.0, 18.0, 17.0, 16.0, 13.0, 2.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.70612907409668, -19.1993465423584, -18.69256591796875, -18.18578338623047, -17.679000854492188, -17.172218322753906, -16.665435791015625, -16.158655166625977, -15.651872634887695, -15.145090103149414, -14.63830852508545, -14.131526947021484, -13.624744415283203, -13.117961883544922, -12.611180305480957, -12.104398727416992, -11.597616195678711, -11.09083366394043, -10.584052085876465, -10.0772705078125, -9.570487976074219, -9.063705444335938, -8.556923866271973, -8.050142288208008, -7.543359756469727, -7.0365777015686035, -6.5297956466674805, -6.023013591766357, -5.516231536865234, -5.009449481964111, -4.502667427062988, -3.9958853721618652, -3.4891042709350586, -2.9823222160339355, -2.4755401611328125, -1.9687581062316895, -1.4619760513305664, -0.9551939964294434, -0.4484119415283203, 0.058370113372802734, 0.5651521682739258, 1.0719342231750488, 1.5787162780761719, 2.085498332977295, 2.592280387878418, 3.099062442779541, 3.605844497680664, 4.112626552581787, 4.61940860748291, 5.126190662384033, 5.632972717285156, 6.139754772186279, 6.646536827087402, 7.153318881988525, 7.660100936889648, 8.16688346862793, 8.673665046691895, 9.18044662475586, 9.68722915649414, 10.194011688232422, 10.700793266296387, 11.207574844360352, 11.714357376098633, 12.221139907836914, 12.727921485900879]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 9.0, 14.0, 18.0, 16.0, 17.0, 17.0, 21.0, 26.0, 31.0, 29.0, 35.0, 43.0, 50.0, 39.0, 46.0, 44.0, 39.0, 50.0, 55.0, 48.0, 40.0, 37.0, 34.0, 31.0, 39.0, 30.0, 21.0, 15.0, 21.0, 14.0, 7.0, 11.0, 9.0, 8.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.488200187683105, -11.170955657958984, -10.853710174560547, -10.536465644836426, -10.219221115112305, -9.901975631713867, -9.584731101989746, -9.267486572265625, -8.950241088867188, -8.632996559143066, -8.315751075744629, -7.998506546020508, -7.681262016296387, -7.364017009735107, -7.046772003173828, -6.729527473449707, -6.412282943725586, -6.095037937164307, -5.7777934074401855, -5.460548400878906, -5.143303871154785, -4.826058864593506, -4.508813858032227, -4.1915693283081055, -3.874324321746826, -3.557079553604126, -3.239834785461426, -2.9225897789001465, -2.6053450107574463, -2.288100242614746, -1.9708553552627563, -1.6536104679107666, -1.3363656997680664, -1.0191209316253662, -0.7018760442733765, -0.3846312165260315, -0.06738638877868652, 0.24985837936401367, 0.5671032667160034, 0.8843481540679932, 1.2015929222106934, 1.5188376903533936, 1.8360825777053833, 2.153327465057373, 2.4705722332000732, 2.7878170013427734, 3.1050620079040527, 3.422306776046753, 3.739551544189453, 4.056796550750732, 4.3740410804748535, 4.691286087036133, 5.008530616760254, 5.325775623321533, 5.6430206298828125, 5.960265159606934, 6.277510166168213, 6.594755172729492, 6.911999702453613, 7.229244709014893, 7.546489715576172, 7.863734245300293, 8.180978775024414, 8.498224258422852, 8.815468788146973]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 9.0, 11.0, 12.0, 19.0, 22.0, 50.0, 83.0, 122.0, 189.0, 301.0, 501.0, 844.0, 1352.0, 2290.0, 3811.0, 6484.0, 11006.0, 19297.0, 33649.0, 60872.0, 108827.0, 183390.0, 226233.0, 166695.0, 97095.0, 54055.0, 29728.0, 17139.0, 9912.0, 5800.0, 3420.0, 2076.0, 1222.0, 774.0, 486.0, 303.0, 180.0, 99.0, 70.0, 37.0, 27.0, 20.0, 14.0, 16.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.6279296875, -1.581939697265625, -1.53594970703125, -1.489959716796875, -1.4439697265625, -1.397979736328125, -1.35198974609375, -1.305999755859375, -1.260009765625, -1.214019775390625, -1.16802978515625, -1.122039794921875, -1.0760498046875, -1.030059814453125, -0.98406982421875, -0.938079833984375, -0.89208984375, -0.846099853515625, -0.80010986328125, -0.754119873046875, -0.7081298828125, -0.662139892578125, -0.61614990234375, -0.570159912109375, -0.524169921875, -0.478179931640625, -0.43218994140625, -0.386199951171875, -0.3402099609375, -0.294219970703125, -0.24822998046875, -0.202239990234375, -0.15625, -0.110260009765625, -0.06427001953125, -0.018280029296875, 0.0277099609375, 0.073699951171875, 0.11968994140625, 0.165679931640625, 0.211669921875, 0.257659912109375, 0.30364990234375, 0.349639892578125, 0.3956298828125, 0.441619873046875, 0.48760986328125, 0.533599853515625, 0.57958984375, 0.625579833984375, 0.67156982421875, 0.717559814453125, 0.7635498046875, 0.809539794921875, 0.85552978515625, 0.901519775390625, 0.947509765625, 0.993499755859375, 1.03948974609375, 1.085479736328125, 1.1314697265625, 1.177459716796875, 1.22344970703125, 1.269439697265625, 1.3154296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 8.0, 4.0, 10.0, 8.0, 16.0, 16.0, 14.0, 15.0, 16.0, 23.0, 33.0, 26.0, 29.0, 31.0, 42.0, 49.0, 53.0, 43.0, 41.0, 52.0, 53.0, 46.0, 44.0, 44.0, 36.0, 28.0, 40.0, 31.0, 27.0, 18.0, 23.0, 21.0, 13.0, 13.0, 10.0, 5.0, 4.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.546875, -12.2095947265625, -11.872314453125, -11.5350341796875, -11.19775390625, -10.8604736328125, -10.523193359375, -10.1859130859375, -9.8486328125, -9.5113525390625, -9.174072265625, -8.8367919921875, -8.49951171875, -8.1622314453125, -7.824951171875, -7.4876708984375, -7.150390625, -6.8131103515625, -6.475830078125, -6.1385498046875, -5.80126953125, -5.4639892578125, -5.126708984375, -4.7894287109375, -4.4521484375, -4.1148681640625, -3.777587890625, -3.4403076171875, -3.10302734375, -2.7657470703125, -2.428466796875, -2.0911865234375, -1.75390625, -1.4166259765625, -1.079345703125, -0.7420654296875, -0.40478515625, -0.0675048828125, 0.269775390625, 0.6070556640625, 0.9443359375, 1.2816162109375, 1.618896484375, 1.9561767578125, 2.29345703125, 2.6307373046875, 2.968017578125, 3.3052978515625, 3.642578125, 3.9798583984375, 4.317138671875, 4.6544189453125, 4.99169921875, 5.3289794921875, 5.666259765625, 6.0035400390625, 6.3408203125, 6.6781005859375, 7.015380859375, 7.3526611328125, 7.68994140625, 8.0272216796875, 8.364501953125, 8.7017822265625, 9.0390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 0.0, 4.0, 6.0, 8.0, 14.0, 10.0, 13.0, 15.0, 30.0, 50.0, 79.0, 105.0, 153.0, 243.0, 352.0, 509.0, 889.0, 1307.0, 2160.0, 3517.0, 5616.0, 9923.0, 18176.0, 48203.0, 476154.0, 395067.0, 44409.0, 17391.0, 9437.0, 5507.0, 3292.0, 2091.0, 1296.0, 837.0, 571.0, 357.0, 240.0, 154.0, 120.0, 90.0, 54.0, 30.0, 33.0, 17.0, 12.0, 9.0, 4.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462890625, -2.37786865234375, -2.2928466796875, -2.20782470703125, -2.122802734375, -2.03778076171875, -1.9527587890625, -1.86773681640625, -1.78271484375, -1.69769287109375, -1.6126708984375, -1.52764892578125, -1.442626953125, -1.35760498046875, -1.2725830078125, -1.18756103515625, -1.1025390625, -1.01751708984375, -0.9324951171875, -0.84747314453125, -0.762451171875, -0.67742919921875, -0.5924072265625, -0.50738525390625, -0.42236328125, -0.33734130859375, -0.2523193359375, -0.16729736328125, -0.082275390625, 0.00274658203125, 0.0877685546875, 0.17279052734375, 0.2578125, 0.34283447265625, 0.4278564453125, 0.51287841796875, 0.597900390625, 0.68292236328125, 0.7679443359375, 0.85296630859375, 0.93798828125, 1.02301025390625, 1.1080322265625, 1.19305419921875, 1.278076171875, 1.36309814453125, 1.4481201171875, 1.53314208984375, 1.6181640625, 1.70318603515625, 1.7882080078125, 1.87322998046875, 1.958251953125, 2.04327392578125, 2.1282958984375, 2.21331787109375, 2.29833984375, 2.38336181640625, 2.4683837890625, 2.55340576171875, 2.638427734375, 2.72344970703125, 2.8084716796875, 2.89349365234375, 2.978515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 2.0, 1.0, 8.0, 8.0, 9.0, 20.0, 10.0, 13.0, 18.0, 19.0, 17.0, 23.0, 26.0, 28.0, 21.0, 28.0, 35.0, 35.0, 41.0, 46.0, 43.0, 41.0, 37.0, 42.0, 35.0, 39.0, 35.0, 36.0, 29.0, 29.0, 28.0, 29.0, 18.0, 19.0, 22.0, 12.0, 18.0, 20.0, 10.0, 14.0, 3.0, 7.0, 4.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.8671875, -6.64080810546875, -6.4144287109375, -6.18804931640625, -5.961669921875, -5.73529052734375, -5.5089111328125, -5.28253173828125, -5.05615234375, -4.82977294921875, -4.6033935546875, -4.37701416015625, -4.150634765625, -3.92425537109375, -3.6978759765625, -3.47149658203125, -3.2451171875, -3.01873779296875, -2.7923583984375, -2.56597900390625, -2.339599609375, -2.11322021484375, -1.8868408203125, -1.66046142578125, -1.43408203125, -1.20770263671875, -0.9813232421875, -0.75494384765625, -0.528564453125, -0.30218505859375, -0.0758056640625, 0.15057373046875, 0.376953125, 0.60333251953125, 0.8297119140625, 1.05609130859375, 1.282470703125, 1.50885009765625, 1.7352294921875, 1.96160888671875, 2.18798828125, 2.41436767578125, 2.6407470703125, 2.86712646484375, 3.093505859375, 3.31988525390625, 3.5462646484375, 3.77264404296875, 3.9990234375, 4.22540283203125, 4.4517822265625, 4.67816162109375, 4.904541015625, 5.13092041015625, 5.3572998046875, 5.58367919921875, 5.81005859375, 6.03643798828125, 6.2628173828125, 6.48919677734375, 6.715576171875, 6.94195556640625, 7.1683349609375, 7.39471435546875, 7.62109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 8.0, 13.0, 26.0, 23.0, 45.0, 70.0, 98.0, 153.0, 207.0, 296.0, 497.0, 818.0, 1344.0, 2290.0, 4027.0, 7239.0, 14558.0, 34102.0, 640338.0, 283509.0, 29545.0, 13040.0, 6732.0, 3808.0, 2227.0, 1306.0, 765.0, 514.0, 310.0, 227.0, 107.0, 93.0, 55.0, 40.0, 41.0, 23.0, 9.0, 8.0, 15.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.81591796875, -0.7911300659179688, -0.7663421630859375, -0.7415542602539062, -0.716766357421875, -0.6919784545898438, -0.6671905517578125, -0.6424026489257812, -0.61761474609375, -0.5928268432617188, -0.5680389404296875, -0.5432510375976562, -0.518463134765625, -0.49367523193359375, -0.4688873291015625, -0.44409942626953125, -0.4193115234375, -0.39452362060546875, -0.3697357177734375, -0.34494781494140625, -0.320159912109375, -0.29537200927734375, -0.2705841064453125, -0.24579620361328125, -0.22100830078125, -0.19622039794921875, -0.1714324951171875, -0.14664459228515625, -0.121856689453125, -0.09706878662109375, -0.0722808837890625, -0.04749298095703125, -0.022705078125, 0.00208282470703125, 0.0268707275390625, 0.05165863037109375, 0.076446533203125, 0.10123443603515625, 0.1260223388671875, 0.15081024169921875, 0.17559814453125, 0.20038604736328125, 0.2251739501953125, 0.24996185302734375, 0.274749755859375, 0.29953765869140625, 0.3243255615234375, 0.34911346435546875, 0.3739013671875, 0.39868927001953125, 0.4234771728515625, 0.44826507568359375, 0.473052978515625, 0.49784088134765625, 0.5226287841796875, 0.5474166870117188, 0.57220458984375, 0.5969924926757812, 0.6217803955078125, 0.6465682983398438, 0.671356201171875, 0.6961441040039062, 0.7209320068359375, 0.7457199096679688, 0.7705078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 7.0, 8.0, 16.0, 14.0, 20.0, 18.0, 38.0, 52.0, 40.0, 59.0, 77.0, 85.0, 75.0, 87.0, 77.0, 61.0, 62.0, 45.0, 38.0, 16.0, 25.0, 20.0, 10.0, 12.0, 8.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7835369110107422e-05, -2.6979483664035797e-05, -2.6123598217964172e-05, -2.5267712771892548e-05, -2.4411827325820923e-05, -2.3555941879749298e-05, -2.2700056433677673e-05, -2.184417098760605e-05, -2.0988285541534424e-05, -2.01324000954628e-05, -1.9276514649391174e-05, -1.842062920331955e-05, -1.7564743757247925e-05, -1.67088583111763e-05, -1.5852972865104675e-05, -1.499708741903305e-05, -1.4141201972961426e-05, -1.3285316526889801e-05, -1.2429431080818176e-05, -1.1573545634746552e-05, -1.0717660188674927e-05, -9.861774742603302e-06, -9.005889296531677e-06, -8.150003850460052e-06, -7.294118404388428e-06, -6.438232958316803e-06, -5.582347512245178e-06, -4.7264620661735535e-06, -3.870576620101929e-06, -3.014691174030304e-06, -2.158805727958679e-06, -1.3029202818870544e-06, -4.470348358154297e-07, 4.0885061025619507e-07, 1.2647360563278198e-06, 2.1206215023994446e-06, 2.9765069484710693e-06, 3.832392394542694e-06, 4.688277840614319e-06, 5.544163286685944e-06, 6.400048732757568e-06, 7.255934178829193e-06, 8.111819624900818e-06, 8.967705070972443e-06, 9.823590517044067e-06, 1.0679475963115692e-05, 1.1535361409187317e-05, 1.2391246855258942e-05, 1.3247132301330566e-05, 1.4103017747402191e-05, 1.4958903193473816e-05, 1.581478863954544e-05, 1.6670674085617065e-05, 1.752655953168869e-05, 1.8382444977760315e-05, 1.923833042383194e-05, 2.0094215869903564e-05, 2.095010131597519e-05, 2.1805986762046814e-05, 2.266187220811844e-05, 2.3517757654190063e-05, 2.4373643100261688e-05, 2.5229528546333313e-05, 2.6085413992404938e-05, 2.6941299438476562e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 17.0, 20.0, 15.0, 23.0, 44.0, 65.0, 107.0, 106.0, 149.0, 186.0, 267.0, 385.0, 492.0, 666.0, 956.0, 1543.0, 2475.0, 4274.0, 7686.0, 15068.0, 32855.0, 77641.0, 203664.0, 375815.0, 187579.0, 72579.0, 30745.0, 14459.0, 7354.0, 4002.0, 2360.0, 1548.0, 945.0, 661.0, 478.0, 336.0, 257.0, 202.0, 148.0, 80.0, 78.0, 55.0, 48.0, 40.0, 28.0, 11.0, 13.0, 7.0, 7.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.033203125, -1.001373291015625, -0.96954345703125, -0.937713623046875, -0.9058837890625, -0.874053955078125, -0.84222412109375, -0.810394287109375, -0.778564453125, -0.746734619140625, -0.71490478515625, -0.683074951171875, -0.6512451171875, -0.619415283203125, -0.58758544921875, -0.555755615234375, -0.52392578125, -0.492095947265625, -0.46026611328125, -0.428436279296875, -0.3966064453125, -0.364776611328125, -0.33294677734375, -0.301116943359375, -0.269287109375, -0.237457275390625, -0.20562744140625, -0.173797607421875, -0.1419677734375, -0.110137939453125, -0.07830810546875, -0.046478271484375, -0.0146484375, 0.017181396484375, 0.04901123046875, 0.080841064453125, 0.1126708984375, 0.144500732421875, 0.17633056640625, 0.208160400390625, 0.239990234375, 0.271820068359375, 0.30364990234375, 0.335479736328125, 0.3673095703125, 0.399139404296875, 0.43096923828125, 0.462799072265625, 0.49462890625, 0.526458740234375, 0.55828857421875, 0.590118408203125, 0.6219482421875, 0.653778076171875, 0.68560791015625, 0.717437744140625, 0.749267578125, 0.781097412109375, 0.81292724609375, 0.844757080078125, 0.8765869140625, 0.908416748046875, 0.94024658203125, 0.972076416015625, 1.00390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 6.0, 4.0, 4.0, 6.0, 7.0, 7.0, 6.0, 16.0, 16.0, 20.0, 30.0, 31.0, 29.0, 51.0, 55.0, 52.0, 52.0, 66.0, 85.0, 77.0, 59.0, 68.0, 46.0, 51.0, 38.0, 19.0, 16.0, 8.0, 19.0, 12.0, 9.0, 14.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.277099609375, -0.2676658630371094, -0.25823211669921875, -0.24879837036132812, -0.2393646240234375, -0.22993087768554688, -0.22049713134765625, -0.21106338500976562, -0.201629638671875, -0.19219589233398438, -0.18276214599609375, -0.17332839965820312, -0.1638946533203125, -0.15446090698242188, -0.14502716064453125, -0.13559341430664062, -0.12615966796875, -0.11672592163085938, -0.10729217529296875, -0.09785842895507812, -0.0884246826171875, -0.07899093627929688, -0.06955718994140625, -0.060123443603515625, -0.050689697265625, -0.041255950927734375, -0.03182220458984375, -0.022388458251953125, -0.0129547119140625, -0.003520965576171875, 0.00591278076171875, 0.015346527099609375, 0.0247802734375, 0.034214019775390625, 0.04364776611328125, 0.053081512451171875, 0.0625152587890625, 0.07194900512695312, 0.08138275146484375, 0.09081649780273438, 0.100250244140625, 0.10968399047851562, 0.11911773681640625, 0.12855148315429688, 0.1379852294921875, 0.14741897583007812, 0.15685272216796875, 0.16628646850585938, 0.17572021484375, 0.18515396118164062, 0.19458770751953125, 0.20402145385742188, 0.2134552001953125, 0.22288894653320312, 0.23232269287109375, 0.24175643920898438, 0.251190185546875, 0.2606239318847656, 0.27005767822265625, 0.2794914245605469, 0.2889251708984375, 0.2983589172363281, 0.30779266357421875, 0.3172264099121094, 0.32666015625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 12.0, 13.0, 12.0, 23.0, 25.0, 36.0, 51.0, 71.0, 61.0, 78.0, 98.0, 76.0, 93.0, 70.0, 70.0, 45.0, 37.0, 29.0, 21.0, 17.0, 14.0, 19.0, 7.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.979188919067383, -18.48151397705078, -17.98383903503418, -17.486164093017578, -16.98849105834961, -16.490816116333008, -15.993141174316406, -15.495466232299805, -14.99779224395752, -14.500117301940918, -14.002443313598633, -13.504768371582031, -13.00709342956543, -12.509419441223145, -12.011744499206543, -11.514070510864258, -11.016395568847656, -10.518720626831055, -10.02104663848877, -9.523371696472168, -9.025696754455566, -8.528022766113281, -8.03034782409668, -7.532673358917236, -7.034997940063477, -6.537323474884033, -6.039648532867432, -5.541974067687988, -5.044299602508545, -4.546625137329102, -4.0489501953125, -3.5512757301330566, -3.0536012649536133, -2.555926561355591, -2.0582520961761475, -1.560577392578125, -1.062902808189392, -0.5652282238006592, -0.06755352020263672, 0.43012094497680664, 0.9277956485748291, 1.425470232963562, 1.923144817352295, 2.4208195209503174, 2.91849422454834, 3.416168689727783, 3.9138433933258057, 4.411518096923828, 4.9091925621032715, 5.406867027282715, 5.904541969299316, 6.40221643447876, 6.899890899658203, 7.397565841674805, 7.895240306854248, 8.392914772033691, 8.890589714050293, 9.388264656066895, 9.88593864440918, 10.383613586425781, 10.881288528442383, 11.378962516784668, 11.87663745880127, 12.374311447143555, 12.871986389160156]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 2.0, 11.0, 10.0, 15.0, 16.0, 15.0, 17.0, 18.0, 20.0, 27.0, 37.0, 30.0, 34.0, 39.0, 49.0, 43.0, 43.0, 46.0, 47.0, 52.0, 48.0, 44.0, 45.0, 37.0, 32.0, 39.0, 38.0, 24.0, 18.0, 18.0, 17.0, 14.0, 10.0, 11.0, 5.0, 8.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-11.588478088378906, -11.267852783203125, -10.947226524353027, -10.626601219177246, -10.305974960327148, -9.985349655151367, -9.664724349975586, -9.344099044799805, -9.023472785949707, -8.702847480773926, -8.382221221923828, -8.061595916748047, -7.740970134735107, -7.420344352722168, -7.099719047546387, -6.779093265533447, -6.458467483520508, -6.137841701507568, -5.817215919494629, -5.496590614318848, -5.175964832305908, -4.855339050292969, -4.5347137451171875, -4.214087963104248, -3.8934621810913086, -3.572836399078369, -3.252210855484009, -2.9315853118896484, -2.610959529876709, -2.2903337478637695, -1.9697082042694092, -1.6490826606750488, -1.3284578323364258, -1.0078321695327759, -0.687206506729126, -0.3665808439254761, -0.04595518112182617, 0.27467048168182373, 0.5952961444854736, 0.915921688079834, 1.2365474700927734, 1.5571731328964233, 1.8777987957000732, 2.1984243392944336, 2.519050121307373, 2.8396759033203125, 3.160301446914673, 3.480926990509033, 3.8015527725219727, 4.122178554534912, 4.442804336547852, 4.763429641723633, 5.084055423736572, 5.404681205749512, 5.725306510925293, 6.045932292938232, 6.366558074951172, 6.687183856964111, 7.007809638977051, 7.328434944152832, 7.6490607261657715, 7.969686508178711, 8.290311813354492, 8.610937118530273, 8.931563377380371]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 3.0, 2.0, 7.0, 6.0, 16.0, 24.0, 25.0, 26.0, 42.0, 52.0, 64.0, 76.0, 111.0, 144.0, 176.0, 264.0, 412.0, 610.0, 861.0, 1381.0, 2079.0, 3464.0, 5967.0, 10358.0, 19767.0, 38164.0, 74685.0, 138321.0, 210152.0, 217471.0, 149045.0, 82583.0, 42125.0, 21696.0, 11504.0, 6417.0, 3669.0, 2287.0, 1421.0, 944.0, 615.0, 438.0, 266.0, 191.0, 154.0, 109.0, 99.0, 56.0, 57.0, 29.0, 29.0, 35.0, 18.0, 12.0, 13.0, 9.0, 6.0, 1.0, 5.0, 2.0, 3.0, 1.0], "bins": [-8.78125, -8.4986572265625, -8.216064453125, -7.9334716796875, -7.65087890625, -7.3682861328125, -7.085693359375, -6.8031005859375, -6.5205078125, -6.2379150390625, -5.955322265625, -5.6727294921875, -5.39013671875, -5.1075439453125, -4.824951171875, -4.5423583984375, -4.259765625, -3.9771728515625, -3.694580078125, -3.4119873046875, -3.12939453125, -2.8468017578125, -2.564208984375, -2.2816162109375, -1.9990234375, -1.7164306640625, -1.433837890625, -1.1512451171875, -0.86865234375, -0.5860595703125, -0.303466796875, -0.0208740234375, 0.26171875, 0.5443115234375, 0.826904296875, 1.1094970703125, 1.39208984375, 1.6746826171875, 1.957275390625, 2.2398681640625, 2.5224609375, 2.8050537109375, 3.087646484375, 3.3702392578125, 3.65283203125, 3.9354248046875, 4.218017578125, 4.5006103515625, 4.783203125, 5.0657958984375, 5.348388671875, 5.6309814453125, 5.91357421875, 6.1961669921875, 6.478759765625, 6.7613525390625, 7.0439453125, 7.3265380859375, 7.609130859375, 7.8917236328125, 8.17431640625, 8.4569091796875, 8.739501953125, 9.0220947265625, 9.3046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 11.0, 10.0, 19.0, 14.0, 13.0, 18.0, 30.0, 21.0, 26.0, 28.0, 33.0, 30.0, 38.0, 47.0, 41.0, 43.0, 39.0, 44.0, 46.0, 36.0, 43.0, 46.0, 44.0, 38.0, 29.0, 24.0, 32.0, 26.0, 15.0, 27.0, 14.0, 15.0, 8.0, 7.0, 6.0, 4.0, 7.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5390625, -9.2442626953125, -8.949462890625, -8.6546630859375, -8.35986328125, -8.0650634765625, -7.770263671875, -7.4754638671875, -7.1806640625, -6.8858642578125, -6.591064453125, -6.2962646484375, -6.00146484375, -5.7066650390625, -5.411865234375, -5.1170654296875, -4.822265625, -4.5274658203125, -4.232666015625, -3.9378662109375, -3.64306640625, -3.3482666015625, -3.053466796875, -2.7586669921875, -2.4638671875, -2.1690673828125, -1.874267578125, -1.5794677734375, -1.28466796875, -0.9898681640625, -0.695068359375, -0.4002685546875, -0.10546875, 0.1893310546875, 0.484130859375, 0.7789306640625, 1.07373046875, 1.3685302734375, 1.663330078125, 1.9581298828125, 2.2529296875, 2.5477294921875, 2.842529296875, 3.1373291015625, 3.43212890625, 3.7269287109375, 4.021728515625, 4.3165283203125, 4.611328125, 4.9061279296875, 5.200927734375, 5.4957275390625, 5.79052734375, 6.0853271484375, 6.380126953125, 6.6749267578125, 6.9697265625, 7.2645263671875, 7.559326171875, 7.8541259765625, 8.14892578125, 8.4437255859375, 8.738525390625, 9.0333251953125, 9.328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 4.0, 9.0, 7.0, 11.0, 20.0, 18.0, 22.0, 29.0, 27.0, 61.0, 76.0, 106.0, 155.0, 266.0, 526.0, 871.0, 1567.0, 3158.0, 7122.0, 17447.0, 47069.0, 128930.0, 284762.0, 307907.0, 154321.0, 56641.0, 21055.0, 8494.0, 3688.0, 1817.0, 925.0, 503.0, 334.0, 176.0, 114.0, 96.0, 55.0, 46.0, 27.0, 27.0, 23.0, 10.0, 12.0, 9.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.078125, -15.59228515625, -15.1064453125, -14.62060546875, -14.134765625, -13.64892578125, -13.1630859375, -12.67724609375, -12.19140625, -11.70556640625, -11.2197265625, -10.73388671875, -10.248046875, -9.76220703125, -9.2763671875, -8.79052734375, -8.3046875, -7.81884765625, -7.3330078125, -6.84716796875, -6.361328125, -5.87548828125, -5.3896484375, -4.90380859375, -4.41796875, -3.93212890625, -3.4462890625, -2.96044921875, -2.474609375, -1.98876953125, -1.5029296875, -1.01708984375, -0.53125, -0.04541015625, 0.4404296875, 0.92626953125, 1.412109375, 1.89794921875, 2.3837890625, 2.86962890625, 3.35546875, 3.84130859375, 4.3271484375, 4.81298828125, 5.298828125, 5.78466796875, 6.2705078125, 6.75634765625, 7.2421875, 7.72802734375, 8.2138671875, 8.69970703125, 9.185546875, 9.67138671875, 10.1572265625, 10.64306640625, 11.12890625, 11.61474609375, 12.1005859375, 12.58642578125, 13.072265625, 13.55810546875, 14.0439453125, 14.52978515625, 15.015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 4.0, 3.0, 12.0, 14.0, 12.0, 18.0, 16.0, 20.0, 25.0, 23.0, 22.0, 32.0, 45.0, 32.0, 52.0, 39.0, 45.0, 47.0, 47.0, 44.0, 46.0, 37.0, 45.0, 36.0, 38.0, 35.0, 27.0, 22.0, 27.0, 23.0, 16.0, 10.0, 14.0, 8.0, 13.0, 9.0, 7.0, 12.0, 3.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.04296875, -5.84735107421875, -5.6517333984375, -5.45611572265625, -5.260498046875, -5.06488037109375, -4.8692626953125, -4.67364501953125, -4.47802734375, -4.28240966796875, -4.0867919921875, -3.89117431640625, -3.695556640625, -3.49993896484375, -3.3043212890625, -3.10870361328125, -2.9130859375, -2.71746826171875, -2.5218505859375, -2.32623291015625, -2.130615234375, -1.93499755859375, -1.7393798828125, -1.54376220703125, -1.34814453125, -1.15252685546875, -0.9569091796875, -0.76129150390625, -0.565673828125, -0.37005615234375, -0.1744384765625, 0.02117919921875, 0.216796875, 0.41241455078125, 0.6080322265625, 0.80364990234375, 0.999267578125, 1.19488525390625, 1.3905029296875, 1.58612060546875, 1.78173828125, 1.97735595703125, 2.1729736328125, 2.36859130859375, 2.564208984375, 2.75982666015625, 2.9554443359375, 3.15106201171875, 3.3466796875, 3.54229736328125, 3.7379150390625, 3.93353271484375, 4.129150390625, 4.32476806640625, 4.5203857421875, 4.71600341796875, 4.91162109375, 5.10723876953125, 5.3028564453125, 5.49847412109375, 5.694091796875, 5.88970947265625, 6.0853271484375, 6.28094482421875, 6.4765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 7.0, 12.0, 22.0, 25.0, 34.0, 45.0, 70.0, 91.0, 125.0, 188.0, 230.0, 371.0, 531.0, 760.0, 1150.0, 1723.0, 2704.0, 4530.0, 7654.0, 13970.0, 28488.0, 61163.0, 136162.0, 244902.0, 256338.0, 149999.0, 69087.0, 31053.0, 15394.0, 8301.0, 4895.0, 2847.0, 1810.0, 1258.0, 842.0, 517.0, 366.0, 247.0, 187.0, 120.0, 94.0, 84.0, 43.0, 29.0, 19.0, 23.0, 16.0, 12.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0], "bins": [-6.08203125, -5.90350341796875, -5.7249755859375, -5.54644775390625, -5.367919921875, -5.18939208984375, -5.0108642578125, -4.83233642578125, -4.65380859375, -4.47528076171875, -4.2967529296875, -4.11822509765625, -3.939697265625, -3.76116943359375, -3.5826416015625, -3.40411376953125, -3.2255859375, -3.04705810546875, -2.8685302734375, -2.69000244140625, -2.511474609375, -2.33294677734375, -2.1544189453125, -1.97589111328125, -1.79736328125, -1.61883544921875, -1.4403076171875, -1.26177978515625, -1.083251953125, -0.90472412109375, -0.7261962890625, -0.54766845703125, -0.369140625, -0.19061279296875, -0.0120849609375, 0.16644287109375, 0.344970703125, 0.52349853515625, 0.7020263671875, 0.88055419921875, 1.05908203125, 1.23760986328125, 1.4161376953125, 1.59466552734375, 1.773193359375, 1.95172119140625, 2.1302490234375, 2.30877685546875, 2.4873046875, 2.66583251953125, 2.8443603515625, 3.02288818359375, 3.201416015625, 3.37994384765625, 3.5584716796875, 3.73699951171875, 3.91552734375, 4.09405517578125, 4.2725830078125, 4.45111083984375, 4.629638671875, 4.80816650390625, 4.9866943359375, 5.16522216796875, 5.34375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 6.0, 12.0, 30.0, 28.0, 54.0, 65.0, 106.0, 161.0, 143.0, 117.0, 99.0, 50.0, 39.0, 22.0, 14.0, 13.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009398460388183594, -0.0009123533964157104, -0.0008848607540130615, -0.0008573681116104126, -0.0008298754692077637, -0.0008023828268051147, -0.0007748901844024658, -0.0007473975419998169, -0.000719904899597168, -0.000692412257194519, -0.0006649196147918701, -0.0006374269723892212, -0.0006099343299865723, -0.0005824416875839233, -0.0005549490451812744, -0.0005274564027786255, -0.0004999637603759766, -0.00047247111797332764, -0.0004449784755706787, -0.0004174858331680298, -0.00038999319076538086, -0.00036250054836273193, -0.000335007905960083, -0.0003075152635574341, -0.00028002262115478516, -0.00025252997875213623, -0.0002250373363494873, -0.00019754469394683838, -0.00017005205154418945, -0.00014255940914154053, -0.0001150667667388916, -8.757412433624268e-05, -6.008148193359375e-05, -3.2588839530944824e-05, -5.0961971282958984e-06, 2.2396445274353027e-05, 4.988908767700195e-05, 7.738173007965088e-05, 0.0001048743724822998, 0.00013236701488494873, 0.00015985965728759766, 0.00018735229969024658, 0.0002148449420928955, 0.00024233758449554443, 0.00026983022689819336, 0.0002973228693008423, 0.0003248155117034912, 0.00035230815410614014, 0.00037980079650878906, 0.000407293438911438, 0.0004347860813140869, 0.00046227872371673584, 0.0004897713661193848, 0.0005172640085220337, 0.0005447566509246826, 0.0005722492933273315, 0.0005997419357299805, 0.0006272345781326294, 0.0006547272205352783, 0.0006822198629379272, 0.0007097125053405762, 0.0007372051477432251, 0.000764697790145874, 0.000792190432548523, 0.0008196830749511719]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 4.0, 7.0, 6.0, 25.0, 29.0, 37.0, 66.0, 82.0, 100.0, 140.0, 222.0, 273.0, 401.0, 616.0, 983.0, 1522.0, 2272.0, 3907.0, 6654.0, 11812.0, 22231.0, 46213.0, 100850.0, 202665.0, 266380.0, 193726.0, 95119.0, 43422.0, 21113.0, 11160.0, 6282.0, 3726.0, 2131.0, 1448.0, 961.0, 650.0, 425.0, 288.0, 188.0, 116.0, 73.0, 73.0, 40.0, 29.0, 20.0, 19.0, 15.0, 5.0, 10.0, 6.0, 2.0, 5.0, 0.0, 4.0], "bins": [-6.10546875, -5.92828369140625, -5.7510986328125, -5.57391357421875, -5.396728515625, -5.21954345703125, -5.0423583984375, -4.86517333984375, -4.68798828125, -4.51080322265625, -4.3336181640625, -4.15643310546875, -3.979248046875, -3.80206298828125, -3.6248779296875, -3.44769287109375, -3.2705078125, -3.09332275390625, -2.9161376953125, -2.73895263671875, -2.561767578125, -2.38458251953125, -2.2073974609375, -2.03021240234375, -1.85302734375, -1.67584228515625, -1.4986572265625, -1.32147216796875, -1.144287109375, -0.96710205078125, -0.7899169921875, -0.61273193359375, -0.435546875, -0.25836181640625, -0.0811767578125, 0.09600830078125, 0.273193359375, 0.45037841796875, 0.6275634765625, 0.80474853515625, 0.98193359375, 1.15911865234375, 1.3363037109375, 1.51348876953125, 1.690673828125, 1.86785888671875, 2.0450439453125, 2.22222900390625, 2.3994140625, 2.57659912109375, 2.7537841796875, 2.93096923828125, 3.108154296875, 3.28533935546875, 3.4625244140625, 3.63970947265625, 3.81689453125, 3.99407958984375, 4.1712646484375, 4.34844970703125, 4.525634765625, 4.70281982421875, 4.8800048828125, 5.05718994140625, 5.234375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 1.0, 4.0, 8.0, 8.0, 16.0, 12.0, 21.0, 34.0, 26.0, 46.0, 47.0, 69.0, 53.0, 49.0, 79.0, 68.0, 67.0, 54.0, 58.0, 56.0, 35.0, 26.0, 36.0, 23.0, 22.0, 20.0, 9.0, 9.0, 8.0, 9.0, 7.0, 2.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4951171875, -1.4459381103515625, -1.396759033203125, -1.3475799560546875, -1.29840087890625, -1.2492218017578125, -1.200042724609375, -1.1508636474609375, -1.1016845703125, -1.0525054931640625, -1.003326416015625, -0.9541473388671875, -0.90496826171875, -0.8557891845703125, -0.806610107421875, -0.7574310302734375, -0.708251953125, -0.6590728759765625, -0.609893798828125, -0.5607147216796875, -0.51153564453125, -0.4623565673828125, -0.413177490234375, -0.3639984130859375, -0.3148193359375, -0.2656402587890625, -0.216461181640625, -0.1672821044921875, -0.11810302734375, -0.0689239501953125, -0.019744873046875, 0.0294342041015625, 0.07861328125, 0.1277923583984375, 0.176971435546875, 0.2261505126953125, 0.27532958984375, 0.3245086669921875, 0.373687744140625, 0.4228668212890625, 0.4720458984375, 0.5212249755859375, 0.570404052734375, 0.6195831298828125, 0.66876220703125, 0.7179412841796875, 0.767120361328125, 0.8162994384765625, 0.865478515625, 0.9146575927734375, 0.963836669921875, 1.0130157470703125, 1.06219482421875, 1.1113739013671875, 1.160552978515625, 1.2097320556640625, 1.2589111328125, 1.3080902099609375, 1.357269287109375, 1.4064483642578125, 1.45562744140625, 1.5048065185546875, 1.553985595703125, 1.6031646728515625, 1.65234375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 7.0, 7.0, 9.0, 8.0, 17.0, 19.0, 33.0, 36.0, 43.0, 52.0, 76.0, 72.0, 94.0, 89.0, 75.0, 81.0, 63.0, 49.0, 48.0, 33.0, 24.0, 14.0, 21.0, 10.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-19.804080963134766, -19.30260467529297, -18.801128387451172, -18.299650192260742, -17.798173904418945, -17.29669761657715, -16.79522132873535, -16.293743133544922, -15.792266845703125, -15.290790557861328, -14.789313316345215, -14.287837028503418, -13.786359786987305, -13.284883499145508, -12.783407211303711, -12.281929969787598, -11.7804536819458, -11.278977394104004, -10.77750015258789, -10.276023864746094, -9.77454662322998, -9.273070335388184, -8.77159309387207, -8.270116806030273, -7.768640041351318, -7.267163276672363, -6.765686511993408, -6.264209747314453, -5.762733459472656, -5.261256217956543, -4.759779930114746, -4.258303165435791, -3.7568254470825195, -3.2553486824035645, -2.7538719177246094, -2.2523953914642334, -1.7509186267852783, -1.2494418621063232, -0.7479653358459473, -0.2464885711669922, 0.2549881935119629, 0.7564648985862732, 1.2579416036605835, 1.759418249130249, 2.260895013809204, 2.762371778488159, 3.263848304748535, 3.7653250694274902, 4.266801834106445, 4.7682785987854, 5.2697553634643555, 5.771231651306152, 6.272708892822266, 6.7741851806640625, 7.275661945343018, 7.777138710021973, 8.278615951538086, 8.780092239379883, 9.281569480895996, 9.783045768737793, 10.284523010253906, 10.785999298095703, 11.2874755859375, 11.788952827453613, 12.29042911529541]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 2.0, 16.0, 13.0, 9.0, 17.0, 22.0, 19.0, 17.0, 20.0, 38.0, 30.0, 38.0, 45.0, 39.0, 45.0, 53.0, 69.0, 41.0, 55.0, 41.0, 44.0, 50.0, 32.0, 36.0, 32.0, 24.0, 31.0, 21.0, 13.0, 12.0, 19.0, 12.0, 11.0, 6.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.721688270568848, -12.337523460388184, -11.95335865020752, -11.569193840026855, -11.185029983520508, -10.800865173339844, -10.41670036315918, -10.032535552978516, -9.648370742797852, -9.264205932617188, -8.880041122436523, -8.49587631225586, -8.111711502075195, -7.7275471687316895, -7.343382835388184, -6.9592180252075195, -6.5750532150268555, -6.190888404846191, -5.806723594665527, -5.4225592613220215, -5.038394451141357, -4.654229640960693, -4.2700653076171875, -3.8859004974365234, -3.5017356872558594, -3.1175708770751953, -2.7334063053131104, -2.3492417335510254, -1.9650769233703613, -1.5809122323989868, -1.1967475414276123, -0.8125829696655273, -0.4284191131591797, -0.044254422187805176, 0.33991026878356934, 0.7240749597549438, 1.1082396507263184, 1.4924043416976929, 1.8765690326690674, 2.2607336044311523, 2.6448984146118164, 3.0290632247924805, 3.4132277965545654, 3.7973923683166504, 4.1815571784973145, 4.5657219886779785, 4.949886322021484, 5.334051132202148, 5.7182159423828125, 6.102380752563477, 6.486545562744141, 6.8707098960876465, 7.2548747062683105, 7.639039516448975, 8.02320384979248, 8.407368659973145, 8.791533470153809, 9.175698280334473, 9.559863090515137, 9.9440279006958, 10.328191757202148, 10.712356567382812, 11.096521377563477, 11.48068618774414, 11.864850997924805]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 6.0, 4.0, 6.0, 13.0, 7.0, 13.0, 15.0, 14.0, 18.0, 23.0, 20.0, 28.0, 24.0, 33.0, 49.0, 69.0, 121.0, 229.0, 489.0, 1536.0, 6624.0, 1030122.0, 8099.0, 1735.0, 553.0, 261.0, 122.0, 65.0, 58.0, 46.0, 28.0, 30.0, 24.0, 25.0, 16.0, 11.0, 13.0, 10.0, 3.0, 6.0, 9.0, 7.0, 3.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-261.6222839355469, -253.33265686035156, -245.04302978515625, -236.75341796875, -228.4637908935547, -220.17416381835938, -211.88453674316406, -203.59490966796875, -195.3052978515625, -187.0156707763672, -178.72604370117188, -170.43643188476562, -162.1468048095703, -153.857177734375, -145.5675506591797, -137.27792358398438, -128.98829650878906, -120.69866943359375, -112.40904998779297, -104.11942291259766, -95.82980346679688, -87.54017639160156, -79.25054931640625, -70.96092224121094, -62.671302795410156, -54.38167953491211, -46.09205627441406, -37.80242919921875, -29.512805938720703, -21.223182678222656, -12.933555603027344, -4.643932342529297, 3.64569091796875, 11.935315132141113, 20.224939346313477, 28.514564514160156, 36.8041877746582, 45.09381103515625, 53.38343811035156, 61.67306137084961, 69.96268463134766, 78.25231170654297, 86.54193115234375, 94.83155822753906, 103.12118530273438, 111.41080474853516, 119.70043182373047, 127.99005126953125, 136.27967834472656, 144.56930541992188, 152.8589324951172, 161.1485595703125, 169.43817138671875, 177.72779846191406, 186.01742553710938, 194.3070526123047, 202.5966796875, 210.8863067626953, 219.17593383789062, 227.46554565429688, 235.7551727294922, 244.0447998046875, 252.3344268798828, 260.6240539550781, 268.9136657714844]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 9.0, 6.0, 16.0, 18.0, 11.0, 19.0, 16.0, 31.0, 33.0, 32.0, 47.0, 81.0, 142.0, 289.0, 792.0, 2469.0, 7362.0, 34942.0, 51402992.0, 14997.0, 4377.0, 1453.0, 520.0, 204.0, 131.0, 75.0, 45.0, 34.0, 33.0, 22.0, 17.0, 15.0, 14.0, 9.0, 14.0, 8.0, 5.0, 7.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-245.282958984375, -237.18096923828125, -229.07899475097656, -220.9770050048828, -212.87503051757812, -204.77304077148438, -196.67105102539062, -188.56906127929688, -180.4670867919922, -172.36509704589844, -164.26312255859375, -156.1611328125, -148.05914306640625, -139.95716857910156, -131.8551788330078, -123.7531967163086, -115.65121459960938, -107.54923248291016, -99.44725036621094, -91.34526062011719, -83.24327850341797, -75.14129638671875, -67.039306640625, -58.93732452392578, -50.83534240722656, -42.733360290527344, -34.63137435913086, -26.529390335083008, -18.427406311035156, -10.325424194335938, -2.223438262939453, 5.878547668457031, 13.980499267578125, 22.082483291625977, 30.184467315673828, 38.28645324707031, 46.38843536376953, 54.49041748046875, 62.592403411865234, 70.69438934326172, 78.79637145996094, 86.89835357666016, 95.00033569335938, 103.10232543945312, 111.20430755615234, 119.30628967285156, 127.40827941894531, 135.51025390625, 143.61224365234375, 151.7142333984375, 159.8162078857422, 167.91819763183594, 176.02017211914062, 184.12216186523438, 192.22415161132812, 200.32614135742188, 208.42811584472656, 216.5301055908203, 224.632080078125, 232.73406982421875, 240.8360595703125, 248.9380340576172, 257.0400085449219, 265.1419982910156, 273.2439880371094]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 4.0, 5.0, 11.0, 14.0, 8.0, 19.0, 22.0, 22.0, 32.0, 37.0, 50.0, 52.0, 55.0, 80.0, 66.0, 75.0, 85.0, 68.0, 55.0, 44.0, 43.0, 30.0, 24.0, 16.0, 21.0, 8.0, 9.0, 11.0, 5.0, 1.0, 7.0, 6.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.18997192382812, -122.84699249267578, -118.50402069091797, -114.16104125976562, -109.81806945800781, -105.47509002685547, -101.13211059570312, -96.78913879394531, -92.44615936279297, -88.10317993164062, -83.76020812988281, -79.41722869873047, -75.07424926757812, -70.73127746582031, -66.38829803466797, -62.04532241821289, -57.70234680175781, -53.359371185302734, -49.016395568847656, -44.67341613769531, -40.330440521240234, -35.987464904785156, -31.644487380981445, -27.301509857177734, -22.958534240722656, -18.615558624267578, -14.272581100463867, -9.929604530334473, -5.586627960205078, -1.24365234375, 3.099325180053711, 7.442302703857422, 11.7852783203125, 16.128253936767578, 20.47123146057129, 24.814208984375, 29.157184600830078, 33.500160217285156, 37.8431396484375, 42.18611526489258, 46.529090881347656, 50.872066497802734, 55.21504211425781, 59.558021545410156, 63.900997161865234, 68.24397277832031, 72.58695220947266, 76.929931640625, 81.27290344238281, 85.61588287353516, 89.95885467529297, 94.30183410644531, 98.64480590820312, 102.98778533935547, 107.33076477050781, 111.67373657226562, 116.01671600341797, 120.35969543457031, 124.70266723632812, 129.04563903808594, 133.3886260986328, 137.73159790039062, 142.07456970214844, 146.4175567626953, 150.76052856445312]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 10.0, 9.0, 7.0, 12.0, 21.0, 16.0, 21.0, 23.0, 30.0, 51.0, 29.0, 34.0, 63.0, 70.0, 58.0, 74.0, 69.0, 52.0, 71.0, 56.0, 38.0, 35.0, 26.0, 23.0, 19.0, 11.0, 14.0, 6.0, 9.0, 11.0, 5.0, 8.0, 6.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-176.75790405273438, -171.16433715820312, -165.57078552246094, -159.9772186279297, -154.3836669921875, -148.79010009765625, -143.196533203125, -137.6029815673828, -132.00942993164062, -126.4158706665039, -120.82231140136719, -115.22874450683594, -109.63519287109375, -104.0416259765625, -98.44806671142578, -92.85450744628906, -87.26094055175781, -81.6673812866211, -76.07382202148438, -70.48025512695312, -64.88670349121094, -59.29314041137695, -53.69957733154297, -48.10601806640625, -42.51245880126953, -36.91889953613281, -31.32533836364746, -25.73177719116211, -20.13821792602539, -14.544658660888672, -8.951095581054688, -3.3575363159179688, 2.23602294921875, 7.829583168029785, 13.42314338684082, 19.016704559326172, 24.61026382446289, 30.20382308959961, 35.797386169433594, 41.39094543457031, 46.98450469970703, 52.57806396484375, 58.17162322998047, 63.76518630981445, 69.35874938964844, 74.95230102539062, 80.54586791992188, 86.1394271850586, 91.73298645019531, 97.32654571533203, 102.92010498046875, 108.513671875, 114.10722351074219, 119.70079040527344, 125.29434967041016, 130.88790893554688, 136.48147583007812, 142.07504272460938, 147.66859436035156, 153.2621612548828, 158.855712890625, 164.44927978515625, 170.0428466796875, 175.6363983154297, 181.22994995117188]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 5.0, 10.0, 6.0, 19.0, 31.0, 42.0, 70.0, 119.0, 134.0, 211.0, 338.0, 576.0, 838.0, 1276.0, 2239.0, 3675.0, 6974.0, 13097.0, 27184.0, 63401.0, 164670.0, 506143.0, 2042482.0, 917165.0, 271571.0, 96508.0, 38741.0, 17545.0, 8523.0, 4470.0, 2461.0, 1405.0, 866.0, 492.0, 350.0, 190.0, 156.0, 84.0, 60.0, 38.0, 27.0, 17.0, 28.0, 10.0, 8.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.615234375, -2.535308837890625, -2.45538330078125, -2.375457763671875, -2.2955322265625, -2.215606689453125, -2.13568115234375, -2.055755615234375, -1.975830078125, -1.895904541015625, -1.81597900390625, -1.736053466796875, -1.6561279296875, -1.576202392578125, -1.49627685546875, -1.416351318359375, -1.33642578125, -1.256500244140625, -1.17657470703125, -1.096649169921875, -1.0167236328125, -0.936798095703125, -0.85687255859375, -0.776947021484375, -0.697021484375, -0.617095947265625, -0.53717041015625, -0.457244873046875, -0.3773193359375, -0.297393798828125, -0.21746826171875, -0.137542724609375, -0.0576171875, 0.022308349609375, 0.10223388671875, 0.182159423828125, 0.2620849609375, 0.342010498046875, 0.42193603515625, 0.501861572265625, 0.581787109375, 0.661712646484375, 0.74163818359375, 0.821563720703125, 0.9014892578125, 0.981414794921875, 1.06134033203125, 1.141265869140625, 1.22119140625, 1.301116943359375, 1.38104248046875, 1.460968017578125, 1.5408935546875, 1.620819091796875, 1.70074462890625, 1.780670166015625, 1.860595703125, 1.940521240234375, 2.02044677734375, 2.100372314453125, 2.1802978515625, 2.260223388671875, 2.34014892578125, 2.420074462890625, 2.5]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 3.0, 7.0, 5.0, 13.0, 11.0, 16.0, 18.0, 32.0, 25.0, 35.0, 37.0, 62.0, 74.0, 66.0, 75.0, 72.0, 69.0, 78.0, 67.0, 62.0, 42.0, 35.0, 20.0, 22.0, 17.0, 10.0, 2.0, 3.0, 4.0, 7.0, 2.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.364013671875, -0.3539466857910156, -0.34387969970703125, -0.3338127136230469, -0.3237457275390625, -0.3136787414550781, -0.30361175537109375, -0.2935447692871094, -0.283477783203125, -0.2734107971191406, -0.26334381103515625, -0.2532768249511719, -0.2432098388671875, -0.23314285278320312, -0.22307586669921875, -0.21300888061523438, -0.20294189453125, -0.19287490844726562, -0.18280792236328125, -0.17274093627929688, -0.1626739501953125, -0.15260696411132812, -0.14253997802734375, -0.13247299194335938, -0.122406005859375, -0.11233901977539062, -0.10227203369140625, -0.09220504760742188, -0.0821380615234375, -0.07207107543945312, -0.06200408935546875, -0.051937103271484375, -0.0418701171875, -0.031803131103515625, -0.02173614501953125, -0.011669158935546875, -0.0016021728515625, 0.008464813232421875, 0.01853179931640625, 0.028598785400390625, 0.038665771484375, 0.048732757568359375, 0.05879974365234375, 0.06886672973632812, 0.0789337158203125, 0.08900070190429688, 0.09906768798828125, 0.10913467407226562, 0.11920166015625, 0.12926864624023438, 0.13933563232421875, 0.14940261840820312, 0.1594696044921875, 0.16953659057617188, 0.17960357666015625, 0.18967056274414062, 0.199737548828125, 0.20980453491210938, 0.21987152099609375, 0.22993850708007812, 0.2400054931640625, 0.2500724792480469, 0.26013946533203125, 0.2702064514160156, 0.2802734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 9.0, 13.0, 15.0, 30.0, 39.0, 53.0, 72.0, 88.0, 152.0, 265.0, 393.0, 643.0, 1116.0, 1752.0, 3184.0, 5689.0, 11174.0, 22274.0, 49198.0, 117292.0, 311562.0, 933782.0, 1769258.0, 605430.0, 209016.0, 80929.0, 35088.0, 16496.0, 8468.0, 4471.0, 2542.0, 1447.0, 834.0, 527.0, 334.0, 206.0, 129.0, 98.0, 68.0, 41.0, 32.0, 20.0, 18.0, 8.0, 8.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.796875, -1.74127197265625, -1.6856689453125, -1.63006591796875, -1.574462890625, -1.51885986328125, -1.4632568359375, -1.40765380859375, -1.35205078125, -1.29644775390625, -1.2408447265625, -1.18524169921875, -1.129638671875, -1.07403564453125, -1.0184326171875, -0.96282958984375, -0.9072265625, -0.85162353515625, -0.7960205078125, -0.74041748046875, -0.684814453125, -0.62921142578125, -0.5736083984375, -0.51800537109375, -0.46240234375, -0.40679931640625, -0.3511962890625, -0.29559326171875, -0.239990234375, -0.18438720703125, -0.1287841796875, -0.07318115234375, -0.017578125, 0.03802490234375, 0.0936279296875, 0.14923095703125, 0.204833984375, 0.26043701171875, 0.3160400390625, 0.37164306640625, 0.42724609375, 0.48284912109375, 0.5384521484375, 0.59405517578125, 0.649658203125, 0.70526123046875, 0.7608642578125, 0.81646728515625, 0.8720703125, 0.92767333984375, 0.9832763671875, 1.03887939453125, 1.094482421875, 1.15008544921875, 1.2056884765625, 1.26129150390625, 1.31689453125, 1.37249755859375, 1.4281005859375, 1.48370361328125, 1.539306640625, 1.59490966796875, 1.6505126953125, 1.70611572265625, 1.76171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 6.0, 7.0, 6.0, 8.0, 8.0, 16.0, 22.0, 26.0, 37.0, 36.0, 41.0, 67.0, 66.0, 83.0, 88.0, 119.0, 142.0, 183.0, 204.0, 234.0, 304.0, 430.0, 387.0, 292.0, 254.0, 207.0, 157.0, 155.0, 93.0, 84.0, 66.0, 44.0, 35.0, 41.0, 25.0, 22.0, 17.0, 15.0, 12.0, 7.0, 12.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5947265625, -0.576141357421875, -0.55755615234375, -0.538970947265625, -0.5203857421875, -0.501800537109375, -0.48321533203125, -0.464630126953125, -0.446044921875, -0.427459716796875, -0.40887451171875, -0.390289306640625, -0.3717041015625, -0.353118896484375, -0.33453369140625, -0.315948486328125, -0.29736328125, -0.278778076171875, -0.26019287109375, -0.241607666015625, -0.2230224609375, -0.204437255859375, -0.18585205078125, -0.167266845703125, -0.148681640625, -0.130096435546875, -0.11151123046875, -0.092926025390625, -0.0743408203125, -0.055755615234375, -0.03717041015625, -0.018585205078125, 0.0, 0.018585205078125, 0.03717041015625, 0.055755615234375, 0.0743408203125, 0.092926025390625, 0.11151123046875, 0.130096435546875, 0.148681640625, 0.167266845703125, 0.18585205078125, 0.204437255859375, 0.2230224609375, 0.241607666015625, 0.26019287109375, 0.278778076171875, 0.29736328125, 0.315948486328125, 0.33453369140625, 0.353118896484375, 0.3717041015625, 0.390289306640625, 0.40887451171875, 0.427459716796875, 0.446044921875, 0.464630126953125, 0.48321533203125, 0.501800537109375, 0.5203857421875, 0.538970947265625, 0.55755615234375, 0.576141357421875, 0.5947265625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 5.0, 8.0, 11.0, 21.0, 32.0, 24.0, 64.0, 73.0, 89.0, 119.0, 118.0, 119.0, 82.0, 77.0, 42.0, 33.0, 19.0, 25.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.949253559112549, -7.715593338012695, -7.48193359375, -7.2482733726501465, -7.014613628387451, -6.780953407287598, -6.547293663024902, -6.313633441925049, -6.079973220825195, -5.846312999725342, -5.6126532554626465, -5.378993034362793, -5.145333290100098, -4.911673069000244, -4.678012847900391, -4.444353103637695, -4.210693359375, -3.9770333766937256, -3.743373394012451, -3.5097131729125977, -3.2760534286499023, -3.042393207550049, -2.8087332248687744, -2.5750732421875, -2.3414132595062256, -2.107753276824951, -1.8740932941436768, -1.6404331922531128, -1.4067732095718384, -1.173113226890564, -0.939453125, -0.7057931423187256, -0.4721336364746094, -0.23847362399101257, -0.0048136115074157715, 0.22884643077850342, 0.46250641345977783, 0.6961663961410522, 0.9298264980316162, 1.1634864807128906, 1.397146463394165, 1.6308064460754395, 1.8644664287567139, 2.0981264114379883, 2.331786632537842, 2.565446376800537, 2.7991065979003906, 3.032766580581665, 3.2664265632629395, 3.500086545944214, 3.7337465286254883, 3.967406749725342, 4.201066493988037, 4.434726715087891, 4.668386459350586, 4.9020466804504395, 5.135706901550293, 5.3693671226501465, 5.603026866912842, 5.836687088012695, 6.070346832275391, 6.304007053375244, 6.537667274475098, 6.771327018737793, 7.004986763000488]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 7.0, 3.0, 5.0, 11.0, 7.0, 10.0, 20.0, 18.0, 21.0, 25.0, 22.0, 25.0, 23.0, 39.0, 41.0, 37.0, 36.0, 45.0, 42.0, 49.0, 41.0, 39.0, 39.0, 42.0, 40.0, 32.0, 35.0, 40.0, 34.0, 18.0, 30.0, 25.0, 24.0, 6.0, 11.0, 14.0, 13.0, 5.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7472054958343506, -3.6028153896331787, -3.458425283432007, -3.314034938812256, -3.169644832611084, -3.025254726409912, -2.8808646202087402, -2.7364745140075684, -2.5920844078063965, -2.4476943016052246, -2.3033041954040527, -2.158914089202881, -2.01452374458313, -1.870133638381958, -1.7257435321807861, -1.5813533067703247, -1.4369630813598633, -1.2925729751586914, -1.14818274974823, -1.003792643547058, -0.8594024777412415, -0.7150123119354248, -0.5706222057342529, -0.4262319803237915, -0.28184187412261963, -0.13745172321796417, 0.006938427686691284, 0.15132856369018555, 0.2957187294960022, 0.44010889530181885, 0.5844990015029907, 0.7288892269134521, 0.8732790946960449, 1.0176692008972168, 1.1620594263076782, 1.30644953250885, 1.4508397579193115, 1.5952298641204834, 1.7396199703216553, 1.8840101957321167, 2.028400421142578, 2.17279052734375, 2.317180633544922, 2.4615707397460938, 2.6059610843658447, 2.7503511905670166, 2.8947412967681885, 3.0391316413879395, 3.1835215091705322, 3.327911615371704, 3.472301721572876, 3.616692066192627, 3.761082172393799, 3.9054722785949707, 4.049862384796143, 4.1942524909973145, 4.338642597198486, 4.483032703399658, 4.62742280960083, 4.771812915802002, 4.916203022003174, 5.060593605041504, 5.204983711242676, 5.349373817443848, 5.4937639236450195]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 2.0, 10.0, 3.0, 11.0, 17.0, 20.0, 30.0, 36.0, 49.0, 71.0, 86.0, 148.0, 227.0, 343.0, 456.0, 832.0, 1378.0, 2131.0, 3878.0, 7179.0, 14118.0, 29273.0, 66237.0, 158265.0, 310146.0, 250435.0, 110411.0, 47238.0, 21655.0, 10507.0, 5609.0, 3018.0, 1722.0, 1019.0, 696.0, 434.0, 266.0, 186.0, 121.0, 83.0, 62.0, 46.0, 30.0, 29.0, 14.0, 10.0, 10.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1181640625, -1.0793304443359375, -1.040496826171875, -1.0016632080078125, -0.96282958984375, -0.9239959716796875, -0.885162353515625, -0.8463287353515625, -0.8074951171875, -0.7686614990234375, -0.729827880859375, -0.6909942626953125, -0.65216064453125, -0.6133270263671875, -0.574493408203125, -0.5356597900390625, -0.496826171875, -0.4579925537109375, -0.419158935546875, -0.3803253173828125, -0.34149169921875, -0.3026580810546875, -0.263824462890625, -0.2249908447265625, -0.1861572265625, -0.1473236083984375, -0.108489990234375, -0.0696563720703125, -0.03082275390625, 0.0080108642578125, 0.046844482421875, 0.0856781005859375, 0.12451171875, 0.1633453369140625, 0.202178955078125, 0.2410125732421875, 0.27984619140625, 0.3186798095703125, 0.357513427734375, 0.3963470458984375, 0.4351806640625, 0.4740142822265625, 0.512847900390625, 0.5516815185546875, 0.59051513671875, 0.6293487548828125, 0.668182373046875, 0.7070159912109375, 0.745849609375, 0.7846832275390625, 0.823516845703125, 0.8623504638671875, 0.90118408203125, 0.9400177001953125, 0.978851318359375, 1.0176849365234375, 1.0565185546875, 1.0953521728515625, 1.134185791015625, 1.1730194091796875, 1.21185302734375, 1.2506866455078125, 1.289520263671875, 1.3283538818359375, 1.3671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 10.0, 11.0, 13.0, 15.0, 15.0, 18.0, 17.0, 28.0, 27.0, 37.0, 44.0, 54.0, 59.0, 46.0, 58.0, 65.0, 52.0, 69.0, 59.0, 65.0, 44.0, 36.0, 32.0, 32.0, 15.0, 14.0, 8.0, 8.0, 4.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.308349609375, -0.2990570068359375, -0.289764404296875, -0.2804718017578125, -0.27117919921875, -0.2618865966796875, -0.252593994140625, -0.2433013916015625, -0.2340087890625, -0.2247161865234375, -0.215423583984375, -0.2061309814453125, -0.19683837890625, -0.1875457763671875, -0.178253173828125, -0.1689605712890625, -0.15966796875, -0.1503753662109375, -0.141082763671875, -0.1317901611328125, -0.12249755859375, -0.1132049560546875, -0.103912353515625, -0.0946197509765625, -0.0853271484375, -0.0760345458984375, -0.066741943359375, -0.0574493408203125, -0.04815673828125, -0.0388641357421875, -0.029571533203125, -0.0202789306640625, -0.010986328125, -0.0016937255859375, 0.007598876953125, 0.0168914794921875, 0.02618408203125, 0.0354766845703125, 0.044769287109375, 0.0540618896484375, 0.0633544921875, 0.0726470947265625, 0.081939697265625, 0.0912322998046875, 0.10052490234375, 0.1098175048828125, 0.119110107421875, 0.1284027099609375, 0.1376953125, 0.1469879150390625, 0.156280517578125, 0.1655731201171875, 0.17486572265625, 0.1841583251953125, 0.193450927734375, 0.2027435302734375, 0.2120361328125, 0.2213287353515625, 0.230621337890625, 0.2399139404296875, 0.24920654296875, 0.2584991455078125, 0.267791748046875, 0.2770843505859375, 0.286376953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 6.0, 18.0, 42.0, 48.0, 48.0, 96.0, 172.0, 324.0, 632.0, 1308.0, 2899.0, 6806.0, 19376.0, 68708.0, 334955.0, 474077.0, 98070.0, 25700.0, 8555.0, 3401.0, 1552.0, 809.0, 398.0, 239.0, 123.0, 73.0, 26.0, 28.0, 8.0, 14.0, 17.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.939453125, -1.87506103515625, -1.8106689453125, -1.74627685546875, -1.681884765625, -1.61749267578125, -1.5531005859375, -1.48870849609375, -1.42431640625, -1.35992431640625, -1.2955322265625, -1.23114013671875, -1.166748046875, -1.10235595703125, -1.0379638671875, -0.97357177734375, -0.9091796875, -0.84478759765625, -0.7803955078125, -0.71600341796875, -0.651611328125, -0.58721923828125, -0.5228271484375, -0.45843505859375, -0.39404296875, -0.32965087890625, -0.2652587890625, -0.20086669921875, -0.136474609375, -0.07208251953125, -0.0076904296875, 0.05670166015625, 0.12109375, 0.18548583984375, 0.2498779296875, 0.31427001953125, 0.378662109375, 0.44305419921875, 0.5074462890625, 0.57183837890625, 0.63623046875, 0.70062255859375, 0.7650146484375, 0.82940673828125, 0.893798828125, 0.95819091796875, 1.0225830078125, 1.08697509765625, 1.1513671875, 1.21575927734375, 1.2801513671875, 1.34454345703125, 1.408935546875, 1.47332763671875, 1.5377197265625, 1.60211181640625, 1.66650390625, 1.73089599609375, 1.7952880859375, 1.85968017578125, 1.924072265625, 1.98846435546875, 2.0528564453125, 2.11724853515625, 2.181640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 2.0, 8.0, 3.0, 7.0, 5.0, 15.0, 8.0, 19.0, 21.0, 13.0, 18.0, 22.0, 25.0, 27.0, 34.0, 39.0, 40.0, 28.0, 37.0, 41.0, 46.0, 34.0, 47.0, 52.0, 52.0, 35.0, 34.0, 30.0, 31.0, 33.0, 30.0, 27.0, 26.0, 14.0, 16.0, 13.0, 15.0, 17.0, 6.0, 10.0, 5.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3544921875, -1.309814453125, -1.26513671875, -1.220458984375, -1.17578125, -1.131103515625, -1.08642578125, -1.041748046875, -0.9970703125, -0.952392578125, -0.90771484375, -0.863037109375, -0.818359375, -0.773681640625, -0.72900390625, -0.684326171875, -0.6396484375, -0.594970703125, -0.55029296875, -0.505615234375, -0.4609375, -0.416259765625, -0.37158203125, -0.326904296875, -0.2822265625, -0.237548828125, -0.19287109375, -0.148193359375, -0.103515625, -0.058837890625, -0.01416015625, 0.030517578125, 0.0751953125, 0.119873046875, 0.16455078125, 0.209228515625, 0.25390625, 0.298583984375, 0.34326171875, 0.387939453125, 0.4326171875, 0.477294921875, 0.52197265625, 0.566650390625, 0.611328125, 0.656005859375, 0.70068359375, 0.745361328125, 0.7900390625, 0.834716796875, 0.87939453125, 0.924072265625, 0.96875, 1.013427734375, 1.05810546875, 1.102783203125, 1.1474609375, 1.192138671875, 1.23681640625, 1.281494140625, 1.326171875, 1.370849609375, 1.41552734375, 1.460205078125, 1.5048828125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 15.0, 10.0, 14.0, 21.0, 27.0, 45.0, 62.0, 98.0, 150.0, 309.0, 527.0, 1010.0, 2322.0, 6544.0, 26325.0, 302033.0, 653585.0, 40749.0, 8888.0, 3026.0, 1297.0, 629.0, 322.0, 173.0, 130.0, 82.0, 51.0, 25.0, 16.0, 23.0, 10.0, 9.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.72528076171875, -5.5286865234375, -5.33209228515625, -5.135498046875, -4.93890380859375, -4.7423095703125, -4.54571533203125, -4.34912109375, -4.15252685546875, -3.9559326171875, -3.75933837890625, -3.562744140625, -3.36614990234375, -3.1695556640625, -2.97296142578125, -2.7763671875, -2.57977294921875, -2.3831787109375, -2.18658447265625, -1.989990234375, -1.79339599609375, -1.5968017578125, -1.40020751953125, -1.20361328125, -1.00701904296875, -0.8104248046875, -0.61383056640625, -0.417236328125, -0.22064208984375, -0.0240478515625, 0.17254638671875, 0.369140625, 0.56573486328125, 0.7623291015625, 0.95892333984375, 1.155517578125, 1.35211181640625, 1.5487060546875, 1.74530029296875, 1.94189453125, 2.13848876953125, 2.3350830078125, 2.53167724609375, 2.728271484375, 2.92486572265625, 3.1214599609375, 3.31805419921875, 3.5146484375, 3.71124267578125, 3.9078369140625, 4.10443115234375, 4.301025390625, 4.49761962890625, 4.6942138671875, 4.89080810546875, 5.08740234375, 5.28399658203125, 5.4805908203125, 5.67718505859375, 5.873779296875, 6.07037353515625, 6.2669677734375, 6.46356201171875, 6.66015625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 5.0, 2.0, 7.0, 14.0, 19.0, 26.0, 32.0, 50.0, 74.0, 89.0, 119.0, 114.0, 115.0, 97.0, 73.0, 35.0, 34.0, 20.0, 14.0, 13.0, 7.0, 9.0, 3.0, 4.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002779960632324219, -0.00026969611644744873, -0.0002613961696624756, -0.00025309622287750244, -0.0002447962760925293, -0.00023649632930755615, -0.000228196382522583, -0.00021989643573760986, -0.00021159648895263672, -0.00020329654216766357, -0.00019499659538269043, -0.00018669664859771729, -0.00017839670181274414, -0.000170096755027771, -0.00016179680824279785, -0.0001534968614578247, -0.00014519691467285156, -0.00013689696788787842, -0.00012859702110290527, -0.00012029707431793213, -0.00011199712753295898, -0.00010369718074798584, -9.53972339630127e-05, -8.709728717803955e-05, -7.87973403930664e-05, -7.049739360809326e-05, -6.219744682312012e-05, -5.389750003814697e-05, -4.559755325317383e-05, -3.7297606468200684e-05, -2.899765968322754e-05, -2.0697712898254395e-05, -1.239776611328125e-05, -4.0978193283081055e-06, 4.202127456665039e-06, 1.2502074241638184e-05, 2.0802021026611328e-05, 2.9101967811584473e-05, 3.740191459655762e-05, 4.570186138153076e-05, 5.4001808166503906e-05, 6.230175495147705e-05, 7.06017017364502e-05, 7.890164852142334e-05, 8.720159530639648e-05, 9.550154209136963e-05, 0.00010380148887634277, 0.00011210143566131592, 0.00012040138244628906, 0.0001287013292312622, 0.00013700127601623535, 0.0001453012228012085, 0.00015360116958618164, 0.00016190111637115479, 0.00017020106315612793, 0.00017850100994110107, 0.00018680095672607422, 0.00019510090351104736, 0.0002034008502960205, 0.00021170079708099365, 0.0002200007438659668, 0.00022830069065093994, 0.00023660063743591309, 0.00024490058422088623, 0.0002532005310058594]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 8.0, 6.0, 13.0, 25.0, 39.0, 43.0, 61.0, 91.0, 162.0, 218.0, 324.0, 581.0, 1020.0, 1775.0, 3596.0, 7283.0, 18157.0, 59354.0, 483668.0, 389395.0, 52491.0, 16116.0, 6662.0, 3264.0, 1750.0, 917.0, 555.0, 330.0, 206.0, 150.0, 94.0, 43.0, 45.0, 27.0, 27.0, 22.0, 16.0, 6.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.703125, -4.568572998046875, -4.43402099609375, -4.299468994140625, -4.1649169921875, -4.030364990234375, -3.89581298828125, -3.761260986328125, -3.626708984375, -3.492156982421875, -3.35760498046875, -3.223052978515625, -3.0885009765625, -2.953948974609375, -2.81939697265625, -2.684844970703125, -2.55029296875, -2.415740966796875, -2.28118896484375, -2.146636962890625, -2.0120849609375, -1.877532958984375, -1.74298095703125, -1.608428955078125, -1.473876953125, -1.339324951171875, -1.20477294921875, -1.070220947265625, -0.9356689453125, -0.801116943359375, -0.66656494140625, -0.532012939453125, -0.3974609375, -0.262908935546875, -0.12835693359375, 0.006195068359375, 0.1407470703125, 0.275299072265625, 0.40985107421875, 0.544403076171875, 0.678955078125, 0.813507080078125, 0.94805908203125, 1.082611083984375, 1.2171630859375, 1.351715087890625, 1.48626708984375, 1.620819091796875, 1.75537109375, 1.889923095703125, 2.02447509765625, 2.159027099609375, 2.2935791015625, 2.428131103515625, 2.56268310546875, 2.697235107421875, 2.831787109375, 2.966339111328125, 3.10089111328125, 3.235443115234375, 3.3699951171875, 3.504547119140625, 3.63909912109375, 3.773651123046875, 3.908203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 8.0, 10.0, 10.0, 15.0, 19.0, 25.0, 46.0, 65.0, 115.0, 130.0, 151.0, 130.0, 83.0, 52.0, 22.0, 27.0, 28.0, 16.0, 16.0, 9.0, 0.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.974609375, -2.878936767578125, -2.78326416015625, -2.687591552734375, -2.5919189453125, -2.496246337890625, -2.40057373046875, -2.304901123046875, -2.209228515625, -2.113555908203125, -2.01788330078125, -1.922210693359375, -1.8265380859375, -1.730865478515625, -1.63519287109375, -1.539520263671875, -1.44384765625, -1.348175048828125, -1.25250244140625, -1.156829833984375, -1.0611572265625, -0.965484619140625, -0.86981201171875, -0.774139404296875, -0.678466796875, -0.582794189453125, -0.48712158203125, -0.391448974609375, -0.2957763671875, -0.200103759765625, -0.10443115234375, -0.008758544921875, 0.0869140625, 0.182586669921875, 0.27825927734375, 0.373931884765625, 0.4696044921875, 0.565277099609375, 0.66094970703125, 0.756622314453125, 0.852294921875, 0.947967529296875, 1.04364013671875, 1.139312744140625, 1.2349853515625, 1.330657958984375, 1.42633056640625, 1.522003173828125, 1.61767578125, 1.713348388671875, 1.80902099609375, 1.904693603515625, 2.0003662109375, 2.096038818359375, 2.19171142578125, 2.287384033203125, 2.383056640625, 2.478729248046875, 2.57440185546875, 2.670074462890625, 2.7657470703125, 2.861419677734375, 2.95709228515625, 3.052764892578125, 3.1484375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 5.0, 8.0, 8.0, 28.0, 48.0, 73.0, 116.0, 129.0, 151.0, 121.0, 94.0, 75.0, 44.0, 23.0, 21.0, 15.0, 9.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.571746826171875, -15.911078453063965, -15.250410079956055, -14.589741706848145, -13.929073333740234, -13.268404006958008, -12.607735633850098, -11.947067260742188, -11.286398887634277, -10.625730514526367, -9.965062141418457, -9.304393768310547, -8.64372444152832, -7.983056545257568, -7.3223876953125, -6.66171932220459, -6.00105094909668, -5.3403825759887695, -4.679714202880859, -4.019045352935791, -3.358376979827881, -2.6977086067199707, -2.0370399951934814, -1.3763713836669922, -0.715703010559082, -0.055034518241882324, 0.6056339740753174, 1.266302466392517, 1.9269709587097168, 2.587639331817627, 3.248307943344116, 3.9089765548706055, 4.569644927978516, 5.230313301086426, 5.890981674194336, 6.551650524139404, 7.2123188972473145, 7.872987270355225, 8.533656120300293, 9.194324493408203, 9.854992866516113, 10.515661239624023, 11.176329612731934, 11.836997985839844, 12.49766731262207, 13.158334732055664, 13.81900405883789, 14.4796724319458, 15.140340805053711, 15.801009178161621, 16.46167755126953, 17.122346878051758, 17.78301429748535, 18.443683624267578, 19.104351043701172, 19.7650203704834, 20.425689697265625, 21.08635902404785, 21.747026443481445, 22.407695770263672, 23.068363189697266, 23.729032516479492, 24.389699935913086, 25.050369262695312, 25.711036682128906]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 5.0, 5.0, 6.0, 9.0, 12.0, 10.0, 24.0, 31.0, 35.0, 67.0, 125.0, 120.0, 143.0, 113.0, 98.0, 54.0, 47.0, 23.0, 12.0, 9.0, 9.0, 8.0, 9.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.483970642089844, -33.58161544799805, -32.67926025390625, -31.776906967163086, -30.874553680419922, -29.972198486328125, -29.069843292236328, -28.16748809814453, -27.265134811401367, -26.36277961730957, -25.460426330566406, -24.55807113647461, -23.655715942382812, -22.75336265563965, -21.85100746154785, -20.948654174804688, -20.04629898071289, -19.143943786621094, -18.24159049987793, -17.339235305786133, -16.43688201904297, -15.534526824951172, -14.632171630859375, -13.729817390441895, -12.827463150024414, -11.925108909606934, -11.022754669189453, -10.120399475097656, -9.218045234680176, -8.315690994262695, -7.413336277008057, -6.510981559753418, -5.60862922668457, -4.70627498626709, -3.803920269012451, -2.9015657901763916, -1.999211311340332, -1.0968570709228516, -0.1945023536682129, 0.7078523635864258, 1.6102066040039062, 2.512561082839966, 3.4149155616760254, 4.317270278930664, 5.2196245193481445, 6.121978759765625, 7.024333477020264, 7.926688194274902, 8.829042434692383, 9.731396675109863, 10.633750915527344, 11.53610610961914, 12.438460350036621, 13.340814590454102, 14.243169784545898, 15.145524024963379, 16.04787826538086, 16.950233459472656, 17.85258674621582, 18.754941940307617, 19.65729522705078, 20.559650421142578, 21.462005615234375, 22.364360809326172, 23.266714096069336]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 11.0, 13.0, 8.0, 22.0, 24.0, 37.0, 52.0, 79.0, 140.0, 205.0, 414.0, 798.0, 1553.0, 3473.0, 8228.0, 22081.0, 75297.0, 455787.0, 3361426.0, 197946.0, 43597.0, 13729.0, 5037.0, 2140.0, 985.0, 515.0, 285.0, 146.0, 94.0, 43.0, 27.0, 22.0, 19.0, 11.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.50958251953125, -5.3277587890625, -5.14593505859375, -4.964111328125, -4.78228759765625, -4.6004638671875, -4.41864013671875, -4.23681640625, -4.05499267578125, -3.8731689453125, -3.69134521484375, -3.509521484375, -3.32769775390625, -3.1458740234375, -2.96405029296875, -2.7822265625, -2.60040283203125, -2.4185791015625, -2.23675537109375, -2.054931640625, -1.87310791015625, -1.6912841796875, -1.50946044921875, -1.32763671875, -1.14581298828125, -0.9639892578125, -0.78216552734375, -0.600341796875, -0.41851806640625, -0.2366943359375, -0.05487060546875, 0.126953125, 0.30877685546875, 0.4906005859375, 0.67242431640625, 0.854248046875, 1.03607177734375, 1.2178955078125, 1.39971923828125, 1.58154296875, 1.76336669921875, 1.9451904296875, 2.12701416015625, 2.308837890625, 2.49066162109375, 2.6724853515625, 2.85430908203125, 3.0361328125, 3.21795654296875, 3.3997802734375, 3.58160400390625, 3.763427734375, 3.94525146484375, 4.1270751953125, 4.30889892578125, 4.49072265625, 4.67254638671875, 4.8543701171875, 5.03619384765625, 5.218017578125, 5.39984130859375, 5.5816650390625, 5.76348876953125, 5.9453125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 4.0, 12.0, 8.0, 12.0, 14.0, 12.0, 22.0, 19.0, 28.0, 40.0, 31.0, 47.0, 50.0, 33.0, 52.0, 55.0, 54.0, 51.0, 42.0, 64.0, 47.0, 50.0, 51.0, 41.0, 34.0, 17.0, 21.0, 16.0, 13.0, 14.0, 7.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27880859375, -0.2700157165527344, -0.26122283935546875, -0.2524299621582031, -0.2436370849609375, -0.23484420776367188, -0.22605133056640625, -0.21725845336914062, -0.208465576171875, -0.19967269897460938, -0.19087982177734375, -0.18208694458007812, -0.1732940673828125, -0.16450119018554688, -0.15570831298828125, -0.14691543579101562, -0.13812255859375, -0.12932968139648438, -0.12053680419921875, -0.11174392700195312, -0.1029510498046875, -0.09415817260742188, -0.08536529541015625, -0.07657241821289062, -0.067779541015625, -0.058986663818359375, -0.05019378662109375, -0.041400909423828125, -0.0326080322265625, -0.023815155029296875, -0.01502227783203125, -0.006229400634765625, 0.0025634765625, 0.011356353759765625, 0.02014923095703125, 0.028942108154296875, 0.0377349853515625, 0.046527862548828125, 0.05532073974609375, 0.06411361694335938, 0.072906494140625, 0.08169937133789062, 0.09049224853515625, 0.09928512573242188, 0.1080780029296875, 0.11687088012695312, 0.12566375732421875, 0.13445663452148438, 0.14324951171875, 0.15204238891601562, 0.16083526611328125, 0.16962814331054688, 0.1784210205078125, 0.18721389770507812, 0.19600677490234375, 0.20479965209960938, 0.213592529296875, 0.22238540649414062, 0.23117828369140625, 0.23997116088867188, 0.2487640380859375, 0.2575569152832031, 0.26634979248046875, 0.2751426696777344, 0.283935546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 10.0, 9.0, 12.0, 32.0, 37.0, 46.0, 84.0, 118.0, 154.0, 241.0, 331.0, 495.0, 755.0, 1144.0, 1707.0, 2624.0, 3976.0, 6441.0, 10563.0, 17947.0, 32962.0, 66478.0, 161769.0, 572077.0, 2630903.0, 423864.0, 132449.0, 56454.0, 28906.0, 15863.0, 9477.0, 5798.0, 3641.0, 2355.0, 1529.0, 971.0, 624.0, 479.0, 290.0, 207.0, 136.0, 94.0, 64.0, 39.0, 34.0, 28.0, 27.0, 13.0, 5.0, 8.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.8125, -2.7257080078125, -2.638916015625, -2.5521240234375, -2.46533203125, -2.3785400390625, -2.291748046875, -2.2049560546875, -2.1181640625, -2.0313720703125, -1.944580078125, -1.8577880859375, -1.77099609375, -1.6842041015625, -1.597412109375, -1.5106201171875, -1.423828125, -1.3370361328125, -1.250244140625, -1.1634521484375, -1.07666015625, -0.9898681640625, -0.903076171875, -0.8162841796875, -0.7294921875, -0.6427001953125, -0.555908203125, -0.4691162109375, -0.38232421875, -0.2955322265625, -0.208740234375, -0.1219482421875, -0.03515625, 0.0516357421875, 0.138427734375, 0.2252197265625, 0.31201171875, 0.3988037109375, 0.485595703125, 0.5723876953125, 0.6591796875, 0.7459716796875, 0.832763671875, 0.9195556640625, 1.00634765625, 1.0931396484375, 1.179931640625, 1.2667236328125, 1.353515625, 1.4403076171875, 1.527099609375, 1.6138916015625, 1.70068359375, 1.7874755859375, 1.874267578125, 1.9610595703125, 2.0478515625, 2.1346435546875, 2.221435546875, 2.3082275390625, 2.39501953125, 2.4818115234375, 2.568603515625, 2.6553955078125, 2.7421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 10.0, 9.0, 14.0, 17.0, 17.0, 23.0, 22.0, 50.0, 40.0, 55.0, 94.0, 128.0, 168.0, 286.0, 474.0, 1334.0, 465.0, 265.0, 151.0, 105.0, 75.0, 61.0, 40.0, 39.0, 22.0, 16.0, 16.0, 12.0, 9.0, 11.0, 5.0, 5.0, 1.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59765625, -0.5792617797851562, -0.5608673095703125, -0.5424728393554688, -0.524078369140625, -0.5056838989257812, -0.4872894287109375, -0.46889495849609375, -0.45050048828125, -0.43210601806640625, -0.4137115478515625, -0.39531707763671875, -0.376922607421875, -0.35852813720703125, -0.3401336669921875, -0.32173919677734375, -0.3033447265625, -0.28495025634765625, -0.2665557861328125, -0.24816131591796875, -0.229766845703125, -0.21137237548828125, -0.1929779052734375, -0.17458343505859375, -0.15618896484375, -0.13779449462890625, -0.1194000244140625, -0.10100555419921875, -0.082611083984375, -0.06421661376953125, -0.0458221435546875, -0.02742767333984375, -0.009033203125, 0.00936126708984375, 0.0277557373046875, 0.04615020751953125, 0.064544677734375, 0.08293914794921875, 0.1013336181640625, 0.11972808837890625, 0.13812255859375, 0.15651702880859375, 0.1749114990234375, 0.19330596923828125, 0.211700439453125, 0.23009490966796875, 0.2484893798828125, 0.26688385009765625, 0.2852783203125, 0.30367279052734375, 0.3220672607421875, 0.34046173095703125, 0.358856201171875, 0.37725067138671875, 0.3956451416015625, 0.41403961181640625, 0.43243408203125, 0.45082855224609375, 0.4692230224609375, 0.48761749267578125, 0.506011962890625, 0.5244064331054688, 0.5428009033203125, 0.5611953735351562, 0.57958984375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 7.0, 6.0, 15.0, 28.0, 66.0, 139.0, 260.0, 233.0, 130.0, 59.0, 26.0, 13.0, 5.0, 10.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.488038063049316, -8.160572052001953, -7.833106517791748, -7.505640983581543, -7.17817497253418, -6.850709438323975, -6.5232439041137695, -6.195777893066406, -5.868312358856201, -5.540846824645996, -5.213380813598633, -4.885915279388428, -4.558449745178223, -4.230983734130859, -3.9035181999206543, -3.57605242729187, -3.248586654663086, -2.9211208820343018, -2.5936551094055176, -2.2661895751953125, -1.9387238025665283, -1.6112580299377441, -1.2837923765182495, -0.9563267230987549, -0.6288609504699707, -0.3013952374458313, 0.026070475578308105, 0.3535361886024475, 0.6810019016265869, 1.008467674255371, 1.3359333276748657, 1.6633989810943604, 1.9908638000488281, 2.3183295726776123, 2.6457953453063965, 2.9732608795166016, 3.3007266521453857, 3.62819242477417, 3.955657958984375, 4.283123970031738, 4.610589504241943, 4.938055038452148, 5.265521049499512, 5.592986583709717, 5.920452117919922, 6.247918128967285, 6.57538366317749, 6.902849197387695, 7.230315208435059, 7.557780742645264, 7.885246753692627, 8.212712287902832, 8.540178298950195, 8.867643356323242, 9.195109367370605, 9.522575378417969, 9.850040435791016, 10.177506446838379, 10.504971504211426, 10.832437515258789, 11.159903526306152, 11.487369537353516, 11.814834594726562, 12.142300605773926, 12.469766616821289]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 6.0, 11.0, 7.0, 21.0, 17.0, 22.0, 27.0, 39.0, 44.0, 60.0, 69.0, 82.0, 71.0, 72.0, 63.0, 71.0, 61.0, 50.0, 53.0, 39.0, 27.0, 24.0, 13.0, 16.0, 8.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.937816858291626, -3.8137850761413574, -3.689753293991089, -3.5657215118408203, -3.4416894912719727, -3.317657947540283, -3.1936259269714355, -3.069594144821167, -2.9455623626708984, -2.82153058052063, -2.6974987983703613, -2.5734670162200928, -2.449435234069824, -2.3254032135009766, -2.201371431350708, -2.0773396492004395, -1.953307867050171, -1.8292760848999023, -1.7052443027496338, -1.5812124013900757, -1.4571806192398071, -1.3331488370895386, -1.2091169357299805, -1.085085153579712, -0.9610533714294434, -0.8370215892791748, -0.7129897475242615, -0.5889579057693481, -0.4649261236190796, -0.34089434146881104, -0.2168624997138977, -0.09283065795898438, 0.03120136260986328, 0.15523317456245422, 0.27926498651504517, 0.4032967984676361, 0.527328610420227, 0.6513603925704956, 0.7753922343254089, 0.8994240760803223, 1.0234558582305908, 1.1474876403808594, 1.271519422531128, 1.395551323890686, 1.5195831060409546, 1.6436148881912231, 1.7676467895507812, 1.8916785717010498, 2.0157103538513184, 2.139742136001587, 2.2637739181518555, 2.387805700302124, 2.5118374824523926, 2.6358695030212402, 2.759901285171509, 2.8839330673217773, 3.007964849472046, 3.1319966316223145, 3.256028413772583, 3.3800601959228516, 3.504092216491699, 3.6281237602233887, 3.7521557807922363, 3.876187562942505, 4.000219345092773]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 8.0, 1.0, 3.0, 3.0, 5.0, 7.0, 11.0, 15.0, 25.0, 27.0, 67.0, 112.0, 169.0, 293.0, 570.0, 1057.0, 2014.0, 4482.0, 9797.0, 23089.0, 59292.0, 151883.0, 318831.0, 276901.0, 119913.0, 46138.0, 18532.0, 7855.0, 3665.0, 1808.0, 914.0, 436.0, 264.0, 147.0, 76.0, 53.0, 33.0, 18.0, 15.0, 6.0, 10.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.474609375, -3.38037109375, -3.2861328125, -3.19189453125, -3.09765625, -3.00341796875, -2.9091796875, -2.81494140625, -2.720703125, -2.62646484375, -2.5322265625, -2.43798828125, -2.34375, -2.24951171875, -2.1552734375, -2.06103515625, -1.966796875, -1.87255859375, -1.7783203125, -1.68408203125, -1.58984375, -1.49560546875, -1.4013671875, -1.30712890625, -1.212890625, -1.11865234375, -1.0244140625, -0.93017578125, -0.8359375, -0.74169921875, -0.6474609375, -0.55322265625, -0.458984375, -0.36474609375, -0.2705078125, -0.17626953125, -0.08203125, 0.01220703125, 0.1064453125, 0.20068359375, 0.294921875, 0.38916015625, 0.4833984375, 0.57763671875, 0.671875, 0.76611328125, 0.8603515625, 0.95458984375, 1.048828125, 1.14306640625, 1.2373046875, 1.33154296875, 1.42578125, 1.52001953125, 1.6142578125, 1.70849609375, 1.802734375, 1.89697265625, 1.9912109375, 2.08544921875, 2.1796875, 2.27392578125, 2.3681640625, 2.46240234375, 2.556640625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 9.0, 9.0, 12.0, 11.0, 6.0, 15.0, 15.0, 19.0, 27.0, 27.0, 34.0, 38.0, 44.0, 41.0, 54.0, 60.0, 54.0, 58.0, 46.0, 57.0, 52.0, 41.0, 49.0, 39.0, 44.0, 25.0, 26.0, 19.0, 16.0, 11.0, 9.0, 4.0, 4.0, 10.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.29736328125, -0.2881011962890625, -0.278839111328125, -0.2695770263671875, -0.26031494140625, -0.2510528564453125, -0.241790771484375, -0.2325286865234375, -0.2232666015625, -0.2140045166015625, -0.204742431640625, -0.1954803466796875, -0.18621826171875, -0.1769561767578125, -0.167694091796875, -0.1584320068359375, -0.149169921875, -0.1399078369140625, -0.130645751953125, -0.1213836669921875, -0.11212158203125, -0.1028594970703125, -0.093597412109375, -0.0843353271484375, -0.0750732421875, -0.0658111572265625, -0.056549072265625, -0.0472869873046875, -0.03802490234375, -0.0287628173828125, -0.019500732421875, -0.0102386474609375, -0.0009765625, 0.0082855224609375, 0.017547607421875, 0.0268096923828125, 0.03607177734375, 0.0453338623046875, 0.054595947265625, 0.0638580322265625, 0.0731201171875, 0.0823822021484375, 0.091644287109375, 0.1009063720703125, 0.11016845703125, 0.1194305419921875, 0.128692626953125, 0.1379547119140625, 0.147216796875, 0.1564788818359375, 0.165740966796875, 0.1750030517578125, 0.18426513671875, 0.1935272216796875, 0.202789306640625, 0.2120513916015625, 0.2213134765625, 0.2305755615234375, 0.239837646484375, 0.2490997314453125, 0.25836181640625, 0.2676239013671875, 0.276885986328125, 0.2861480712890625, 0.29541015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 18.0, 20.0, 29.0, 57.0, 150.0, 386.0, 923.0, 2853.0, 11241.0, 62662.0, 469477.0, 428968.0, 56219.0, 11012.0, 2939.0, 936.0, 372.0, 145.0, 70.0, 31.0, 13.0, 14.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.54522705078125, -5.4029541015625, -5.26068115234375, -5.118408203125, -4.97613525390625, -4.8338623046875, -4.69158935546875, -4.54931640625, -4.40704345703125, -4.2647705078125, -4.12249755859375, -3.980224609375, -3.83795166015625, -3.6956787109375, -3.55340576171875, -3.4111328125, -3.26885986328125, -3.1265869140625, -2.98431396484375, -2.842041015625, -2.69976806640625, -2.5574951171875, -2.41522216796875, -2.27294921875, -2.13067626953125, -1.9884033203125, -1.84613037109375, -1.703857421875, -1.56158447265625, -1.4193115234375, -1.27703857421875, -1.134765625, -0.99249267578125, -0.8502197265625, -0.70794677734375, -0.565673828125, -0.42340087890625, -0.2811279296875, -0.13885498046875, 0.00341796875, 0.14569091796875, 0.2879638671875, 0.43023681640625, 0.572509765625, 0.71478271484375, 0.8570556640625, 0.99932861328125, 1.1416015625, 1.28387451171875, 1.4261474609375, 1.56842041015625, 1.710693359375, 1.85296630859375, 1.9952392578125, 2.13751220703125, 2.27978515625, 2.42205810546875, 2.5643310546875, 2.70660400390625, 2.848876953125, 2.99114990234375, 3.1334228515625, 3.27569580078125, 3.41796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 9.0, 7.0, 15.0, 12.0, 16.0, 26.0, 23.0, 26.0, 30.0, 28.0, 44.0, 53.0, 52.0, 64.0, 68.0, 56.0, 56.0, 63.0, 50.0, 55.0, 45.0, 28.0, 25.0, 34.0, 31.0, 24.0, 18.0, 10.0, 7.0, 10.0, 6.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4853515625, -1.4354705810546875, -1.385589599609375, -1.3357086181640625, -1.28582763671875, -1.2359466552734375, -1.186065673828125, -1.1361846923828125, -1.0863037109375, -1.0364227294921875, -0.986541748046875, -0.9366607666015625, -0.88677978515625, -0.8368988037109375, -0.787017822265625, -0.7371368408203125, -0.687255859375, -0.6373748779296875, -0.587493896484375, -0.5376129150390625, -0.48773193359375, -0.4378509521484375, -0.387969970703125, -0.3380889892578125, -0.2882080078125, -0.2383270263671875, -0.188446044921875, -0.1385650634765625, -0.08868408203125, -0.0388031005859375, 0.011077880859375, 0.0609588623046875, 0.11083984375, 0.1607208251953125, 0.210601806640625, 0.2604827880859375, 0.31036376953125, 0.3602447509765625, 0.410125732421875, 0.4600067138671875, 0.5098876953125, 0.5597686767578125, 0.609649658203125, 0.6595306396484375, 0.70941162109375, 0.7592926025390625, 0.809173583984375, 0.8590545654296875, 0.908935546875, 0.9588165283203125, 1.008697509765625, 1.0585784912109375, 1.10845947265625, 1.1583404541015625, 1.208221435546875, 1.2581024169921875, 1.3079833984375, 1.3578643798828125, 1.407745361328125, 1.4576263427734375, 1.50750732421875, 1.5573883056640625, 1.607269287109375, 1.6571502685546875, 1.70703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 9.0, 15.0, 14.0, 21.0, 32.0, 61.0, 96.0, 168.0, 325.0, 709.0, 1573.0, 4103.0, 14641.0, 73189.0, 523355.0, 364744.0, 48992.0, 10676.0, 3331.0, 1265.0, 547.0, 278.0, 158.0, 92.0, 51.0, 33.0, 20.0, 16.0, 5.0, 10.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.98828125, -5.816650390625, -5.64501953125, -5.473388671875, -5.3017578125, -5.130126953125, -4.95849609375, -4.786865234375, -4.615234375, -4.443603515625, -4.27197265625, -4.100341796875, -3.9287109375, -3.757080078125, -3.58544921875, -3.413818359375, -3.2421875, -3.070556640625, -2.89892578125, -2.727294921875, -2.5556640625, -2.384033203125, -2.21240234375, -2.040771484375, -1.869140625, -1.697509765625, -1.52587890625, -1.354248046875, -1.1826171875, -1.010986328125, -0.83935546875, -0.667724609375, -0.49609375, -0.324462890625, -0.15283203125, 0.018798828125, 0.1904296875, 0.362060546875, 0.53369140625, 0.705322265625, 0.876953125, 1.048583984375, 1.22021484375, 1.391845703125, 1.5634765625, 1.735107421875, 1.90673828125, 2.078369140625, 2.25, 2.421630859375, 2.59326171875, 2.764892578125, 2.9365234375, 3.108154296875, 3.27978515625, 3.451416015625, 3.623046875, 3.794677734375, 3.96630859375, 4.137939453125, 4.3095703125, 4.481201171875, 4.65283203125, 4.824462890625, 4.99609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 6.0, 10.0, 7.0, 10.0, 17.0, 21.0, 28.0, 34.0, 51.0, 60.0, 62.0, 75.0, 73.0, 97.0, 89.0, 78.0, 52.0, 36.0, 39.0, 34.0, 27.0, 17.0, 20.0, 10.0, 10.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003077983856201172, -0.0002982728183269501, -0.00028874725103378296, -0.00027922168374061584, -0.00026969611644744873, -0.0002601705491542816, -0.0002506449818611145, -0.0002411194145679474, -0.00023159384727478027, -0.00022206827998161316, -0.00021254271268844604, -0.00020301714539527893, -0.00019349157810211182, -0.0001839660108089447, -0.0001744404435157776, -0.00016491487622261047, -0.00015538930892944336, -0.00014586374163627625, -0.00013633817434310913, -0.00012681260704994202, -0.0001172870397567749, -0.00010776147246360779, -9.823590517044067e-05, -8.871033787727356e-05, -7.918477058410645e-05, -6.965920329093933e-05, -6.013363599777222e-05, -5.06080687046051e-05, -4.108250141143799e-05, -3.1556934118270874e-05, -2.203136682510376e-05, -1.2505799531936646e-05, -2.9802322387695312e-06, 6.545335054397583e-06, 1.6070902347564697e-05, 2.559646964073181e-05, 3.5122036933898926e-05, 4.464760422706604e-05, 5.4173171520233154e-05, 6.369873881340027e-05, 7.322430610656738e-05, 8.27498733997345e-05, 9.227544069290161e-05, 0.00010180100798606873, 0.00011132657527923584, 0.00012085214257240295, 0.00013037770986557007, 0.00013990327715873718, 0.0001494288444519043, 0.0001589544117450714, 0.00016847997903823853, 0.00017800554633140564, 0.00018753111362457275, 0.00019705668091773987, 0.00020658224821090698, 0.0002161078155040741, 0.0002256333827972412, 0.00023515895009040833, 0.00024468451738357544, 0.00025421008467674255, 0.00026373565196990967, 0.0002732612192630768, 0.0002827867865562439, 0.000292312353849411, 0.0003018379211425781]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 10.0, 19.0, 24.0, 30.0, 51.0, 76.0, 120.0, 226.0, 366.0, 690.0, 1314.0, 2611.0, 5269.0, 11980.0, 30001.0, 85346.0, 266451.0, 399266.0, 159118.0, 50736.0, 18796.0, 8080.0, 3778.0, 1834.0, 1003.0, 525.0, 314.0, 198.0, 134.0, 65.0, 34.0, 28.0, 20.0, 10.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.142303466796875, -2.05023193359375, -1.958160400390625, -1.8660888671875, -1.774017333984375, -1.68194580078125, -1.589874267578125, -1.497802734375, -1.405731201171875, -1.31365966796875, -1.221588134765625, -1.1295166015625, -1.037445068359375, -0.94537353515625, -0.853302001953125, -0.76123046875, -0.669158935546875, -0.57708740234375, -0.485015869140625, -0.3929443359375, -0.300872802734375, -0.20880126953125, -0.116729736328125, -0.024658203125, 0.067413330078125, 0.15948486328125, 0.251556396484375, 0.3436279296875, 0.435699462890625, 0.52777099609375, 0.619842529296875, 0.7119140625, 0.803985595703125, 0.89605712890625, 0.988128662109375, 1.0802001953125, 1.172271728515625, 1.26434326171875, 1.356414794921875, 1.448486328125, 1.540557861328125, 1.63262939453125, 1.724700927734375, 1.8167724609375, 1.908843994140625, 2.00091552734375, 2.092987060546875, 2.18505859375, 2.277130126953125, 2.36920166015625, 2.461273193359375, 2.5533447265625, 2.645416259765625, 2.73748779296875, 2.829559326171875, 2.921630859375, 3.013702392578125, 3.10577392578125, 3.197845458984375, 3.2899169921875, 3.381988525390625, 3.47406005859375, 3.566131591796875, 3.658203125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 6.0, 12.0, 10.0, 15.0, 19.0, 18.0, 24.0, 25.0, 23.0, 36.0, 46.0, 50.0, 54.0, 58.0, 62.0, 66.0, 68.0, 68.0, 68.0, 44.0, 37.0, 31.0, 23.0, 28.0, 23.0, 14.0, 9.0, 10.0, 12.0, 6.0, 5.0, 5.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4306640625, -1.3876953125, -1.3447265625, -1.3017578125, -1.2587890625, -1.2158203125, -1.1728515625, -1.1298828125, -1.0869140625, -1.0439453125, -1.0009765625, -0.9580078125, -0.9150390625, -0.8720703125, -0.8291015625, -0.7861328125, -0.7431640625, -0.7001953125, -0.6572265625, -0.6142578125, -0.5712890625, -0.5283203125, -0.4853515625, -0.4423828125, -0.3994140625, -0.3564453125, -0.3134765625, -0.2705078125, -0.2275390625, -0.1845703125, -0.1416015625, -0.0986328125, -0.0556640625, -0.0126953125, 0.0302734375, 0.0732421875, 0.1162109375, 0.1591796875, 0.2021484375, 0.2451171875, 0.2880859375, 0.3310546875, 0.3740234375, 0.4169921875, 0.4599609375, 0.5029296875, 0.5458984375, 0.5888671875, 0.6318359375, 0.6748046875, 0.7177734375, 0.7607421875, 0.8037109375, 0.8466796875, 0.8896484375, 0.9326171875, 0.9755859375, 1.0185546875, 1.0615234375, 1.1044921875, 1.1474609375, 1.1904296875, 1.2333984375, 1.2763671875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 13.0, 15.0, 22.0, 62.0, 99.0, 151.0, 167.0, 149.0, 128.0, 73.0, 48.0, 24.0, 15.0, 9.0, 8.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.550960540771484, -23.866518020629883, -23.18207359313965, -22.497631072998047, -21.813186645507812, -21.12874412536621, -20.44430160522461, -19.759857177734375, -19.07541275024414, -18.39097023010254, -17.706525802612305, -17.022083282470703, -16.33763885498047, -15.653196334838867, -14.96875286102295, -14.284309387207031, -13.59986686706543, -12.915423393249512, -12.230979919433594, -11.546537399291992, -10.862092971801758, -10.177650451660156, -9.493206977844238, -8.80876350402832, -8.124320030212402, -7.439876556396484, -6.755433082580566, -6.070990085601807, -5.386546611785889, -4.702103137969971, -4.017660140991211, -3.333216667175293, -2.648775100708008, -1.9643317461013794, -1.279888391494751, -0.5954451560974121, 0.08899831771850586, 0.7734417915344238, 1.4578847885131836, 2.1423282623291016, 2.8267717361450195, 3.5112152099609375, 4.1956586837768555, 4.880101680755615, 5.564545154571533, 6.248988628387451, 6.933431625366211, 7.617875099182129, 8.302318572998047, 8.986762046813965, 9.671205520629883, 10.355648040771484, 11.040092468261719, 11.72453498840332, 12.408978462219238, 13.093421936035156, 13.777865409851074, 14.462308883666992, 15.14675235748291, 15.831195831298828, 16.51563835144043, 17.200082778930664, 17.884525299072266, 18.5689697265625, 19.2534122467041]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 9.0, 8.0, 12.0, 16.0, 15.0, 32.0, 39.0, 40.0, 51.0, 53.0, 61.0, 62.0, 67.0, 78.0, 66.0, 67.0, 59.0, 48.0, 37.0, 38.0, 36.0, 21.0, 19.0, 13.0, 10.0, 9.0, 7.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.812142372131348, -13.426776885986328, -13.041411399841309, -12.656045913696289, -12.27068042755127, -11.88531494140625, -11.49994945526123, -11.114583969116211, -10.729218482971191, -10.343852996826172, -9.958487510681152, -9.573122024536133, -9.187756538391113, -8.802391052246094, -8.417025566101074, -8.031660079956055, -7.646294116973877, -7.260928630828857, -6.875563144683838, -6.490197658538818, -6.104832172393799, -5.719466686248779, -5.334100723266602, -4.948735237121582, -4.5633697509765625, -4.178004264831543, -3.7926387786865234, -3.407273292541504, -3.0219078063964844, -2.636542320251465, -2.251176595687866, -1.8658111095428467, -1.4804458618164062, -1.0950803756713867, -0.7097148299217224, -0.3243492841720581, 0.061016201972961426, 0.44638168811798096, 0.83174729347229, 1.2171127796173096, 1.602478265762329, 1.9878437519073486, 2.373209238052368, 2.758574962615967, 3.1439404487609863, 3.529305934906006, 3.9146714210510254, 4.300036907196045, 4.6854023933410645, 5.070767879486084, 5.4561333656311035, 5.841498851776123, 6.226864337921143, 6.612229824066162, 6.99759578704834, 7.382961273193359, 7.768326759338379, 8.153692245483398, 8.539057731628418, 8.924423217773438, 9.309788703918457, 9.695154190063477, 10.080519676208496, 10.465885162353516, 10.851250648498535]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 10.0, 12.0, 19.0, 39.0, 76.0, 131.0, 206.0, 424.0, 826.0, 1560.0, 3236.0, 7110.0, 17254.0, 48061.0, 171808.0, 2350738.0, 1365173.0, 156433.0, 44480.0, 15733.0, 6116.0, 2523.0, 1147.0, 514.0, 264.0, 144.0, 88.0, 49.0, 35.0, 20.0, 20.0, 8.0, 10.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.77734375, -4.5859375, -4.39453125, -4.203125, -4.01171875, -3.8203125, -3.62890625, -3.4375, -3.24609375, -3.0546875, -2.86328125, -2.671875, -2.48046875, -2.2890625, -2.09765625, -1.90625, -1.71484375, -1.5234375, -1.33203125, -1.140625, -0.94921875, -0.7578125, -0.56640625, -0.375, -0.18359375, 0.0078125, 0.19921875, 0.390625, 0.58203125, 0.7734375, 0.96484375, 1.15625, 1.34765625, 1.5390625, 1.73046875, 1.921875, 2.11328125, 2.3046875, 2.49609375, 2.6875, 2.87890625, 3.0703125, 3.26171875, 3.453125, 3.64453125, 3.8359375, 4.02734375, 4.21875, 4.41015625, 4.6015625, 4.79296875, 4.984375, 5.17578125, 5.3671875, 5.55859375, 5.75, 5.94140625, 6.1328125, 6.32421875, 6.515625, 6.70703125, 6.8984375, 7.08984375, 7.28125, 7.47265625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 12.0, 6.0, 9.0, 10.0, 19.0, 18.0, 12.0, 40.0, 31.0, 45.0, 36.0, 30.0, 53.0, 73.0, 57.0, 60.0, 43.0, 55.0, 59.0, 60.0, 53.0, 40.0, 35.0, 26.0, 25.0, 23.0, 20.0, 14.0, 6.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.333251953125, -0.323272705078125, -0.31329345703125, -0.303314208984375, -0.2933349609375, -0.283355712890625, -0.27337646484375, -0.263397216796875, -0.25341796875, -0.243438720703125, -0.23345947265625, -0.223480224609375, -0.2135009765625, -0.203521728515625, -0.19354248046875, -0.183563232421875, -0.173583984375, -0.163604736328125, -0.15362548828125, -0.143646240234375, -0.1336669921875, -0.123687744140625, -0.11370849609375, -0.103729248046875, -0.09375, -0.083770751953125, -0.07379150390625, -0.063812255859375, -0.0538330078125, -0.043853759765625, -0.03387451171875, -0.023895263671875, -0.013916015625, -0.003936767578125, 0.00604248046875, 0.016021728515625, 0.0260009765625, 0.035980224609375, 0.04595947265625, 0.055938720703125, 0.06591796875, 0.075897216796875, 0.08587646484375, 0.095855712890625, 0.1058349609375, 0.115814208984375, 0.12579345703125, 0.135772705078125, 0.145751953125, 0.155731201171875, 0.16571044921875, 0.175689697265625, 0.1856689453125, 0.195648193359375, 0.20562744140625, 0.215606689453125, 0.2255859375, 0.235565185546875, 0.24554443359375, 0.255523681640625, 0.2655029296875, 0.275482177734375, 0.28546142578125, 0.295440673828125, 0.305419921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 8.0, 9.0, 13.0, 16.0, 19.0, 32.0, 43.0, 86.0, 191.0, 343.0, 1044.0, 3860.0, 20898.0, 193839.0, 3587231.0, 348608.0, 30446.0, 5373.0, 1297.0, 456.0, 201.0, 90.0, 42.0, 32.0, 18.0, 17.0, 10.0, 10.0, 14.0, 10.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.921875, -10.56494140625, -10.2080078125, -9.85107421875, -9.494140625, -9.13720703125, -8.7802734375, -8.42333984375, -8.06640625, -7.70947265625, -7.3525390625, -6.99560546875, -6.638671875, -6.28173828125, -5.9248046875, -5.56787109375, -5.2109375, -4.85400390625, -4.4970703125, -4.14013671875, -3.783203125, -3.42626953125, -3.0693359375, -2.71240234375, -2.35546875, -1.99853515625, -1.6416015625, -1.28466796875, -0.927734375, -0.57080078125, -0.2138671875, 0.14306640625, 0.5, 0.85693359375, 1.2138671875, 1.57080078125, 1.927734375, 2.28466796875, 2.6416015625, 2.99853515625, 3.35546875, 3.71240234375, 4.0693359375, 4.42626953125, 4.783203125, 5.14013671875, 5.4970703125, 5.85400390625, 6.2109375, 6.56787109375, 6.9248046875, 7.28173828125, 7.638671875, 7.99560546875, 8.3525390625, 8.70947265625, 9.06640625, 9.42333984375, 9.7802734375, 10.13720703125, 10.494140625, 10.85107421875, 11.2080078125, 11.56494140625, 11.921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 11.0, 10.0, 4.0, 10.0, 11.0, 11.0, 26.0, 24.0, 52.0, 63.0, 66.0, 116.0, 182.0, 294.0, 486.0, 1102.0, 610.0, 297.0, 218.0, 114.0, 107.0, 65.0, 56.0, 36.0, 29.0, 15.0, 18.0, 12.0, 8.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.888671875, -0.858795166015625, -0.82891845703125, -0.799041748046875, -0.7691650390625, -0.739288330078125, -0.70941162109375, -0.679534912109375, -0.649658203125, -0.619781494140625, -0.58990478515625, -0.560028076171875, -0.5301513671875, -0.500274658203125, -0.47039794921875, -0.440521240234375, -0.41064453125, -0.380767822265625, -0.35089111328125, -0.321014404296875, -0.2911376953125, -0.261260986328125, -0.23138427734375, -0.201507568359375, -0.171630859375, -0.141754150390625, -0.11187744140625, -0.082000732421875, -0.0521240234375, -0.022247314453125, 0.00762939453125, 0.037506103515625, 0.0673828125, 0.097259521484375, 0.12713623046875, 0.157012939453125, 0.1868896484375, 0.216766357421875, 0.24664306640625, 0.276519775390625, 0.306396484375, 0.336273193359375, 0.36614990234375, 0.396026611328125, 0.4259033203125, 0.455780029296875, 0.48565673828125, 0.515533447265625, 0.54541015625, 0.575286865234375, 0.60516357421875, 0.635040283203125, 0.6649169921875, 0.694793701171875, 0.72467041015625, 0.754547119140625, 0.784423828125, 0.814300537109375, 0.84417724609375, 0.874053955078125, 0.9039306640625, 0.933807373046875, 0.96368408203125, 0.993560791015625, 1.0234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 12.0, 28.0, 62.0, 82.0, 133.0, 179.0, 189.0, 129.0, 89.0, 34.0, 25.0, 21.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.062541007995605, -8.715465545654297, -8.368391036987305, -8.021315574645996, -7.674240589141846, -7.327165603637695, -6.980090141296387, -6.633015155792236, -6.285940170288086, -5.9388651847839355, -5.591790199279785, -5.244714736938477, -4.897639751434326, -4.550564765930176, -4.203489303588867, -3.856414318084717, -3.5093393325805664, -3.162264347076416, -2.8151891231536865, -2.468113899230957, -2.1210389137268066, -1.7739638090133667, -1.4268887042999268, -1.0798134803771973, -0.7327384948730469, -0.38566339015960693, -0.03858828544616699, 0.30848681926727295, 0.6555619239807129, 1.0026370286941528, 1.3497121334075928, 1.6967873573303223, 2.043863296508789, 2.3909382820129395, 2.738013505935669, 3.0850887298583984, 3.432163715362549, 3.779238700866699, 4.126314163208008, 4.473389148712158, 4.820464134216309, 5.167539119720459, 5.514614105224609, 5.861689567565918, 6.208764553070068, 6.555839538574219, 6.902915000915527, 7.249989986419678, 7.597064971923828, 7.9441399574279785, 8.291214942932129, 8.638290405273438, 8.98536491394043, 9.332440376281738, 9.679515838623047, 10.026590347290039, 10.373665809631348, 10.720741271972656, 11.067815780639648, 11.414891242980957, 11.761966705322266, 12.109041213989258, 12.456116676330566, 12.803192138671875, 13.150266647338867]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 5.0, 7.0, 3.0, 4.0, 5.0, 11.0, 11.0, 9.0, 25.0, 20.0, 21.0, 28.0, 31.0, 26.0, 37.0, 25.0, 39.0, 30.0, 44.0, 40.0, 36.0, 38.0, 54.0, 39.0, 43.0, 39.0, 38.0, 32.0, 37.0, 34.0, 27.0, 25.0, 25.0, 15.0, 25.0, 21.0, 14.0, 8.0, 3.0, 5.0, 6.0, 4.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5986080169677734, -3.4780592918395996, -3.357510805130005, -3.236962080001831, -3.1164133548736572, -2.9958648681640625, -2.8753161430358887, -2.754767417907715, -2.63421893119812, -2.5136702060699463, -2.3931217193603516, -2.2725729942321777, -2.152024269104004, -2.031475782394409, -1.9109270572662354, -1.790378451347351, -1.6698297262191772, -1.549281120300293, -1.4287323951721191, -1.3081837892532349, -1.1876351833343506, -1.0670864582061768, -0.9465378522872925, -0.8259892463684082, -0.7054405808448792, -0.5848919153213501, -0.4643433094024658, -0.34379464387893677, -0.2232460081577301, -0.10269737243652344, 0.017851293087005615, 0.1383998990058899, 0.25894856452941895, 0.3794972002506256, 0.5000458359718323, 0.6205945014953613, 0.7411431074142456, 0.8616917729377747, 0.9822404384613037, 1.102789044380188, 1.2233376502990723, 1.3438862562179565, 1.4644349813461304, 1.5849835872650146, 1.705532193183899, 1.8260807991027832, 1.946629524230957, 2.067178249359131, 2.1877269744873047, 2.3082756996154785, 2.4288241863250732, 2.549372911453247, 2.669921636581421, 2.7904701232910156, 2.9110188484191895, 3.0315675735473633, 3.152116060256958, 3.272664785385132, 3.3932132720947266, 3.5137619972229004, 3.634310722351074, 3.754859209060669, 3.8754079341888428, 3.9959564208984375, 4.116505146026611]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 11.0, 7.0, 14.0, 17.0, 31.0, 53.0, 118.0, 190.0, 455.0, 1101.0, 2839.0, 8572.0, 28701.0, 106903.0, 362398.0, 378425.0, 113748.0, 30822.0, 9034.0, 3035.0, 1100.0, 490.0, 215.0, 100.0, 52.0, 39.0, 20.0, 12.0, 16.0, 8.0, 10.0, 2.0, 4.0, 3.0, 0.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.50140380859375, -4.3348388671875, -4.16827392578125, -4.001708984375, -3.83514404296875, -3.6685791015625, -3.50201416015625, -3.33544921875, -3.16888427734375, -3.0023193359375, -2.83575439453125, -2.669189453125, -2.50262451171875, -2.3360595703125, -2.16949462890625, -2.0029296875, -1.83636474609375, -1.6697998046875, -1.50323486328125, -1.336669921875, -1.17010498046875, -1.0035400390625, -0.83697509765625, -0.67041015625, -0.50384521484375, -0.3372802734375, -0.17071533203125, -0.004150390625, 0.16241455078125, 0.3289794921875, 0.49554443359375, 0.662109375, 0.82867431640625, 0.9952392578125, 1.16180419921875, 1.328369140625, 1.49493408203125, 1.6614990234375, 1.82806396484375, 1.99462890625, 2.16119384765625, 2.3277587890625, 2.49432373046875, 2.660888671875, 2.82745361328125, 2.9940185546875, 3.16058349609375, 3.3271484375, 3.49371337890625, 3.6602783203125, 3.82684326171875, 3.993408203125, 4.15997314453125, 4.3265380859375, 4.49310302734375, 4.65966796875, 4.82623291015625, 4.9927978515625, 5.15936279296875, 5.325927734375, 5.49249267578125, 5.6590576171875, 5.82562255859375, 5.9921875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 3.0, 5.0, 6.0, 9.0, 11.0, 21.0, 26.0, 27.0, 27.0, 29.0, 47.0, 32.0, 60.0, 54.0, 57.0, 53.0, 64.0, 68.0, 47.0, 45.0, 54.0, 55.0, 44.0, 32.0, 29.0, 21.0, 17.0, 11.0, 13.0, 12.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.317138671875, -0.3054962158203125, -0.293853759765625, -0.2822113037109375, -0.27056884765625, -0.2589263916015625, -0.247283935546875, -0.2356414794921875, -0.2239990234375, -0.2123565673828125, -0.200714111328125, -0.1890716552734375, -0.17742919921875, -0.1657867431640625, -0.154144287109375, -0.1425018310546875, -0.130859375, -0.1192169189453125, -0.107574462890625, -0.0959320068359375, -0.08428955078125, -0.0726470947265625, -0.061004638671875, -0.0493621826171875, -0.0377197265625, -0.0260772705078125, -0.014434814453125, -0.0027923583984375, 0.00885009765625, 0.0204925537109375, 0.032135009765625, 0.0437774658203125, 0.055419921875, 0.0670623779296875, 0.078704833984375, 0.0903472900390625, 0.10198974609375, 0.1136322021484375, 0.125274658203125, 0.1369171142578125, 0.1485595703125, 0.1602020263671875, 0.171844482421875, 0.1834869384765625, 0.19512939453125, 0.2067718505859375, 0.218414306640625, 0.2300567626953125, 0.24169921875, 0.2533416748046875, 0.264984130859375, 0.2766265869140625, 0.28826904296875, 0.2999114990234375, 0.311553955078125, 0.3231964111328125, 0.3348388671875, 0.3464813232421875, 0.358123779296875, 0.3697662353515625, 0.38140869140625, 0.3930511474609375, 0.404693603515625, 0.4163360595703125, 0.427978515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 5.0, 7.0, 9.0, 8.0, 17.0, 18.0, 28.0, 49.0, 55.0, 80.0, 104.0, 160.0, 294.0, 456.0, 824.0, 1506.0, 2927.0, 6691.0, 17015.0, 48352.0, 155621.0, 405852.0, 275081.0, 85562.0, 28588.0, 10263.0, 4218.0, 1980.0, 1084.0, 625.0, 393.0, 211.0, 120.0, 108.0, 84.0, 43.0, 40.0, 21.0, 10.0, 4.0, 10.0, 6.0, 7.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.08203125, -4.93145751953125, -4.7808837890625, -4.63031005859375, -4.479736328125, -4.32916259765625, -4.1785888671875, -4.02801513671875, -3.87744140625, -3.72686767578125, -3.5762939453125, -3.42572021484375, -3.275146484375, -3.12457275390625, -2.9739990234375, -2.82342529296875, -2.6728515625, -2.52227783203125, -2.3717041015625, -2.22113037109375, -2.070556640625, -1.91998291015625, -1.7694091796875, -1.61883544921875, -1.46826171875, -1.31768798828125, -1.1671142578125, -1.01654052734375, -0.865966796875, -0.71539306640625, -0.5648193359375, -0.41424560546875, -0.263671875, -0.11309814453125, 0.0374755859375, 0.18804931640625, 0.338623046875, 0.48919677734375, 0.6397705078125, 0.79034423828125, 0.94091796875, 1.09149169921875, 1.2420654296875, 1.39263916015625, 1.543212890625, 1.69378662109375, 1.8443603515625, 1.99493408203125, 2.1455078125, 2.29608154296875, 2.4466552734375, 2.59722900390625, 2.747802734375, 2.89837646484375, 3.0489501953125, 3.19952392578125, 3.35009765625, 3.50067138671875, 3.6512451171875, 3.80181884765625, 3.952392578125, 4.10296630859375, 4.2535400390625, 4.40411376953125, 4.5546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 16.0, 12.0, 20.0, 20.0, 21.0, 33.0, 37.0, 33.0, 46.0, 43.0, 58.0, 51.0, 63.0, 60.0, 51.0, 60.0, 55.0, 51.0, 57.0, 35.0, 35.0, 31.0, 23.0, 22.0, 9.0, 23.0, 11.0, 6.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83203125, -2.742706298828125, -2.65338134765625, -2.564056396484375, -2.4747314453125, -2.385406494140625, -2.29608154296875, -2.206756591796875, -2.117431640625, -2.028106689453125, -1.93878173828125, -1.849456787109375, -1.7601318359375, -1.670806884765625, -1.58148193359375, -1.492156982421875, -1.40283203125, -1.313507080078125, -1.22418212890625, -1.134857177734375, -1.0455322265625, -0.956207275390625, -0.86688232421875, -0.777557373046875, -0.688232421875, -0.598907470703125, -0.50958251953125, -0.420257568359375, -0.3309326171875, -0.241607666015625, -0.15228271484375, -0.062957763671875, 0.0263671875, 0.115692138671875, 0.20501708984375, 0.294342041015625, 0.3836669921875, 0.472991943359375, 0.56231689453125, 0.651641845703125, 0.740966796875, 0.830291748046875, 0.91961669921875, 1.008941650390625, 1.0982666015625, 1.187591552734375, 1.27691650390625, 1.366241455078125, 1.45556640625, 1.544891357421875, 1.63421630859375, 1.723541259765625, 1.8128662109375, 1.902191162109375, 1.99151611328125, 2.080841064453125, 2.170166015625, 2.259490966796875, 2.34881591796875, 2.438140869140625, 2.5274658203125, 2.616790771484375, 2.70611572265625, 2.795440673828125, 2.884765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 12.0, 8.0, 10.0, 19.0, 25.0, 32.0, 35.0, 55.0, 65.0, 78.0, 102.0, 157.0, 193.0, 333.0, 433.0, 641.0, 1019.0, 1703.0, 2979.0, 5832.0, 13301.0, 35432.0, 114043.0, 356948.0, 346064.0, 108980.0, 33989.0, 12630.0, 5625.0, 3008.0, 1654.0, 949.0, 643.0, 439.0, 308.0, 246.0, 131.0, 111.0, 96.0, 61.0, 53.0, 22.0, 28.0, 19.0, 15.0, 7.0, 6.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 1.0], "bins": [-3.921875, -3.80645751953125, -3.6910400390625, -3.57562255859375, -3.460205078125, -3.34478759765625, -3.2293701171875, -3.11395263671875, -2.99853515625, -2.88311767578125, -2.7677001953125, -2.65228271484375, -2.536865234375, -2.42144775390625, -2.3060302734375, -2.19061279296875, -2.0751953125, -1.95977783203125, -1.8443603515625, -1.72894287109375, -1.613525390625, -1.49810791015625, -1.3826904296875, -1.26727294921875, -1.15185546875, -1.03643798828125, -0.9210205078125, -0.80560302734375, -0.690185546875, -0.57476806640625, -0.4593505859375, -0.34393310546875, -0.228515625, -0.11309814453125, 0.0023193359375, 0.11773681640625, 0.233154296875, 0.34857177734375, 0.4639892578125, 0.57940673828125, 0.69482421875, 0.81024169921875, 0.9256591796875, 1.04107666015625, 1.156494140625, 1.27191162109375, 1.3873291015625, 1.50274658203125, 1.6181640625, 1.73358154296875, 1.8489990234375, 1.96441650390625, 2.079833984375, 2.19525146484375, 2.3106689453125, 2.42608642578125, 2.54150390625, 2.65692138671875, 2.7723388671875, 2.88775634765625, 3.003173828125, 3.11859130859375, 3.2340087890625, 3.34942626953125, 3.46484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 10.0, 4.0, 7.0, 15.0, 12.0, 23.0, 28.0, 38.0, 73.0, 99.0, 133.0, 126.0, 120.0, 86.0, 65.0, 43.0, 25.0, 28.0, 15.0, 14.0, 6.0, 5.0, 4.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0006742477416992188, -0.0006527304649353027, -0.0006312131881713867, -0.0006096959114074707, -0.0005881786346435547, -0.0005666613578796387, -0.0005451440811157227, -0.0005236268043518066, -0.0005021095275878906, -0.0004805922508239746, -0.0004590749740600586, -0.0004375576972961426, -0.00041604042053222656, -0.00039452314376831055, -0.00037300586700439453, -0.0003514885902404785, -0.0003299713134765625, -0.0003084540367126465, -0.00028693675994873047, -0.00026541948318481445, -0.00024390220642089844, -0.00022238492965698242, -0.0002008676528930664, -0.0001793503761291504, -0.00015783309936523438, -0.00013631582260131836, -0.00011479854583740234, -9.328126907348633e-05, -7.176399230957031e-05, -5.02467155456543e-05, -2.872943878173828e-05, -7.212162017822266e-06, 1.430511474609375e-05, 3.5822391510009766e-05, 5.733966827392578e-05, 7.88569450378418e-05, 0.00010037422180175781, 0.00012189149856567383, 0.00014340877532958984, 0.00016492605209350586, 0.00018644332885742188, 0.0002079606056213379, 0.0002294778823852539, 0.0002509951591491699, 0.00027251243591308594, 0.00029402971267700195, 0.00031554698944091797, 0.000337064266204834, 0.00035858154296875, 0.000380098819732666, 0.00040161609649658203, 0.00042313337326049805, 0.00044465065002441406, 0.0004661679267883301, 0.0004876852035522461, 0.0005092024803161621, 0.0005307197570800781, 0.0005522370338439941, 0.0005737543106079102, 0.0005952715873718262, 0.0006167888641357422, 0.0006383061408996582, 0.0006598234176635742, 0.0006813406944274902, 0.0007028579711914062]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 8.0, 6.0, 5.0, 6.0, 13.0, 18.0, 34.0, 38.0, 58.0, 116.0, 153.0, 243.0, 464.0, 911.0, 1799.0, 4195.0, 11618.0, 43305.0, 223616.0, 565967.0, 148756.0, 31388.0, 9165.0, 3367.0, 1539.0, 759.0, 380.0, 215.0, 140.0, 80.0, 63.0, 33.0, 33.0, 24.0, 6.0, 5.0, 12.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.32421875, -5.14898681640625, -4.9737548828125, -4.79852294921875, -4.623291015625, -4.44805908203125, -4.2728271484375, -4.09759521484375, -3.92236328125, -3.74713134765625, -3.5718994140625, -3.39666748046875, -3.221435546875, -3.04620361328125, -2.8709716796875, -2.69573974609375, -2.5205078125, -2.34527587890625, -2.1700439453125, -1.99481201171875, -1.819580078125, -1.64434814453125, -1.4691162109375, -1.29388427734375, -1.11865234375, -0.94342041015625, -0.7681884765625, -0.59295654296875, -0.417724609375, -0.24249267578125, -0.0672607421875, 0.10797119140625, 0.283203125, 0.45843505859375, 0.6336669921875, 0.80889892578125, 0.984130859375, 1.15936279296875, 1.3345947265625, 1.50982666015625, 1.68505859375, 1.86029052734375, 2.0355224609375, 2.21075439453125, 2.385986328125, 2.56121826171875, 2.7364501953125, 2.91168212890625, 3.0869140625, 3.26214599609375, 3.4373779296875, 3.61260986328125, 3.787841796875, 3.96307373046875, 4.1383056640625, 4.31353759765625, 4.48876953125, 4.66400146484375, 4.8392333984375, 5.01446533203125, 5.189697265625, 5.36492919921875, 5.5401611328125, 5.71539306640625, 5.890625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 5.0, 12.0, 8.0, 11.0, 20.0, 29.0, 54.0, 64.0, 76.0, 95.0, 105.0, 99.0, 116.0, 73.0, 70.0, 44.0, 34.0, 18.0, 23.0, 12.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.439453125, -2.3424072265625, -2.245361328125, -2.1483154296875, -2.05126953125, -1.9542236328125, -1.857177734375, -1.7601318359375, -1.6630859375, -1.5660400390625, -1.468994140625, -1.3719482421875, -1.27490234375, -1.1778564453125, -1.080810546875, -0.9837646484375, -0.88671875, -0.7896728515625, -0.692626953125, -0.5955810546875, -0.49853515625, -0.4014892578125, -0.304443359375, -0.2073974609375, -0.1103515625, -0.0133056640625, 0.083740234375, 0.1807861328125, 0.27783203125, 0.3748779296875, 0.471923828125, 0.5689697265625, 0.666015625, 0.7630615234375, 0.860107421875, 0.9571533203125, 1.05419921875, 1.1512451171875, 1.248291015625, 1.3453369140625, 1.4423828125, 1.5394287109375, 1.636474609375, 1.7335205078125, 1.83056640625, 1.9276123046875, 2.024658203125, 2.1217041015625, 2.21875, 2.3157958984375, 2.412841796875, 2.5098876953125, 2.60693359375, 2.7039794921875, 2.801025390625, 2.8980712890625, 2.9951171875, 3.0921630859375, 3.189208984375, 3.2862548828125, 3.38330078125, 3.4803466796875, 3.577392578125, 3.6744384765625, 3.771484375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 7.0, 13.0, 24.0, 57.0, 128.0, 195.0, 196.0, 159.0, 111.0, 45.0, 31.0, 15.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.039459228515625, -48.49869918823242, -46.95793914794922, -45.41717529296875, -43.87641525268555, -42.335655212402344, -40.79489517211914, -39.25413513183594, -37.713375091552734, -36.17261505126953, -34.63185501098633, -33.091094970703125, -31.55033302307129, -30.009571075439453, -28.46881103515625, -26.928050994873047, -25.38728904724121, -23.846529006958008, -22.305767059326172, -20.76500701904297, -19.224246978759766, -17.683486938476562, -16.142724990844727, -14.601964950561523, -13.061203956604004, -11.520442962646484, -9.979682922363281, -8.438921928405762, -6.8981614112854, -5.357400894165039, -3.8166399002075195, -2.2758798599243164, -0.7351188659667969, 0.805641770362854, 2.346402406692505, 3.8871631622314453, 5.427923679351807, 6.968684196472168, 8.509445190429688, 10.05020523071289, 11.59096622467041, 13.13172721862793, 14.672487258911133, 16.21324920654297, 17.754009246826172, 19.294769287109375, 20.835529327392578, 22.37628936767578, 23.917051315307617, 25.45781135559082, 26.998573303222656, 28.53933334350586, 30.080093383789062, 31.620853424072266, 33.16161346435547, 34.70237731933594, 36.24313735961914, 37.783897399902344, 39.32465744018555, 40.86541748046875, 42.40618133544922, 43.94694137573242, 45.487701416015625, 47.02846145629883, 48.56922149658203]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 7.0, 5.0, 1.0, 6.0, 10.0, 14.0, 17.0, 14.0, 16.0, 30.0, 42.0, 25.0, 34.0, 38.0, 34.0, 51.0, 56.0, 43.0, 53.0, 47.0, 53.0, 47.0, 57.0, 45.0, 38.0, 27.0, 31.0, 25.0, 21.0, 28.0, 21.0, 13.0, 11.0, 9.0, 11.0, 8.0, 7.0, 1.0, 1.0, 0.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.185787200927734, -18.594310760498047, -18.00283432006836, -17.411357879638672, -16.819881439208984, -16.228403091430664, -15.636926651000977, -15.045450210571289, -14.453973770141602, -13.862497329711914, -13.271020889282227, -12.679543495178223, -12.088067054748535, -11.496590614318848, -10.905113220214844, -10.313636779785156, -9.722160339355469, -9.130683898925781, -8.539207458496094, -7.94773006439209, -7.356253623962402, -6.764777183532715, -6.173300266265869, -5.581823348999023, -4.990346908569336, -4.398870468139648, -3.8073935508728027, -3.215916872024536, -2.6244401931762695, -2.032963514328003, -1.4414868354797363, -0.8500099182128906, -0.2585334777832031, 0.3329432010650635, 0.9244198799133301, 1.5158965587615967, 2.1073732376098633, 2.69884991645813, 3.2903265953063965, 3.881803512573242, 4.47327995300293, 5.064756393432617, 5.656233310699463, 6.247710227966309, 6.839186668395996, 7.430663108825684, 8.022140502929688, 8.613616943359375, 9.205093383789062, 9.79656982421875, 10.388046264648438, 10.979523658752441, 11.571000099182129, 12.162476539611816, 12.75395393371582, 13.345430374145508, 13.936906814575195, 14.528383255004883, 15.11985969543457, 15.711337089538574, 16.302814483642578, 16.894290924072266, 17.485767364501953, 18.07724380493164, 18.668720245361328]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 14.0, 14.0, 19.0, 53.0, 80.0, 131.0, 243.0, 446.0, 791.0, 1518.0, 3073.0, 7136.0, 18173.0, 52831.0, 201507.0, 3072613.0, 666674.0, 112885.0, 33425.0, 12216.0, 5081.0, 2371.0, 1201.0, 630.0, 396.0, 237.0, 143.0, 105.0, 58.0, 44.0, 46.0, 29.0, 19.0, 12.0, 9.0, 10.0, 7.0, 6.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.60546875, -4.40350341796875, -4.2015380859375, -3.99957275390625, -3.797607421875, -3.59564208984375, -3.3936767578125, -3.19171142578125, -2.98974609375, -2.78778076171875, -2.5858154296875, -2.38385009765625, -2.181884765625, -1.97991943359375, -1.7779541015625, -1.57598876953125, -1.3740234375, -1.17205810546875, -0.9700927734375, -0.76812744140625, -0.566162109375, -0.36419677734375, -0.1622314453125, 0.03973388671875, 0.24169921875, 0.44366455078125, 0.6456298828125, 0.84759521484375, 1.049560546875, 1.25152587890625, 1.4534912109375, 1.65545654296875, 1.857421875, 2.05938720703125, 2.2613525390625, 2.46331787109375, 2.665283203125, 2.86724853515625, 3.0692138671875, 3.27117919921875, 3.47314453125, 3.67510986328125, 3.8770751953125, 4.07904052734375, 4.281005859375, 4.48297119140625, 4.6849365234375, 4.88690185546875, 5.0888671875, 5.29083251953125, 5.4927978515625, 5.69476318359375, 5.896728515625, 6.09869384765625, 6.3006591796875, 6.50262451171875, 6.70458984375, 6.90655517578125, 7.1085205078125, 7.31048583984375, 7.512451171875, 7.71441650390625, 7.9163818359375, 8.11834716796875, 8.3203125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 6.0, 11.0, 10.0, 14.0, 20.0, 16.0, 31.0, 29.0, 45.0, 45.0, 51.0, 46.0, 64.0, 69.0, 66.0, 50.0, 67.0, 54.0, 62.0, 41.0, 34.0, 32.0, 27.0, 15.0, 17.0, 16.0, 15.0, 7.0, 10.0, 3.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4765625, -0.460968017578125, -0.44537353515625, -0.429779052734375, -0.4141845703125, -0.398590087890625, -0.38299560546875, -0.367401123046875, -0.351806640625, -0.336212158203125, -0.32061767578125, -0.305023193359375, -0.2894287109375, -0.273834228515625, -0.25823974609375, -0.242645263671875, -0.22705078125, -0.211456298828125, -0.19586181640625, -0.180267333984375, -0.1646728515625, -0.149078369140625, -0.13348388671875, -0.117889404296875, -0.102294921875, -0.086700439453125, -0.07110595703125, -0.055511474609375, -0.0399169921875, -0.024322509765625, -0.00872802734375, 0.006866455078125, 0.0224609375, 0.038055419921875, 0.05364990234375, 0.069244384765625, 0.0848388671875, 0.100433349609375, 0.11602783203125, 0.131622314453125, 0.147216796875, 0.162811279296875, 0.17840576171875, 0.194000244140625, 0.2095947265625, 0.225189208984375, 0.24078369140625, 0.256378173828125, 0.27197265625, 0.287567138671875, 0.30316162109375, 0.318756103515625, 0.3343505859375, 0.349945068359375, 0.36553955078125, 0.381134033203125, 0.396728515625, 0.412322998046875, 0.42791748046875, 0.443511962890625, 0.4591064453125, 0.474700927734375, 0.49029541015625, 0.505889892578125, 0.521484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 7.0, 8.0, 16.0, 26.0, 39.0, 44.0, 92.0, 196.0, 528.0, 1276.0, 4516.0, 20354.0, 157228.0, 3589880.0, 374747.0, 35106.0, 7023.0, 1954.0, 645.0, 280.0, 117.0, 72.0, 41.0, 29.0, 17.0, 15.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.40869140625, -7.9580078125, -7.50732421875, -7.056640625, -6.60595703125, -6.1552734375, -5.70458984375, -5.25390625, -4.80322265625, -4.3525390625, -3.90185546875, -3.451171875, -3.00048828125, -2.5498046875, -2.09912109375, -1.6484375, -1.19775390625, -0.7470703125, -0.29638671875, 0.154296875, 0.60498046875, 1.0556640625, 1.50634765625, 1.95703125, 2.40771484375, 2.8583984375, 3.30908203125, 3.759765625, 4.21044921875, 4.6611328125, 5.11181640625, 5.5625, 6.01318359375, 6.4638671875, 6.91455078125, 7.365234375, 7.81591796875, 8.2666015625, 8.71728515625, 9.16796875, 9.61865234375, 10.0693359375, 10.52001953125, 10.970703125, 11.42138671875, 11.8720703125, 12.32275390625, 12.7734375, 13.22412109375, 13.6748046875, 14.12548828125, 14.576171875, 15.02685546875, 15.4775390625, 15.92822265625, 16.37890625, 16.82958984375, 17.2802734375, 17.73095703125, 18.181640625, 18.63232421875, 19.0830078125, 19.53369140625, 19.984375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 10.0, 16.0, 23.0, 20.0, 24.0, 49.0, 56.0, 92.0, 108.0, 166.0, 296.0, 609.0, 1472.0, 434.0, 235.0, 131.0, 98.0, 72.0, 33.0, 24.0, 22.0, 16.0, 17.0, 11.0, 5.0, 10.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4267578125, -1.3725128173828125, -1.318267822265625, -1.2640228271484375, -1.20977783203125, -1.1555328369140625, -1.101287841796875, -1.0470428466796875, -0.9927978515625, -0.9385528564453125, -0.884307861328125, -0.8300628662109375, -0.77581787109375, -0.7215728759765625, -0.667327880859375, -0.6130828857421875, -0.558837890625, -0.5045928955078125, -0.450347900390625, -0.3961029052734375, -0.34185791015625, -0.2876129150390625, -0.233367919921875, -0.1791229248046875, -0.1248779296875, -0.0706329345703125, -0.016387939453125, 0.0378570556640625, 0.09210205078125, 0.1463470458984375, 0.200592041015625, 0.2548370361328125, 0.30908203125, 0.3633270263671875, 0.417572021484375, 0.4718170166015625, 0.52606201171875, 0.5803070068359375, 0.634552001953125, 0.6887969970703125, 0.7430419921875, 0.7972869873046875, 0.851531982421875, 0.9057769775390625, 0.96002197265625, 1.0142669677734375, 1.068511962890625, 1.1227569580078125, 1.177001953125, 1.2312469482421875, 1.285491943359375, 1.3397369384765625, 1.39398193359375, 1.4482269287109375, 1.502471923828125, 1.5567169189453125, 1.6109619140625, 1.6652069091796875, 1.719451904296875, 1.7736968994140625, 1.82794189453125, 1.8821868896484375, 1.936431884765625, 1.9906768798828125, 2.044921875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 12.0, 71.0, 234.0, 401.0, 210.0, 58.0, 21.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.905574798583984, -61.66053771972656, -60.415504455566406, -59.170467376708984, -57.92543029785156, -56.68039321899414, -55.435359954833984, -54.19032287597656, -52.94528579711914, -51.70024871826172, -50.45521545410156, -49.21017837524414, -47.96514129638672, -46.7201042175293, -45.47507095336914, -44.23003387451172, -42.98500061035156, -41.73996353149414, -40.494930267333984, -39.24989318847656, -38.00485610961914, -36.75981903076172, -35.51478576660156, -34.26974868774414, -33.02471160888672, -31.77967643737793, -30.534639358520508, -29.28960418701172, -28.044567108154297, -26.799531936645508, -25.55449676513672, -24.309459686279297, -23.064420700073242, -21.819385528564453, -20.57434844970703, -19.329313278198242, -18.08427619934082, -16.83924102783203, -15.594204902648926, -14.34916877746582, -13.104132652282715, -11.85909652709961, -10.614060401916504, -9.369024276733398, -8.12398910522461, -6.878952503204346, -5.633916854858398, -4.388880729675293, -3.1438446044921875, -1.8988085985183716, -0.6537725925445557, 0.5912632942199707, 1.8362994194030762, 3.0813355445861816, 4.326371192932129, 5.571407318115234, 6.81644344329834, 8.061479568481445, 9.30651569366455, 10.551551818847656, 11.796586990356445, 13.041624069213867, 14.286659240722656, 15.531695365905762, 16.776731491088867]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 4.0, 11.0, 11.0, 11.0, 23.0, 21.0, 27.0, 26.0, 27.0, 42.0, 37.0, 43.0, 46.0, 61.0, 59.0, 48.0, 49.0, 44.0, 47.0, 44.0, 38.0, 33.0, 44.0, 21.0, 37.0, 27.0, 18.0, 26.0, 18.0, 9.0, 8.0, 13.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-8.264930725097656, -8.04144287109375, -7.81795597076416, -7.594468116760254, -7.370980739593506, -7.147493362426758, -6.92400598526001, -6.700518608093262, -6.4770307540893555, -6.253543376922607, -6.030055999755859, -5.806568145751953, -5.583080768585205, -5.359593391418457, -5.136106014251709, -4.912618637084961, -4.689131259918213, -4.465643882751465, -4.242156505584717, -4.018669128417969, -3.7951812744140625, -3.5716938972473145, -3.3482065200805664, -3.1247191429138184, -2.901231527328491, -2.677744150161743, -2.454256534576416, -2.230769157409668, -2.00728178024292, -1.7837941646575928, -1.5603067874908447, -1.3368192911148071, -1.1133317947387695, -0.8898442983627319, -0.6663568615913391, -0.4428694248199463, -0.2193819284439087, 0.004105567932128906, 0.22759294509887695, 0.45108044147491455, 0.6745679378509521, 0.8980554342269897, 1.1215429306030273, 1.3450303077697754, 1.568517804145813, 1.7920053005218506, 2.0154926776885986, 2.238980293273926, 2.462467670440674, 2.685955047607422, 2.909442663192749, 3.132930040359497, 3.356417655944824, 3.5799050331115723, 3.8033924102783203, 4.026879787445068, 4.250367164611816, 4.4738545417785645, 4.6973419189453125, 4.920829772949219, 5.144317150115967, 5.367804527282715, 5.591291904449463, 5.814779281616211, 6.038267135620117]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 8.0, 8.0, 11.0, 15.0, 19.0, 34.0, 60.0, 83.0, 113.0, 202.0, 350.0, 583.0, 1007.0, 1922.0, 3998.0, 9053.0, 20910.0, 51370.0, 122378.0, 262399.0, 301472.0, 157246.0, 65869.0, 27419.0, 11660.0, 5020.0, 2397.0, 1254.0, 673.0, 387.0, 212.0, 136.0, 105.0, 60.0, 36.0, 17.0, 22.0, 17.0, 7.0, 11.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.65985107421875, -3.5384521484375, -3.41705322265625, -3.295654296875, -3.17425537109375, -3.0528564453125, -2.93145751953125, -2.81005859375, -2.68865966796875, -2.5672607421875, -2.44586181640625, -2.324462890625, -2.20306396484375, -2.0816650390625, -1.96026611328125, -1.8388671875, -1.71746826171875, -1.5960693359375, -1.47467041015625, -1.353271484375, -1.23187255859375, -1.1104736328125, -0.98907470703125, -0.86767578125, -0.74627685546875, -0.6248779296875, -0.50347900390625, -0.382080078125, -0.26068115234375, -0.1392822265625, -0.01788330078125, 0.103515625, 0.22491455078125, 0.3463134765625, 0.46771240234375, 0.589111328125, 0.71051025390625, 0.8319091796875, 0.95330810546875, 1.07470703125, 1.19610595703125, 1.3175048828125, 1.43890380859375, 1.560302734375, 1.68170166015625, 1.8031005859375, 1.92449951171875, 2.0458984375, 2.16729736328125, 2.2886962890625, 2.41009521484375, 2.531494140625, 2.65289306640625, 2.7742919921875, 2.89569091796875, 3.01708984375, 3.13848876953125, 3.2598876953125, 3.38128662109375, 3.502685546875, 3.62408447265625, 3.7454833984375, 3.86688232421875, 3.98828125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 2.0, 12.0, 10.0, 16.0, 15.0, 20.0, 20.0, 25.0, 34.0, 44.0, 48.0, 53.0, 59.0, 48.0, 67.0, 66.0, 61.0, 68.0, 45.0, 58.0, 35.0, 40.0, 21.0, 22.0, 23.0, 16.0, 16.0, 13.0, 7.0, 3.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486083984375, -0.4683723449707031, -0.45066070556640625, -0.4329490661621094, -0.4152374267578125, -0.3975257873535156, -0.37981414794921875, -0.3621025085449219, -0.344390869140625, -0.3266792297363281, -0.30896759033203125, -0.2912559509277344, -0.2735443115234375, -0.2558326721191406, -0.23812103271484375, -0.22040939331054688, -0.20269775390625, -0.18498611450195312, -0.16727447509765625, -0.14956283569335938, -0.1318511962890625, -0.11413955688476562, -0.09642791748046875, -0.07871627807617188, -0.061004638671875, -0.043292999267578125, -0.02558135986328125, -0.007869720458984375, 0.0098419189453125, 0.027553558349609375, 0.04526519775390625, 0.06297683715820312, 0.0806884765625, 0.09840011596679688, 0.11611175537109375, 0.13382339477539062, 0.1515350341796875, 0.16924667358398438, 0.18695831298828125, 0.20466995239257812, 0.222381591796875, 0.24009323120117188, 0.25780487060546875, 0.2755165100097656, 0.2932281494140625, 0.3109397888183594, 0.32865142822265625, 0.3463630676269531, 0.36407470703125, 0.3817863464355469, 0.39949798583984375, 0.4172096252441406, 0.4349212646484375, 0.4526329040527344, 0.47034454345703125, 0.4880561828613281, 0.505767822265625, 0.5234794616699219, 0.5411911010742188, 0.5589027404785156, 0.5766143798828125, 0.5943260192871094, 0.6120376586914062, 0.6297492980957031, 0.6474609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 6.0, 13.0, 12.0, 21.0, 22.0, 34.0, 46.0, 61.0, 100.0, 135.0, 214.0, 373.0, 593.0, 1251.0, 2607.0, 6356.0, 18273.0, 58662.0, 207723.0, 467849.0, 198442.0, 56867.0, 17385.0, 6264.0, 2485.0, 1146.0, 592.0, 362.0, 233.0, 143.0, 97.0, 51.0, 25.0, 29.0, 30.0, 23.0, 5.0, 11.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.34765625, -6.1580810546875, -5.968505859375, -5.7789306640625, -5.58935546875, -5.3997802734375, -5.210205078125, -5.0206298828125, -4.8310546875, -4.6414794921875, -4.451904296875, -4.2623291015625, -4.07275390625, -3.8831787109375, -3.693603515625, -3.5040283203125, -3.314453125, -3.1248779296875, -2.935302734375, -2.7457275390625, -2.55615234375, -2.3665771484375, -2.177001953125, -1.9874267578125, -1.7978515625, -1.6082763671875, -1.418701171875, -1.2291259765625, -1.03955078125, -0.8499755859375, -0.660400390625, -0.4708251953125, -0.28125, -0.0916748046875, 0.097900390625, 0.2874755859375, 0.47705078125, 0.6666259765625, 0.856201171875, 1.0457763671875, 1.2353515625, 1.4249267578125, 1.614501953125, 1.8040771484375, 1.99365234375, 2.1832275390625, 2.372802734375, 2.5623779296875, 2.751953125, 2.9415283203125, 3.131103515625, 3.3206787109375, 3.51025390625, 3.6998291015625, 3.889404296875, 4.0789794921875, 4.2685546875, 4.4581298828125, 4.647705078125, 4.8372802734375, 5.02685546875, 5.2164306640625, 5.406005859375, 5.5955810546875, 5.78515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 1.0, 7.0, 4.0, 10.0, 6.0, 10.0, 14.0, 14.0, 12.0, 17.0, 24.0, 25.0, 29.0, 32.0, 35.0, 39.0, 33.0, 53.0, 47.0, 50.0, 43.0, 52.0, 44.0, 45.0, 41.0, 37.0, 31.0, 42.0, 41.0, 21.0, 18.0, 21.0, 11.0, 18.0, 9.0, 18.0, 14.0, 6.0, 11.0, 7.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.078125, -2.98199462890625, -2.8858642578125, -2.78973388671875, -2.693603515625, -2.59747314453125, -2.5013427734375, -2.40521240234375, -2.30908203125, -2.21295166015625, -2.1168212890625, -2.02069091796875, -1.924560546875, -1.82843017578125, -1.7322998046875, -1.63616943359375, -1.5400390625, -1.44390869140625, -1.3477783203125, -1.25164794921875, -1.155517578125, -1.05938720703125, -0.9632568359375, -0.86712646484375, -0.77099609375, -0.67486572265625, -0.5787353515625, -0.48260498046875, -0.386474609375, -0.29034423828125, -0.1942138671875, -0.09808349609375, -0.001953125, 0.09417724609375, 0.1903076171875, 0.28643798828125, 0.382568359375, 0.47869873046875, 0.5748291015625, 0.67095947265625, 0.76708984375, 0.86322021484375, 0.9593505859375, 1.05548095703125, 1.151611328125, 1.24774169921875, 1.3438720703125, 1.44000244140625, 1.5361328125, 1.63226318359375, 1.7283935546875, 1.82452392578125, 1.920654296875, 2.01678466796875, 2.1129150390625, 2.20904541015625, 2.30517578125, 2.40130615234375, 2.4974365234375, 2.59356689453125, 2.689697265625, 2.78582763671875, 2.8819580078125, 2.97808837890625, 3.07421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 8.0, 7.0, 7.0, 11.0, 12.0, 15.0, 26.0, 34.0, 38.0, 67.0, 90.0, 135.0, 158.0, 286.0, 421.0, 614.0, 1155.0, 2082.0, 3970.0, 7746.0, 16529.0, 37414.0, 93332.0, 252051.0, 361576.0, 160579.0, 60618.0, 25324.0, 11618.0, 5670.0, 2861.0, 1567.0, 840.0, 516.0, 383.0, 248.0, 161.0, 97.0, 61.0, 52.0, 34.0, 30.0, 21.0, 23.0, 19.0, 10.0, 9.0, 7.0, 3.0, 6.0, 3.0, 3.0, 4.0, 1.0, 5.0], "bins": [-2.583984375, -2.506317138671875, -2.42864990234375, -2.350982666015625, -2.2733154296875, -2.195648193359375, -2.11798095703125, -2.040313720703125, -1.962646484375, -1.884979248046875, -1.80731201171875, -1.729644775390625, -1.6519775390625, -1.574310302734375, -1.49664306640625, -1.418975830078125, -1.34130859375, -1.263641357421875, -1.18597412109375, -1.108306884765625, -1.0306396484375, -0.952972412109375, -0.87530517578125, -0.797637939453125, -0.719970703125, -0.642303466796875, -0.56463623046875, -0.486968994140625, -0.4093017578125, -0.331634521484375, -0.25396728515625, -0.176300048828125, -0.0986328125, -0.020965576171875, 0.05670166015625, 0.134368896484375, 0.2120361328125, 0.289703369140625, 0.36737060546875, 0.445037841796875, 0.522705078125, 0.600372314453125, 0.67803955078125, 0.755706787109375, 0.8333740234375, 0.911041259765625, 0.98870849609375, 1.066375732421875, 1.14404296875, 1.221710205078125, 1.29937744140625, 1.377044677734375, 1.4547119140625, 1.532379150390625, 1.61004638671875, 1.687713623046875, 1.765380859375, 1.843048095703125, 1.92071533203125, 1.998382568359375, 2.0760498046875, 2.153717041015625, 2.23138427734375, 2.309051513671875, 2.38671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 11.0, 9.0, 10.0, 12.0, 24.0, 24.0, 32.0, 49.0, 53.0, 78.0, 105.0, 109.0, 105.0, 66.0, 62.0, 65.0, 29.0, 30.0, 22.0, 29.0, 13.0, 7.0, 10.0, 7.0, 6.0, 5.0, 7.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005450248718261719, -0.0005292855203151703, -0.0005135461688041687, -0.0004978068172931671, -0.00048206746578216553, -0.00046632811427116394, -0.00045058876276016235, -0.00043484941124916077, -0.0004191100597381592, -0.0004033707082271576, -0.000387631356716156, -0.0003718920052051544, -0.00035615265369415283, -0.00034041330218315125, -0.00032467395067214966, -0.00030893459916114807, -0.0002931952476501465, -0.0002774558961391449, -0.0002617165446281433, -0.0002459771931171417, -0.00023023784160614014, -0.00021449849009513855, -0.00019875913858413696, -0.00018301978707313538, -0.0001672804355621338, -0.0001515410840511322, -0.00013580173254013062, -0.00012006238102912903, -0.00010432302951812744, -8.858367800712585e-05, -7.284432649612427e-05, -5.710497498512268e-05, -4.1365623474121094e-05, -2.5626271963119507e-05, -9.88692045211792e-06, 5.852431058883667e-06, 2.1591782569885254e-05, 3.733113408088684e-05, 5.307048559188843e-05, 6.880983710289001e-05, 8.45491886138916e-05, 0.00010028854012489319, 0.00011602789163589478, 0.00013176724314689636, 0.00014750659465789795, 0.00016324594616889954, 0.00017898529767990112, 0.0001947246491909027, 0.0002104640007019043, 0.00022620335221290588, 0.00024194270372390747, 0.00025768205523490906, 0.00027342140674591064, 0.00028916075825691223, 0.0003049001097679138, 0.0003206394612789154, 0.000336378812789917, 0.0003521181643009186, 0.00036785751581192017, 0.00038359686732292175, 0.00039933621883392334, 0.0004150755703449249, 0.0004308149218559265, 0.0004465542733669281, 0.0004622936248779297]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 10.0, 5.0, 7.0, 8.0, 32.0, 26.0, 35.0, 68.0, 97.0, 190.0, 260.0, 438.0, 852.0, 1650.0, 3754.0, 9921.0, 30544.0, 122104.0, 527358.0, 266120.0, 57143.0, 16941.0, 5855.0, 2455.0, 1167.0, 570.0, 342.0, 203.0, 127.0, 88.0, 63.0, 41.0, 30.0, 20.0, 9.0, 5.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-5.29296875, -5.148895263671875, -5.00482177734375, -4.860748291015625, -4.7166748046875, -4.572601318359375, -4.42852783203125, -4.284454345703125, -4.140380859375, -3.996307373046875, -3.85223388671875, -3.708160400390625, -3.5640869140625, -3.420013427734375, -3.27593994140625, -3.131866455078125, -2.98779296875, -2.843719482421875, -2.69964599609375, -2.555572509765625, -2.4114990234375, -2.267425537109375, -2.12335205078125, -1.979278564453125, -1.835205078125, -1.691131591796875, -1.54705810546875, -1.402984619140625, -1.2589111328125, -1.114837646484375, -0.97076416015625, -0.826690673828125, -0.6826171875, -0.538543701171875, -0.39447021484375, -0.250396728515625, -0.1063232421875, 0.037750244140625, 0.18182373046875, 0.325897216796875, 0.469970703125, 0.614044189453125, 0.75811767578125, 0.902191162109375, 1.0462646484375, 1.190338134765625, 1.33441162109375, 1.478485107421875, 1.62255859375, 1.766632080078125, 1.91070556640625, 2.054779052734375, 2.1988525390625, 2.342926025390625, 2.48699951171875, 2.631072998046875, 2.775146484375, 2.919219970703125, 3.06329345703125, 3.207366943359375, 3.3514404296875, 3.495513916015625, 3.63958740234375, 3.783660888671875, 3.927734375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 3.0, 4.0, 5.0, 7.0, 9.0, 11.0, 22.0, 24.0, 34.0, 43.0, 36.0, 46.0, 60.0, 68.0, 59.0, 67.0, 60.0, 71.0, 52.0, 51.0, 41.0, 25.0, 24.0, 22.0, 23.0, 16.0, 13.0, 17.0, 11.0, 8.0, 10.0, 7.0, 6.0, 7.0, 5.0, 5.0, 4.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.072265625, -2.0130462646484375, -1.953826904296875, -1.8946075439453125, -1.83538818359375, -1.7761688232421875, -1.716949462890625, -1.6577301025390625, -1.5985107421875, -1.5392913818359375, -1.480072021484375, -1.4208526611328125, -1.36163330078125, -1.3024139404296875, -1.243194580078125, -1.1839752197265625, -1.124755859375, -1.0655364990234375, -1.006317138671875, -0.9470977783203125, -0.88787841796875, -0.8286590576171875, -0.769439697265625, -0.7102203369140625, -0.6510009765625, -0.5917816162109375, -0.532562255859375, -0.4733428955078125, -0.41412353515625, -0.3549041748046875, -0.295684814453125, -0.2364654541015625, -0.17724609375, -0.1180267333984375, -0.058807373046875, 0.0004119873046875, 0.05963134765625, 0.1188507080078125, 0.178070068359375, 0.2372894287109375, 0.2965087890625, 0.3557281494140625, 0.414947509765625, 0.4741668701171875, 0.53338623046875, 0.5926055908203125, 0.651824951171875, 0.7110443115234375, 0.770263671875, 0.8294830322265625, 0.888702392578125, 0.9479217529296875, 1.00714111328125, 1.0663604736328125, 1.125579833984375, 1.1847991943359375, 1.2440185546875, 1.3032379150390625, 1.362457275390625, 1.4216766357421875, 1.48089599609375, 1.5401153564453125, 1.599334716796875, 1.6585540771484375, 1.7177734375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 12.0, 15.0, 53.0, 109.0, 237.0, 228.0, 181.0, 97.0, 39.0, 20.0, 8.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.669189453125, -103.43450927734375, -101.1998291015625, -98.96514892578125, -96.73046875, -94.49578857421875, -92.2611083984375, -90.02642822265625, -87.791748046875, -85.55706787109375, -83.3223876953125, -81.08770751953125, -78.85302734375, -76.61834716796875, -74.3836669921875, -72.14898681640625, -69.914306640625, -67.67962646484375, -65.4449462890625, -63.21026611328125, -60.9755859375, -58.74090576171875, -56.5062255859375, -54.27154541015625, -52.03685760498047, -49.80217742919922, -47.56749725341797, -45.33281707763672, -43.09813690185547, -40.86345672607422, -38.62877655029297, -36.39409637451172, -34.15941619873047, -31.92473602294922, -29.69005584716797, -27.45537567138672, -25.22069549560547, -22.98601531982422, -20.751333236694336, -18.516653060913086, -16.281972885131836, -14.047292709350586, -11.812612533569336, -9.57793140411377, -7.3432512283325195, -5.1085710525512695, -2.873889923095703, -0.6392097473144531, 1.5954704284667969, 3.830150842666626, 6.064831256866455, 8.299511909484863, 10.534192085266113, 12.768872261047363, 15.00355339050293, 17.23823356628418, 19.47291374206543, 21.70759391784668, 23.94227409362793, 26.176956176757812, 28.411636352539062, 30.646316528320312, 32.88099670410156, 35.11567687988281, 37.35035705566406]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 5.0, 8.0, 10.0, 8.0, 10.0, 15.0, 5.0, 20.0, 18.0, 17.0, 24.0, 37.0, 28.0, 30.0, 29.0, 29.0, 40.0, 36.0, 42.0, 36.0, 37.0, 42.0, 40.0, 29.0, 33.0, 52.0, 37.0, 37.0, 27.0, 30.0, 28.0, 21.0, 24.0, 19.0, 13.0, 19.0, 10.0, 9.0, 7.0, 7.0, 5.0, 9.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-20.03070068359375, -19.401100158691406, -18.771501541137695, -18.14190101623535, -17.51230239868164, -16.882701873779297, -16.253101348876953, -15.623502731323242, -14.993902206420898, -14.364302635192871, -13.734703063964844, -13.1051025390625, -12.475502967834473, -11.845903396606445, -11.216303825378418, -10.58670425415039, -9.957104682922363, -9.327505111694336, -8.697905540466309, -8.068305969238281, -7.4387054443359375, -6.80910587310791, -6.179506301879883, -5.549906253814697, -4.92030668258667, -4.290707111358643, -3.661107063293457, -3.0315074920654297, -2.4019076824188232, -1.7723078727722168, -1.1427083015441895, -0.5131082534790039, 0.11649131774902344, 0.7460910677909851, 1.3756908178329468, 2.0052905082702637, 2.63489031791687, 3.2644901275634766, 3.894089698791504, 4.5236897468566895, 5.153289318084717, 5.782888889312744, 6.41248893737793, 7.042088508605957, 7.671688079833984, 8.301288604736328, 8.930887222290039, 9.560487747192383, 10.19008731842041, 10.819686889648438, 11.449286460876465, 12.078886032104492, 12.708486557006836, 13.338086128234863, 13.96768569946289, 14.597286224365234, 15.226884841918945, 15.856484413146973, 16.486083984375, 17.115684509277344, 17.745283126831055, 18.3748836517334, 19.00448226928711, 19.634082794189453, 20.263683319091797]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 7.0, 9.0, 21.0, 19.0, 39.0, 50.0, 92.0, 188.0, 359.0, 660.0, 1501.0, 3479.0, 9142.0, 29876.0, 137185.0, 3555667.0, 374178.0, 56739.0, 15748.0, 5286.0, 2141.0, 903.0, 426.0, 224.0, 125.0, 76.0, 56.0, 30.0, 21.0, 8.0, 12.0, 8.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6640625, -4.4493408203125, -4.234619140625, -4.0198974609375, -3.80517578125, -3.5904541015625, -3.375732421875, -3.1610107421875, -2.9462890625, -2.7315673828125, -2.516845703125, -2.3021240234375, -2.08740234375, -1.8726806640625, -1.657958984375, -1.4432373046875, -1.228515625, -1.0137939453125, -0.799072265625, -0.5843505859375, -0.36962890625, -0.1549072265625, 0.059814453125, 0.2745361328125, 0.4892578125, 0.7039794921875, 0.918701171875, 1.1334228515625, 1.34814453125, 1.5628662109375, 1.777587890625, 1.9923095703125, 2.20703125, 2.4217529296875, 2.636474609375, 2.8511962890625, 3.06591796875, 3.2806396484375, 3.495361328125, 3.7100830078125, 3.9248046875, 4.1395263671875, 4.354248046875, 4.5689697265625, 4.78369140625, 4.9984130859375, 5.213134765625, 5.4278564453125, 5.642578125, 5.8572998046875, 6.072021484375, 6.2867431640625, 6.50146484375, 6.7161865234375, 6.930908203125, 7.1456298828125, 7.3603515625, 7.5750732421875, 7.789794921875, 8.0045166015625, 8.21923828125, 8.4339599609375, 8.648681640625, 8.8634033203125, 9.078125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 10.0, 13.0, 6.0, 15.0, 15.0, 26.0, 30.0, 42.0, 41.0, 59.0, 67.0, 66.0, 73.0, 68.0, 60.0, 47.0, 69.0, 46.0, 47.0, 41.0, 27.0, 27.0, 30.0, 19.0, 12.0, 11.0, 8.0, 10.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.69775390625, -0.6742095947265625, -0.650665283203125, -0.6271209716796875, -0.60357666015625, -0.5800323486328125, -0.556488037109375, -0.5329437255859375, -0.5093994140625, -0.4858551025390625, -0.462310791015625, -0.4387664794921875, -0.41522216796875, -0.3916778564453125, -0.368133544921875, -0.3445892333984375, -0.321044921875, -0.2975006103515625, -0.273956298828125, -0.2504119873046875, -0.22686767578125, -0.2033233642578125, -0.179779052734375, -0.1562347412109375, -0.1326904296875, -0.1091461181640625, -0.085601806640625, -0.0620574951171875, -0.03851318359375, -0.0149688720703125, 0.008575439453125, 0.0321197509765625, 0.0556640625, 0.0792083740234375, 0.102752685546875, 0.1262969970703125, 0.14984130859375, 0.1733856201171875, 0.196929931640625, 0.2204742431640625, 0.2440185546875, 0.2675628662109375, 0.291107177734375, 0.3146514892578125, 0.33819580078125, 0.3617401123046875, 0.385284423828125, 0.4088287353515625, 0.432373046875, 0.4559173583984375, 0.479461669921875, 0.5030059814453125, 0.52655029296875, 0.5500946044921875, 0.573638916015625, 0.5971832275390625, 0.6207275390625, 0.6442718505859375, 0.667816162109375, 0.6913604736328125, 0.71490478515625, 0.7384490966796875, 0.761993408203125, 0.7855377197265625, 0.80908203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 2.0, 6.0, 11.0, 19.0, 36.0, 66.0, 100.0, 182.0, 336.0, 606.0, 1143.0, 2390.0, 5661.0, 15182.0, 50163.0, 261642.0, 3442219.0, 330629.0, 56580.0, 15991.0, 5967.0, 2529.0, 1326.0, 685.0, 345.0, 201.0, 120.0, 62.0, 27.0, 22.0, 16.0, 8.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59765625, -5.37860107421875, -5.1595458984375, -4.94049072265625, -4.721435546875, -4.50238037109375, -4.2833251953125, -4.06427001953125, -3.84521484375, -3.62615966796875, -3.4071044921875, -3.18804931640625, -2.968994140625, -2.74993896484375, -2.5308837890625, -2.31182861328125, -2.0927734375, -1.87371826171875, -1.6546630859375, -1.43560791015625, -1.216552734375, -0.99749755859375, -0.7784423828125, -0.55938720703125, -0.34033203125, -0.12127685546875, 0.0977783203125, 0.31683349609375, 0.535888671875, 0.75494384765625, 0.9739990234375, 1.19305419921875, 1.412109375, 1.63116455078125, 1.8502197265625, 2.06927490234375, 2.288330078125, 2.50738525390625, 2.7264404296875, 2.94549560546875, 3.16455078125, 3.38360595703125, 3.6026611328125, 3.82171630859375, 4.040771484375, 4.25982666015625, 4.4788818359375, 4.69793701171875, 4.9169921875, 5.13604736328125, 5.3551025390625, 5.57415771484375, 5.793212890625, 6.01226806640625, 6.2313232421875, 6.45037841796875, 6.66943359375, 6.88848876953125, 7.1075439453125, 7.32659912109375, 7.545654296875, 7.76470947265625, 7.9837646484375, 8.20281982421875, 8.421875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 3.0, 5.0, 5.0, 8.0, 15.0, 15.0, 21.0, 24.0, 34.0, 40.0, 56.0, 94.0, 125.0, 232.0, 487.0, 1798.0, 486.0, 210.0, 130.0, 88.0, 54.0, 43.0, 15.0, 16.0, 22.0, 6.0, 7.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.7412109375, -1.692108154296875, -1.64300537109375, -1.593902587890625, -1.5447998046875, -1.495697021484375, -1.44659423828125, -1.397491455078125, -1.348388671875, -1.299285888671875, -1.25018310546875, -1.201080322265625, -1.1519775390625, -1.102874755859375, -1.05377197265625, -1.004669189453125, -0.95556640625, -0.906463623046875, -0.85736083984375, -0.808258056640625, -0.7591552734375, -0.710052490234375, -0.66094970703125, -0.611846923828125, -0.562744140625, -0.513641357421875, -0.46453857421875, -0.415435791015625, -0.3663330078125, -0.317230224609375, -0.26812744140625, -0.219024658203125, -0.169921875, -0.120819091796875, -0.07171630859375, -0.022613525390625, 0.0264892578125, 0.075592041015625, 0.12469482421875, 0.173797607421875, 0.222900390625, 0.272003173828125, 0.32110595703125, 0.370208740234375, 0.4193115234375, 0.468414306640625, 0.51751708984375, 0.566619873046875, 0.61572265625, 0.664825439453125, 0.71392822265625, 0.763031005859375, 0.8121337890625, 0.861236572265625, 0.91033935546875, 0.959442138671875, 1.008544921875, 1.057647705078125, 1.10675048828125, 1.155853271484375, 1.2049560546875, 1.254058837890625, 1.30316162109375, 1.352264404296875, 1.4013671875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 6.0, 7.0, 12.0, 12.0, 17.0, 15.0, 40.0, 59.0, 84.0, 87.0, 128.0, 122.0, 95.0, 75.0, 75.0, 57.0, 38.0, 24.0, 20.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.787405014038086, -8.515711784362793, -8.2440185546875, -7.972325325012207, -7.700632095336914, -7.428938865661621, -7.157245635986328, -6.885552406311035, -6.613859176635742, -6.342165946960449, -6.070472717285156, -5.798779487609863, -5.52708625793457, -5.255393028259277, -4.983699798583984, -4.712006568908691, -4.440313339233398, -4.1686201095581055, -3.8969268798828125, -3.6252336502075195, -3.3535404205322266, -3.0818471908569336, -2.8101539611816406, -2.5384607315063477, -2.2667675018310547, -1.9950742721557617, -1.7233810424804688, -1.4516878128051758, -1.1799945831298828, -0.9083013534545898, -0.6366081237792969, -0.3649148941040039, -0.09322166442871094, 0.17847156524658203, 0.450164794921875, 0.721858024597168, 0.9935512542724609, 1.265244483947754, 1.5369377136230469, 1.8086309432983398, 2.080324172973633, 2.352017402648926, 2.6237106323242188, 2.8954038619995117, 3.1670970916748047, 3.4387903213500977, 3.7104835510253906, 3.9821767807006836, 4.253870010375977, 4.5255632400512695, 4.7972564697265625, 5.0689496994018555, 5.340642929077148, 5.612336158752441, 5.884029388427734, 6.155722618103027, 6.42741584777832, 6.699109077453613, 6.970802307128906, 7.242495536804199, 7.514188766479492, 7.785881996154785, 8.057575225830078, 8.329268455505371, 8.600961685180664]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 4.0, 9.0, 10.0, 16.0, 15.0, 19.0, 26.0, 21.0, 31.0, 30.0, 37.0, 41.0, 45.0, 49.0, 46.0, 40.0, 65.0, 47.0, 63.0, 52.0, 56.0, 47.0, 38.0, 34.0, 35.0, 30.0, 23.0, 10.0, 17.0, 9.0, 10.0, 8.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.989559650421143, -6.79185676574707, -6.594154357910156, -6.396451473236084, -6.198748588562012, -6.001046180725098, -5.803343296051025, -5.605640411376953, -5.407938003540039, -5.210235118865967, -5.012532711029053, -4.8148298263549805, -4.617127418518066, -4.419424533843994, -4.221721649169922, -4.024019241333008, -3.8263163566589355, -3.6286137104034424, -3.430911064147949, -3.233208179473877, -3.035505533218384, -2.8378028869628906, -2.6401000022888184, -2.442397356033325, -2.244694709777832, -2.046992063522339, -1.8492892980575562, -1.6515865325927734, -1.4538838863372803, -1.256181240081787, -1.0584784746170044, -0.8607757091522217, -0.6630735397338867, -0.4653708338737488, -0.26766812801361084, -0.0699654221534729, 0.12773728370666504, 0.325439989566803, 0.5231426954269409, 0.7208454608917236, 0.9185481071472168, 1.11625075340271, 1.3139535188674927, 1.5116562843322754, 1.7093589305877686, 1.9070615768432617, 2.104764461517334, 2.302467107772827, 2.5001697540283203, 2.6978724002838135, 2.8955750465393066, 3.093277931213379, 3.290980577468872, 3.4886832237243652, 3.6863861083984375, 3.8840887546539307, 4.081791400909424, 4.279494285583496, 4.47719669342041, 4.674899578094482, 4.872602462768555, 5.070304870605469, 5.268007755279541, 5.465710639953613, 5.663413047790527]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 18.0, 21.0, 27.0, 37.0, 62.0, 71.0, 125.0, 162.0, 274.0, 386.0, 658.0, 976.0, 1515.0, 2417.0, 3992.0, 6942.0, 11688.0, 20836.0, 36588.0, 64182.0, 110688.0, 184990.0, 228554.0, 156817.0, 92048.0, 52841.0, 29915.0, 17029.0, 9817.0, 5638.0, 3469.0, 2006.0, 1337.0, 848.0, 530.0, 337.0, 234.0, 136.0, 117.0, 68.0, 52.0, 31.0, 19.0, 13.0, 16.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.125, -2.054931640625, -1.98486328125, -1.914794921875, -1.8447265625, -1.774658203125, -1.70458984375, -1.634521484375, -1.564453125, -1.494384765625, -1.42431640625, -1.354248046875, -1.2841796875, -1.214111328125, -1.14404296875, -1.073974609375, -1.00390625, -0.933837890625, -0.86376953125, -0.793701171875, -0.7236328125, -0.653564453125, -0.58349609375, -0.513427734375, -0.443359375, -0.373291015625, -0.30322265625, -0.233154296875, -0.1630859375, -0.093017578125, -0.02294921875, 0.047119140625, 0.1171875, 0.187255859375, 0.25732421875, 0.327392578125, 0.3974609375, 0.467529296875, 0.53759765625, 0.607666015625, 0.677734375, 0.747802734375, 0.81787109375, 0.887939453125, 0.9580078125, 1.028076171875, 1.09814453125, 1.168212890625, 1.23828125, 1.308349609375, 1.37841796875, 1.448486328125, 1.5185546875, 1.588623046875, 1.65869140625, 1.728759765625, 1.798828125, 1.868896484375, 1.93896484375, 2.009033203125, 2.0791015625, 2.149169921875, 2.21923828125, 2.289306640625, 2.359375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 7.0, 7.0, 15.0, 13.0, 23.0, 33.0, 30.0, 42.0, 39.0, 48.0, 45.0, 50.0, 69.0, 67.0, 55.0, 55.0, 60.0, 38.0, 45.0, 34.0, 34.0, 29.0, 24.0, 31.0, 19.0, 12.0, 11.0, 12.0, 16.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57958984375, -0.558258056640625, -0.53692626953125, -0.515594482421875, -0.4942626953125, -0.472930908203125, -0.45159912109375, -0.430267333984375, -0.408935546875, -0.387603759765625, -0.36627197265625, -0.344940185546875, -0.3236083984375, -0.302276611328125, -0.28094482421875, -0.259613037109375, -0.23828125, -0.216949462890625, -0.19561767578125, -0.174285888671875, -0.1529541015625, -0.131622314453125, -0.11029052734375, -0.088958740234375, -0.067626953125, -0.046295166015625, -0.02496337890625, -0.003631591796875, 0.0177001953125, 0.039031982421875, 0.06036376953125, 0.081695556640625, 0.10302734375, 0.124359130859375, 0.14569091796875, 0.167022705078125, 0.1883544921875, 0.209686279296875, 0.23101806640625, 0.252349853515625, 0.273681640625, 0.295013427734375, 0.31634521484375, 0.337677001953125, 0.3590087890625, 0.380340576171875, 0.40167236328125, 0.423004150390625, 0.4443359375, 0.465667724609375, 0.48699951171875, 0.508331298828125, 0.5296630859375, 0.550994873046875, 0.57232666015625, 0.593658447265625, 0.614990234375, 0.636322021484375, 0.65765380859375, 0.678985595703125, 0.7003173828125, 0.721649169921875, 0.74298095703125, 0.764312744140625, 0.78564453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 4.0, 4.0, 5.0, 14.0, 22.0, 18.0, 40.0, 40.0, 58.0, 81.0, 131.0, 184.0, 285.0, 474.0, 773.0, 1575.0, 3396.0, 8086.0, 21642.0, 64453.0, 196837.0, 409500.0, 225171.0, 73960.0, 24881.0, 9120.0, 3806.0, 1669.0, 896.0, 495.0, 282.0, 198.0, 146.0, 71.0, 71.0, 52.0, 27.0, 34.0, 16.0, 17.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.48828125, -4.35455322265625, -4.2208251953125, -4.08709716796875, -3.953369140625, -3.81964111328125, -3.6859130859375, -3.55218505859375, -3.41845703125, -3.28472900390625, -3.1510009765625, -3.01727294921875, -2.883544921875, -2.74981689453125, -2.6160888671875, -2.48236083984375, -2.3486328125, -2.21490478515625, -2.0811767578125, -1.94744873046875, -1.813720703125, -1.67999267578125, -1.5462646484375, -1.41253662109375, -1.27880859375, -1.14508056640625, -1.0113525390625, -0.87762451171875, -0.743896484375, -0.61016845703125, -0.4764404296875, -0.34271240234375, -0.208984375, -0.07525634765625, 0.0584716796875, 0.19219970703125, 0.325927734375, 0.45965576171875, 0.5933837890625, 0.72711181640625, 0.86083984375, 0.99456787109375, 1.1282958984375, 1.26202392578125, 1.395751953125, 1.52947998046875, 1.6632080078125, 1.79693603515625, 1.9306640625, 2.06439208984375, 2.1981201171875, 2.33184814453125, 2.465576171875, 2.59930419921875, 2.7330322265625, 2.86676025390625, 3.00048828125, 3.13421630859375, 3.2679443359375, 3.40167236328125, 3.535400390625, 3.66912841796875, 3.8028564453125, 3.93658447265625, 4.0703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 10.0, 6.0, 6.0, 9.0, 8.0, 12.0, 11.0, 21.0, 25.0, 29.0, 37.0, 23.0, 41.0, 34.0, 34.0, 59.0, 42.0, 42.0, 47.0, 51.0, 46.0, 50.0, 43.0, 42.0, 34.0, 37.0, 38.0, 21.0, 25.0, 18.0, 18.0, 11.0, 16.0, 7.0, 6.0, 7.0, 11.0, 5.0, 6.0, 3.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.474609375, -3.370208740234375, -3.26580810546875, -3.161407470703125, -3.0570068359375, -2.952606201171875, -2.84820556640625, -2.743804931640625, -2.639404296875, -2.535003662109375, -2.43060302734375, -2.326202392578125, -2.2218017578125, -2.117401123046875, -2.01300048828125, -1.908599853515625, -1.80419921875, -1.699798583984375, -1.59539794921875, -1.490997314453125, -1.3865966796875, -1.282196044921875, -1.17779541015625, -1.073394775390625, -0.968994140625, -0.864593505859375, -0.76019287109375, -0.655792236328125, -0.5513916015625, -0.446990966796875, -0.34259033203125, -0.238189697265625, -0.1337890625, -0.029388427734375, 0.07501220703125, 0.179412841796875, 0.2838134765625, 0.388214111328125, 0.49261474609375, 0.597015380859375, 0.701416015625, 0.805816650390625, 0.91021728515625, 1.014617919921875, 1.1190185546875, 1.223419189453125, 1.32781982421875, 1.432220458984375, 1.53662109375, 1.641021728515625, 1.74542236328125, 1.849822998046875, 1.9542236328125, 2.058624267578125, 2.16302490234375, 2.267425537109375, 2.371826171875, 2.476226806640625, 2.58062744140625, 2.685028076171875, 2.7894287109375, 2.893829345703125, 2.99822998046875, 3.102630615234375, 3.20703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 1.0, 10.0, 8.0, 18.0, 22.0, 26.0, 56.0, 60.0, 131.0, 224.0, 437.0, 818.0, 2020.0, 5405.0, 17848.0, 74585.0, 362971.0, 449504.0, 100202.0, 23164.0, 6661.0, 2303.0, 1014.0, 424.0, 222.0, 140.0, 89.0, 61.0, 43.0, 28.0, 12.0, 10.0, 14.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.321197509765625, -2.23223876953125, -2.143280029296875, -2.0543212890625, -1.965362548828125, -1.87640380859375, -1.787445068359375, -1.698486328125, -1.609527587890625, -1.52056884765625, -1.431610107421875, -1.3426513671875, -1.253692626953125, -1.16473388671875, -1.075775146484375, -0.98681640625, -0.897857666015625, -0.80889892578125, -0.719940185546875, -0.6309814453125, -0.542022705078125, -0.45306396484375, -0.364105224609375, -0.275146484375, -0.186187744140625, -0.09722900390625, -0.008270263671875, 0.0806884765625, 0.169647216796875, 0.25860595703125, 0.347564697265625, 0.4365234375, 0.525482177734375, 0.61444091796875, 0.703399658203125, 0.7923583984375, 0.881317138671875, 0.97027587890625, 1.059234619140625, 1.148193359375, 1.237152099609375, 1.32611083984375, 1.415069580078125, 1.5040283203125, 1.592987060546875, 1.68194580078125, 1.770904541015625, 1.85986328125, 1.948822021484375, 2.03778076171875, 2.126739501953125, 2.2156982421875, 2.304656982421875, 2.39361572265625, 2.482574462890625, 2.571533203125, 2.660491943359375, 2.74945068359375, 2.838409423828125, 2.9273681640625, 3.016326904296875, 3.10528564453125, 3.194244384765625, 3.283203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 8.0, 6.0, 8.0, 9.0, 13.0, 11.0, 21.0, 19.0, 28.0, 40.0, 28.0, 67.0, 105.0, 113.0, 133.0, 89.0, 68.0, 53.0, 38.0, 37.0, 30.0, 21.0, 6.0, 12.0, 10.0, 3.0, 7.0, 4.0, 1.0, 2.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0], "bins": [-0.0005645751953125, -0.0005497299134731293, -0.0005348846316337585, -0.0005200393497943878, -0.0005051940679550171, -0.0004903487861156464, -0.00047550350427627563, -0.0004606582224369049, -0.0004458129405975342, -0.00043096765875816345, -0.0004161223769187927, -0.000401277095079422, -0.00038643181324005127, -0.00037158653140068054, -0.0003567412495613098, -0.0003418959677219391, -0.00032705068588256836, -0.00031220540404319763, -0.0002973601222038269, -0.0002825148403644562, -0.00026766955852508545, -0.0002528242766857147, -0.000237978994846344, -0.00022313371300697327, -0.00020828843116760254, -0.0001934431493282318, -0.00017859786748886108, -0.00016375258564949036, -0.00014890730381011963, -0.0001340620219707489, -0.00011921674013137817, -0.00010437145829200745, -8.952617645263672e-05, -7.468089461326599e-05, -5.9835612773895264e-05, -4.4990330934524536e-05, -3.014504909515381e-05, -1.529976725578308e-05, -4.544854164123535e-07, 1.4390796422958374e-05, 2.92360782623291e-05, 4.408136010169983e-05, 5.892664194107056e-05, 7.377192378044128e-05, 8.861720561981201e-05, 0.00010346248745918274, 0.00011830776929855347, 0.0001331530511379242, 0.00014799833297729492, 0.00016284361481666565, 0.00017768889665603638, 0.0001925341784954071, 0.00020737946033477783, 0.00022222474217414856, 0.0002370700240135193, 0.00025191530585289, 0.00026676058769226074, 0.00028160586953163147, 0.0002964511513710022, 0.0003112964332103729, 0.00032614171504974365, 0.0003409869968891144, 0.0003558322787284851, 0.00037067756056785583, 0.00038552284240722656]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 13.0, 11.0, 25.0, 20.0, 32.0, 46.0, 69.0, 105.0, 183.0, 339.0, 597.0, 1033.0, 2299.0, 5153.0, 14425.0, 51120.0, 246142.0, 532175.0, 143967.0, 33090.0, 10043.0, 3832.0, 1695.0, 876.0, 463.0, 293.0, 171.0, 111.0, 66.0, 55.0, 25.0, 19.0, 15.0, 5.0, 9.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.15625, -3.0643310546875, -2.972412109375, -2.8804931640625, -2.78857421875, -2.6966552734375, -2.604736328125, -2.5128173828125, -2.4208984375, -2.3289794921875, -2.237060546875, -2.1451416015625, -2.05322265625, -1.9613037109375, -1.869384765625, -1.7774658203125, -1.685546875, -1.5936279296875, -1.501708984375, -1.4097900390625, -1.31787109375, -1.2259521484375, -1.134033203125, -1.0421142578125, -0.9501953125, -0.8582763671875, -0.766357421875, -0.6744384765625, -0.58251953125, -0.4906005859375, -0.398681640625, -0.3067626953125, -0.21484375, -0.1229248046875, -0.031005859375, 0.0609130859375, 0.15283203125, 0.2447509765625, 0.336669921875, 0.4285888671875, 0.5205078125, 0.6124267578125, 0.704345703125, 0.7962646484375, 0.88818359375, 0.9801025390625, 1.072021484375, 1.1639404296875, 1.255859375, 1.3477783203125, 1.439697265625, 1.5316162109375, 1.62353515625, 1.7154541015625, 1.807373046875, 1.8992919921875, 1.9912109375, 2.0831298828125, 2.175048828125, 2.2669677734375, 2.35888671875, 2.4508056640625, 2.542724609375, 2.6346435546875, 2.7265625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 9.0, 5.0, 7.0, 11.0, 12.0, 19.0, 25.0, 29.0, 37.0, 47.0, 43.0, 66.0, 69.0, 83.0, 64.0, 81.0, 60.0, 52.0, 38.0, 46.0, 33.0, 32.0, 17.0, 26.0, 21.0, 11.0, 10.0, 7.0, 3.0, 6.0, 5.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.787109375, -1.7331390380859375, -1.679168701171875, -1.6251983642578125, -1.57122802734375, -1.5172576904296875, -1.463287353515625, -1.4093170166015625, -1.3553466796875, -1.3013763427734375, -1.247406005859375, -1.1934356689453125, -1.13946533203125, -1.0854949951171875, -1.031524658203125, -0.9775543212890625, -0.923583984375, -0.8696136474609375, -0.815643310546875, -0.7616729736328125, -0.70770263671875, -0.6537322998046875, -0.599761962890625, -0.5457916259765625, -0.4918212890625, -0.4378509521484375, -0.383880615234375, -0.3299102783203125, -0.27593994140625, -0.2219696044921875, -0.167999267578125, -0.1140289306640625, -0.06005859375, -0.0060882568359375, 0.047882080078125, 0.1018524169921875, 0.15582275390625, 0.2097930908203125, 0.263763427734375, 0.3177337646484375, 0.3717041015625, 0.4256744384765625, 0.479644775390625, 0.5336151123046875, 0.58758544921875, 0.6415557861328125, 0.695526123046875, 0.7494964599609375, 0.803466796875, 0.8574371337890625, 0.911407470703125, 0.9653778076171875, 1.01934814453125, 1.0733184814453125, 1.127288818359375, 1.1812591552734375, 1.2352294921875, 1.2891998291015625, 1.343170166015625, 1.3971405029296875, 1.45111083984375, 1.5050811767578125, 1.559051513671875, 1.6130218505859375, 1.6669921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 12.0, 7.0, 17.0, 31.0, 53.0, 60.0, 81.0, 107.0, 130.0, 109.0, 123.0, 80.0, 61.0, 44.0, 28.0, 18.0, 10.0, 8.0, 7.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.029603958129883, -26.17972755432129, -25.329851150512695, -24.4799747467041, -23.630098342895508, -22.780221939086914, -21.930347442626953, -21.08047103881836, -20.230594635009766, -19.380718231201172, -18.530841827392578, -17.680965423583984, -16.83108901977539, -15.981212615966797, -15.13133716583252, -14.281460762023926, -13.431583404541016, -12.581707000732422, -11.731830596923828, -10.881954193115234, -10.03207778930664, -9.182201385498047, -8.33232593536377, -7.482449531555176, -6.632573127746582, -5.782696723937988, -4.9328203201293945, -4.082944393157959, -3.2330679893493652, -2.3831915855407715, -1.533315658569336, -0.6834392547607422, 0.16643524169921875, 1.016311526298523, 1.8661878108978271, 2.716063976287842, 3.5659403800964355, 4.415816783905029, 5.265692710876465, 6.115569114685059, 6.965445518493652, 7.815321922302246, 8.66519832611084, 9.515073776245117, 10.364950180053711, 11.214826583862305, 12.064702987670898, 12.914579391479492, 13.764455795288086, 14.61433219909668, 15.464208602905273, 16.314085006713867, 17.16396141052246, 18.013837814331055, 18.863712310791016, 19.71358871459961, 20.563465118408203, 21.413341522216797, 22.26321792602539, 23.113094329833984, 23.962970733642578, 24.812847137451172, 25.662723541259766, 26.51259994506836, 27.362476348876953]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 5.0, 10.0, 11.0, 12.0, 13.0, 25.0, 20.0, 13.0, 23.0, 31.0, 27.0, 31.0, 29.0, 39.0, 48.0, 39.0, 41.0, 47.0, 40.0, 54.0, 45.0, 42.0, 40.0, 38.0, 25.0, 32.0, 40.0, 26.0, 29.0, 23.0, 20.0, 12.0, 10.0, 9.0, 9.0, 11.0, 6.0, 6.0, 6.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0], "bins": [-20.653261184692383, -20.05702018737793, -19.460779190063477, -18.864538192749023, -18.26829719543457, -17.672056198120117, -17.075815200805664, -16.47957420349121, -15.883333206176758, -15.287092208862305, -14.690851211547852, -14.094610214233398, -13.498369216918945, -12.902128219604492, -12.305887222290039, -11.709646224975586, -11.113405227661133, -10.51716423034668, -9.920923233032227, -9.324682235717773, -8.72844123840332, -8.132200241088867, -7.535959243774414, -6.939718246459961, -6.343477249145508, -5.747236251831055, -5.150995254516602, -4.554754257202148, -3.9585132598876953, -3.362272262573242, -2.766031265258789, -2.169790267944336, -1.5735511779785156, -0.9773101806640625, -0.3810691833496094, 0.21517181396484375, 0.8114128112792969, 1.40765380859375, 2.003894805908203, 2.6001358032226562, 3.1963768005371094, 3.7926177978515625, 4.388858795166016, 4.985099792480469, 5.581340789794922, 6.177581787109375, 6.773822784423828, 7.370063781738281, 7.966304779052734, 8.562545776367188, 9.15878677368164, 9.755027770996094, 10.351268768310547, 10.947509765625, 11.543750762939453, 12.139991760253906, 12.73623275756836, 13.332473754882812, 13.928714752197266, 14.524955749511719, 15.121196746826172, 15.717437744140625, 16.313678741455078, 16.90991973876953, 17.506160736083984]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 6.0, 13.0, 11.0, 13.0, 40.0, 68.0, 138.0, 282.0, 546.0, 1236.0, 3096.0, 8150.0, 25113.0, 114204.0, 3699647.0, 279828.0, 41354.0, 12487.0, 4516.0, 1885.0, 863.0, 347.0, 200.0, 76.0, 54.0, 37.0, 26.0, 9.0, 11.0, 8.0, 6.0, 1.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.583984375, -3.392242431640625, -3.20050048828125, -3.008758544921875, -2.8170166015625, -2.625274658203125, -2.43353271484375, -2.241790771484375, -2.050048828125, -1.858306884765625, -1.66656494140625, -1.474822998046875, -1.2830810546875, -1.091339111328125, -0.89959716796875, -0.707855224609375, -0.51611328125, -0.324371337890625, -0.13262939453125, 0.059112548828125, 0.2508544921875, 0.442596435546875, 0.63433837890625, 0.826080322265625, 1.017822265625, 1.209564208984375, 1.40130615234375, 1.593048095703125, 1.7847900390625, 1.976531982421875, 2.16827392578125, 2.360015869140625, 2.5517578125, 2.743499755859375, 2.93524169921875, 3.126983642578125, 3.3187255859375, 3.510467529296875, 3.70220947265625, 3.893951416015625, 4.085693359375, 4.277435302734375, 4.46917724609375, 4.660919189453125, 4.8526611328125, 5.044403076171875, 5.23614501953125, 5.427886962890625, 5.61962890625, 5.811370849609375, 6.00311279296875, 6.194854736328125, 6.3865966796875, 6.578338623046875, 6.77008056640625, 6.961822509765625, 7.153564453125, 7.345306396484375, 7.53704833984375, 7.728790283203125, 7.9205322265625, 8.112274169921875, 8.30401611328125, 8.495758056640625, 8.6875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 3.0, 4.0, 11.0, 14.0, 17.0, 25.0, 20.0, 14.0, 19.0, 30.0, 48.0, 58.0, 47.0, 49.0, 62.0, 48.0, 52.0, 59.0, 51.0, 48.0, 46.0, 42.0, 33.0, 25.0, 22.0, 21.0, 19.0, 19.0, 21.0, 16.0, 22.0, 9.0, 4.0, 8.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.642578125, -0.6216888427734375, -0.600799560546875, -0.5799102783203125, -0.55902099609375, -0.5381317138671875, -0.517242431640625, -0.4963531494140625, -0.4754638671875, -0.4545745849609375, -0.433685302734375, -0.4127960205078125, -0.39190673828125, -0.3710174560546875, -0.350128173828125, -0.3292388916015625, -0.308349609375, -0.2874603271484375, -0.266571044921875, -0.2456817626953125, -0.22479248046875, -0.2039031982421875, -0.183013916015625, -0.1621246337890625, -0.1412353515625, -0.1203460693359375, -0.099456787109375, -0.0785675048828125, -0.05767822265625, -0.0367889404296875, -0.015899658203125, 0.0049896240234375, 0.02587890625, 0.0467681884765625, 0.067657470703125, 0.0885467529296875, 0.10943603515625, 0.1303253173828125, 0.151214599609375, 0.1721038818359375, 0.1929931640625, 0.2138824462890625, 0.234771728515625, 0.2556610107421875, 0.27655029296875, 0.2974395751953125, 0.318328857421875, 0.3392181396484375, 0.360107421875, 0.3809967041015625, 0.401885986328125, 0.4227752685546875, 0.44366455078125, 0.4645538330078125, 0.485443115234375, 0.5063323974609375, 0.5272216796875, 0.5481109619140625, 0.569000244140625, 0.5898895263671875, 0.61077880859375, 0.6316680908203125, 0.652557373046875, 0.6734466552734375, 0.6943359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 10.0, 21.0, 20.0, 46.0, 70.0, 139.0, 283.0, 561.0, 1057.0, 2430.0, 5843.0, 16376.0, 55108.0, 259875.0, 3424663.0, 333348.0, 63995.0, 18605.0, 6505.0, 2676.0, 1244.0, 620.0, 353.0, 202.0, 85.0, 59.0, 34.0, 17.0, 18.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.955078125, -3.794036865234375, -3.63299560546875, -3.471954345703125, -3.3109130859375, -3.149871826171875, -2.98883056640625, -2.827789306640625, -2.666748046875, -2.505706787109375, -2.34466552734375, -2.183624267578125, -2.0225830078125, -1.861541748046875, -1.70050048828125, -1.539459228515625, -1.37841796875, -1.217376708984375, -1.05633544921875, -0.895294189453125, -0.7342529296875, -0.573211669921875, -0.41217041015625, -0.251129150390625, -0.090087890625, 0.070953369140625, 0.23199462890625, 0.393035888671875, 0.5540771484375, 0.715118408203125, 0.87615966796875, 1.037200927734375, 1.1982421875, 1.359283447265625, 1.52032470703125, 1.681365966796875, 1.8424072265625, 2.003448486328125, 2.16448974609375, 2.325531005859375, 2.486572265625, 2.647613525390625, 2.80865478515625, 2.969696044921875, 3.1307373046875, 3.291778564453125, 3.45281982421875, 3.613861083984375, 3.77490234375, 3.935943603515625, 4.09698486328125, 4.258026123046875, 4.4190673828125, 4.580108642578125, 4.74114990234375, 4.902191162109375, 5.063232421875, 5.224273681640625, 5.38531494140625, 5.546356201171875, 5.7073974609375, 5.868438720703125, 6.02947998046875, 6.190521240234375, 6.3515625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 7.0, 3.0, 9.0, 13.0, 22.0, 22.0, 32.0, 45.0, 66.0, 78.0, 110.0, 165.0, 333.0, 1558.0, 814.0, 273.0, 151.0, 79.0, 63.0, 51.0, 37.0, 32.0, 23.0, 16.0, 19.0, 8.0, 5.0, 9.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.19921875, -1.16156005859375, -1.1239013671875, -1.08624267578125, -1.048583984375, -1.01092529296875, -0.9732666015625, -0.93560791015625, -0.89794921875, -0.86029052734375, -0.8226318359375, -0.78497314453125, -0.747314453125, -0.70965576171875, -0.6719970703125, -0.63433837890625, -0.5966796875, -0.55902099609375, -0.5213623046875, -0.48370361328125, -0.446044921875, -0.40838623046875, -0.3707275390625, -0.33306884765625, -0.29541015625, -0.25775146484375, -0.2200927734375, -0.18243408203125, -0.144775390625, -0.10711669921875, -0.0694580078125, -0.03179931640625, 0.005859375, 0.04351806640625, 0.0811767578125, 0.11883544921875, 0.156494140625, 0.19415283203125, 0.2318115234375, 0.26947021484375, 0.30712890625, 0.34478759765625, 0.3824462890625, 0.42010498046875, 0.457763671875, 0.49542236328125, 0.5330810546875, 0.57073974609375, 0.6083984375, 0.64605712890625, 0.6837158203125, 0.72137451171875, 0.759033203125, 0.79669189453125, 0.8343505859375, 0.87200927734375, 0.90966796875, 0.94732666015625, 0.9849853515625, 1.02264404296875, 1.060302734375, 1.09796142578125, 1.1356201171875, 1.17327880859375, 1.2109375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 10.0, 15.0, 9.0, 32.0, 50.0, 64.0, 77.0, 98.0, 122.0, 111.0, 96.0, 80.0, 76.0, 38.0, 39.0, 17.0, 23.0, 13.0, 6.0, 8.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.371510982513428, -7.140501499176025, -6.909492015838623, -6.678482532501221, -6.447473049163818, -6.216463565826416, -5.9854536056518555, -5.754444122314453, -5.523434638977051, -5.292425155639648, -5.061415672302246, -4.830406188964844, -4.599396705627441, -4.368387222290039, -4.137377738952637, -3.9063680171966553, -3.675358772277832, -3.4443492889404297, -3.2133398056030273, -2.982330322265625, -2.7513208389282227, -2.5203113555908203, -2.289301633834839, -2.0582921504974365, -1.8272826671600342, -1.5962731838226318, -1.3652637004852295, -1.1342540979385376, -0.9032446146011353, -0.6722351312637329, -0.441225528717041, -0.21021604537963867, 0.020793914794921875, 0.2518034279346466, 0.48281294107437134, 0.7138224840164185, 0.9448319673538208, 1.1758414506912231, 1.406851053237915, 1.6378605365753174, 1.8688700199127197, 2.099879503250122, 2.3308889865875244, 2.561898708343506, 2.792908191680908, 3.0239176750183105, 3.254927158355713, 3.4859366416931152, 3.7169461250305176, 3.94795560836792, 4.178965091705322, 4.409974575042725, 4.640984058380127, 4.871993541717529, 5.10300350189209, 5.334012985229492, 5.5650224685668945, 5.796031951904297, 6.027041435241699, 6.258050918579102, 6.489060401916504, 6.720069885253906, 6.951079368591309, 7.182088851928711, 7.413098335266113]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 6.0, 4.0, 9.0, 15.0, 12.0, 23.0, 22.0, 25.0, 39.0, 46.0, 40.0, 39.0, 46.0, 65.0, 49.0, 45.0, 50.0, 55.0, 42.0, 38.0, 56.0, 36.0, 36.0, 32.0, 36.0, 28.0, 34.0, 12.0, 11.0, 17.0, 13.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.425556182861328, -5.264196395874023, -5.102836608886719, -4.941476821899414, -4.780117034912109, -4.618757247924805, -4.4573974609375, -4.296037673950195, -4.134677886962891, -3.973318099975586, -3.8119583129882812, -3.6505985260009766, -3.489238739013672, -3.327878952026367, -3.1665189266204834, -3.0051591396331787, -2.843799114227295, -2.6824393272399902, -2.5210795402526855, -2.359719753265381, -2.198359966278076, -2.0370001792907715, -1.8756401538848877, -1.714280366897583, -1.5529205799102783, -1.3915607929229736, -1.230201005935669, -1.0688410997390747, -0.90748131275177, -0.7461215257644653, -0.5847616791725159, -0.4234018325805664, -0.2620420455932617, -0.10068222880363464, 0.06067758798599243, 0.2220374047756195, 0.3833972215652466, 0.5447570085525513, 0.7061168551445007, 0.8674767017364502, 1.0288364887237549, 1.1901962757110596, 1.3515560626983643, 1.5129159688949585, 1.6742757558822632, 1.8356355428695679, 1.996995449066162, 2.158355236053467, 2.3197150230407715, 2.481074810028076, 2.642434597015381, 2.8037943840026855, 2.9651541709899902, 3.126513957977295, 3.2878739833831787, 3.4492337703704834, 3.610593557357788, 3.7719533443450928, 3.9333131313323975, 4.094673156738281, 4.256032943725586, 4.417392730712891, 4.578752517700195, 4.7401123046875, 4.901472091674805]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 5.0, 2.0, 6.0, 10.0, 19.0, 24.0, 19.0, 56.0, 73.0, 102.0, 172.0, 289.0, 436.0, 738.0, 1233.0, 1934.0, 3247.0, 5697.0, 9677.0, 17471.0, 31593.0, 58026.0, 106039.0, 183343.0, 235571.0, 172822.0, 98666.0, 53638.0, 29294.0, 16004.0, 9112.0, 5330.0, 3070.0, 1835.0, 1171.0, 678.0, 436.0, 249.0, 150.0, 96.0, 69.0, 65.0, 33.0, 18.0, 17.0, 7.0, 4.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.18359375, -2.1141357421875, -2.044677734375, -1.9752197265625, -1.90576171875, -1.8363037109375, -1.766845703125, -1.6973876953125, -1.6279296875, -1.5584716796875, -1.489013671875, -1.4195556640625, -1.35009765625, -1.2806396484375, -1.211181640625, -1.1417236328125, -1.072265625, -1.0028076171875, -0.933349609375, -0.8638916015625, -0.79443359375, -0.7249755859375, -0.655517578125, -0.5860595703125, -0.5166015625, -0.4471435546875, -0.377685546875, -0.3082275390625, -0.23876953125, -0.1693115234375, -0.099853515625, -0.0303955078125, 0.0390625, 0.1085205078125, 0.177978515625, 0.2474365234375, 0.31689453125, 0.3863525390625, 0.455810546875, 0.5252685546875, 0.5947265625, 0.6641845703125, 0.733642578125, 0.8031005859375, 0.87255859375, 0.9420166015625, 1.011474609375, 1.0809326171875, 1.150390625, 1.2198486328125, 1.289306640625, 1.3587646484375, 1.42822265625, 1.4976806640625, 1.567138671875, 1.6365966796875, 1.7060546875, 1.7755126953125, 1.844970703125, 1.9144287109375, 1.98388671875, 2.0533447265625, 2.122802734375, 2.1922607421875, 2.26171875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 7.0, 12.0, 16.0, 14.0, 18.0, 27.0, 27.0, 35.0, 40.0, 47.0, 48.0, 39.0, 55.0, 55.0, 38.0, 62.0, 50.0, 67.0, 46.0, 40.0, 39.0, 22.0, 22.0, 25.0, 33.0, 21.0, 11.0, 14.0, 14.0, 13.0, 10.0, 8.0, 5.0, 1.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61669921875, -0.59552001953125, -0.5743408203125, -0.55316162109375, -0.531982421875, -0.51080322265625, -0.4896240234375, -0.46844482421875, -0.447265625, -0.42608642578125, -0.4049072265625, -0.38372802734375, -0.362548828125, -0.34136962890625, -0.3201904296875, -0.29901123046875, -0.27783203125, -0.25665283203125, -0.2354736328125, -0.21429443359375, -0.193115234375, -0.17193603515625, -0.1507568359375, -0.12957763671875, -0.1083984375, -0.08721923828125, -0.0660400390625, -0.04486083984375, -0.023681640625, -0.00250244140625, 0.0186767578125, 0.03985595703125, 0.06103515625, 0.08221435546875, 0.1033935546875, 0.12457275390625, 0.145751953125, 0.16693115234375, 0.1881103515625, 0.20928955078125, 0.23046875, 0.25164794921875, 0.2728271484375, 0.29400634765625, 0.315185546875, 0.33636474609375, 0.3575439453125, 0.37872314453125, 0.39990234375, 0.42108154296875, 0.4422607421875, 0.46343994140625, 0.484619140625, 0.50579833984375, 0.5269775390625, 0.54815673828125, 0.5693359375, 0.59051513671875, 0.6116943359375, 0.63287353515625, 0.654052734375, 0.67523193359375, 0.6964111328125, 0.71759033203125, 0.73876953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 17.0, 10.0, 17.0, 30.0, 34.0, 43.0, 61.0, 109.0, 131.0, 217.0, 376.0, 581.0, 1175.0, 2530.0, 6890.0, 23826.0, 97649.0, 413386.0, 380290.0, 87934.0, 21637.0, 6512.0, 2427.0, 1054.0, 571.0, 358.0, 212.0, 150.0, 97.0, 57.0, 48.0, 30.0, 30.0, 22.0, 13.0, 9.0, 6.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.00390625, -4.85211181640625, -4.7003173828125, -4.54852294921875, -4.396728515625, -4.24493408203125, -4.0931396484375, -3.94134521484375, -3.78955078125, -3.63775634765625, -3.4859619140625, -3.33416748046875, -3.182373046875, -3.03057861328125, -2.8787841796875, -2.72698974609375, -2.5751953125, -2.42340087890625, -2.2716064453125, -2.11981201171875, -1.968017578125, -1.81622314453125, -1.6644287109375, -1.51263427734375, -1.36083984375, -1.20904541015625, -1.0572509765625, -0.90545654296875, -0.753662109375, -0.60186767578125, -0.4500732421875, -0.29827880859375, -0.146484375, 0.00531005859375, 0.1571044921875, 0.30889892578125, 0.460693359375, 0.61248779296875, 0.7642822265625, 0.91607666015625, 1.06787109375, 1.21966552734375, 1.3714599609375, 1.52325439453125, 1.675048828125, 1.82684326171875, 1.9786376953125, 2.13043212890625, 2.2822265625, 2.43402099609375, 2.5858154296875, 2.73760986328125, 2.889404296875, 3.04119873046875, 3.1929931640625, 3.34478759765625, 3.49658203125, 3.64837646484375, 3.8001708984375, 3.95196533203125, 4.103759765625, 4.25555419921875, 4.4073486328125, 4.55914306640625, 4.7109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 6.0, 7.0, 10.0, 10.0, 18.0, 19.0, 22.0, 15.0, 35.0, 31.0, 24.0, 34.0, 52.0, 48.0, 54.0, 50.0, 57.0, 59.0, 37.0, 50.0, 53.0, 27.0, 36.0, 40.0, 26.0, 32.0, 24.0, 12.0, 23.0, 15.0, 16.0, 11.0, 9.0, 11.0, 9.0, 6.0, 0.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55859375, -2.458709716796875, -2.35882568359375, -2.258941650390625, -2.1590576171875, -2.059173583984375, -1.95928955078125, -1.859405517578125, -1.759521484375, -1.659637451171875, -1.55975341796875, -1.459869384765625, -1.3599853515625, -1.260101318359375, -1.16021728515625, -1.060333251953125, -0.96044921875, -0.860565185546875, -0.76068115234375, -0.660797119140625, -0.5609130859375, -0.461029052734375, -0.36114501953125, -0.261260986328125, -0.161376953125, -0.061492919921875, 0.03839111328125, 0.138275146484375, 0.2381591796875, 0.338043212890625, 0.43792724609375, 0.537811279296875, 0.6376953125, 0.737579345703125, 0.83746337890625, 0.937347412109375, 1.0372314453125, 1.137115478515625, 1.23699951171875, 1.336883544921875, 1.436767578125, 1.536651611328125, 1.63653564453125, 1.736419677734375, 1.8363037109375, 1.936187744140625, 2.03607177734375, 2.135955810546875, 2.23583984375, 2.335723876953125, 2.43560791015625, 2.535491943359375, 2.6353759765625, 2.735260009765625, 2.83514404296875, 2.935028076171875, 3.034912109375, 3.134796142578125, 3.23468017578125, 3.334564208984375, 3.4344482421875, 3.534332275390625, 3.63421630859375, 3.734100341796875, 3.833984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 0.0, 6.0, 8.0, 5.0, 14.0, 23.0, 23.0, 35.0, 54.0, 86.0, 166.0, 255.0, 428.0, 782.0, 1655.0, 3577.0, 9160.0, 28375.0, 116842.0, 499284.0, 299074.0, 60592.0, 16833.0, 5968.0, 2527.0, 1295.0, 625.0, 291.0, 193.0, 130.0, 73.0, 55.0, 41.0, 29.0, 11.0, 10.0, 7.0, 8.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.40234375, -2.333282470703125, -2.26422119140625, -2.195159912109375, -2.1260986328125, -2.057037353515625, -1.98797607421875, -1.918914794921875, -1.849853515625, -1.780792236328125, -1.71173095703125, -1.642669677734375, -1.5736083984375, -1.504547119140625, -1.43548583984375, -1.366424560546875, -1.29736328125, -1.228302001953125, -1.15924072265625, -1.090179443359375, -1.0211181640625, -0.952056884765625, -0.88299560546875, -0.813934326171875, -0.744873046875, -0.675811767578125, -0.60675048828125, -0.537689208984375, -0.4686279296875, -0.399566650390625, -0.33050537109375, -0.261444091796875, -0.1923828125, -0.123321533203125, -0.05426025390625, 0.014801025390625, 0.0838623046875, 0.152923583984375, 0.22198486328125, 0.291046142578125, 0.360107421875, 0.429168701171875, 0.49822998046875, 0.567291259765625, 0.6363525390625, 0.705413818359375, 0.77447509765625, 0.843536376953125, 0.91259765625, 0.981658935546875, 1.05072021484375, 1.119781494140625, 1.1888427734375, 1.257904052734375, 1.32696533203125, 1.396026611328125, 1.465087890625, 1.534149169921875, 1.60321044921875, 1.672271728515625, 1.7413330078125, 1.810394287109375, 1.87945556640625, 1.948516845703125, 2.017578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 2.0, 12.0, 20.0, 27.0, 32.0, 52.0, 49.0, 105.0, 132.0, 167.0, 120.0, 67.0, 43.0, 39.0, 28.0, 22.0, 15.0, 24.0, 9.0, 4.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005602836608886719, -0.0005448013544082642, -0.0005293190479278564, -0.0005138367414474487, -0.000498354434967041, -0.0004828721284866333, -0.0004673898220062256, -0.00045190751552581787, -0.00043642520904541016, -0.00042094290256500244, -0.0004054605960845947, -0.000389978289604187, -0.0003744959831237793, -0.0003590136766433716, -0.00034353137016296387, -0.00032804906368255615, -0.00031256675720214844, -0.0002970844507217407, -0.000281602144241333, -0.0002661198377609253, -0.0002506375312805176, -0.00023515522480010986, -0.00021967291831970215, -0.00020419061183929443, -0.00018870830535888672, -0.000173225998878479, -0.0001577436923980713, -0.00014226138591766357, -0.00012677907943725586, -0.00011129677295684814, -9.581446647644043e-05, -8.033215999603271e-05, -6.4849853515625e-05, -4.9367547035217285e-05, -3.388524055480957e-05, -1.8402934074401855e-05, -2.9206275939941406e-06, 1.2561678886413574e-05, 2.804398536682129e-05, 4.3526291847229004e-05, 5.900859832763672e-05, 7.449090480804443e-05, 8.997321128845215e-05, 0.00010545551776885986, 0.00012093782424926758, 0.0001364201307296753, 0.000151902437210083, 0.00016738474369049072, 0.00018286705017089844, 0.00019834935665130615, 0.00021383166313171387, 0.00022931396961212158, 0.0002447962760925293, 0.000260278582572937, 0.0002757608890533447, 0.00029124319553375244, 0.00030672550201416016, 0.00032220780849456787, 0.0003376901149749756, 0.0003531724214553833, 0.000368654727935791, 0.00038413703441619873, 0.00039961934089660645, 0.00041510164737701416, 0.0004305839538574219]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 5.0, 16.0, 12.0, 24.0, 21.0, 45.0, 77.0, 96.0, 167.0, 263.0, 442.0, 956.0, 2175.0, 6145.0, 21513.0, 100905.0, 548912.0, 296637.0, 50512.0, 12448.0, 3999.0, 1536.0, 718.0, 377.0, 226.0, 93.0, 79.0, 49.0, 38.0, 14.0, 13.0, 8.0, 8.0, 6.0, 5.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.89453125, -2.808868408203125, -2.72320556640625, -2.637542724609375, -2.5518798828125, -2.466217041015625, -2.38055419921875, -2.294891357421875, -2.209228515625, -2.123565673828125, -2.03790283203125, -1.952239990234375, -1.8665771484375, -1.780914306640625, -1.69525146484375, -1.609588623046875, -1.52392578125, -1.438262939453125, -1.35260009765625, -1.266937255859375, -1.1812744140625, -1.095611572265625, -1.00994873046875, -0.924285888671875, -0.838623046875, -0.752960205078125, -0.66729736328125, -0.581634521484375, -0.4959716796875, -0.410308837890625, -0.32464599609375, -0.238983154296875, -0.1533203125, -0.067657470703125, 0.01800537109375, 0.103668212890625, 0.1893310546875, 0.274993896484375, 0.36065673828125, 0.446319580078125, 0.531982421875, 0.617645263671875, 0.70330810546875, 0.788970947265625, 0.8746337890625, 0.960296630859375, 1.04595947265625, 1.131622314453125, 1.21728515625, 1.302947998046875, 1.38861083984375, 1.474273681640625, 1.5599365234375, 1.645599365234375, 1.73126220703125, 1.816925048828125, 1.902587890625, 1.988250732421875, 2.07391357421875, 2.159576416015625, 2.2452392578125, 2.330902099609375, 2.41656494140625, 2.502227783203125, 2.587890625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 7.0, 3.0, 9.0, 18.0, 12.0, 17.0, 23.0, 22.0, 36.0, 42.0, 45.0, 51.0, 56.0, 74.0, 77.0, 81.0, 92.0, 59.0, 47.0, 40.0, 31.0, 30.0, 30.0, 14.0, 7.0, 13.0, 10.0, 11.0, 6.0, 6.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.275390625, -1.2330474853515625, -1.190704345703125, -1.1483612060546875, -1.10601806640625, -1.0636749267578125, -1.021331787109375, -0.9789886474609375, -0.9366455078125, -0.8943023681640625, -0.851959228515625, -0.8096160888671875, -0.76727294921875, -0.7249298095703125, -0.682586669921875, -0.6402435302734375, -0.597900390625, -0.5555572509765625, -0.513214111328125, -0.4708709716796875, -0.42852783203125, -0.3861846923828125, -0.343841552734375, -0.3014984130859375, -0.2591552734375, -0.2168121337890625, -0.174468994140625, -0.1321258544921875, -0.08978271484375, -0.0474395751953125, -0.005096435546875, 0.0372467041015625, 0.07958984375, 0.1219329833984375, 0.164276123046875, 0.2066192626953125, 0.24896240234375, 0.2913055419921875, 0.333648681640625, 0.3759918212890625, 0.4183349609375, 0.4606781005859375, 0.503021240234375, 0.5453643798828125, 0.58770751953125, 0.6300506591796875, 0.672393798828125, 0.7147369384765625, 0.757080078125, 0.7994232177734375, 0.841766357421875, 0.8841094970703125, 0.92645263671875, 0.9687957763671875, 1.011138916015625, 1.0534820556640625, 1.0958251953125, 1.1381683349609375, 1.180511474609375, 1.2228546142578125, 1.26519775390625, 1.3075408935546875, 1.349884033203125, 1.3922271728515625, 1.4345703125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 12.0, 20.0, 33.0, 47.0, 84.0, 136.0, 161.0, 180.0, 129.0, 75.0, 61.0, 29.0, 14.0, 8.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.0475959777832, -38.993011474609375, -37.93842697143555, -36.88384246826172, -35.82925796508789, -34.77467346191406, -33.720088958740234, -32.665504455566406, -31.610918045043945, -30.556333541870117, -29.50174903869629, -28.44716453552246, -27.392578125, -26.337993621826172, -25.283409118652344, -24.228824615478516, -23.174240112304688, -22.11965560913086, -21.06507110595703, -20.010486602783203, -18.955902099609375, -17.901317596435547, -16.846731185913086, -15.792146682739258, -14.73756217956543, -13.682977676391602, -12.628393173217773, -11.573807716369629, -10.5192232131958, -9.464638710021973, -8.410053253173828, -7.35546875, -6.300882339477539, -5.246297836303711, -4.191712856292725, -3.1371281147003174, -2.08254337310791, -1.027958869934082, 0.026626110076904297, 1.0812110900878906, 2.1357955932617188, 3.190380334854126, 4.244965076446533, 5.2995500564575195, 6.354134559631348, 7.408719062805176, 8.46330451965332, 9.517889022827148, 10.572473526000977, 11.627058029174805, 12.681642532348633, 13.736227989196777, 14.790812492370605, 15.845396995544434, 16.899982452392578, 17.954566955566406, 19.009151458740234, 20.063735961914062, 21.11832046508789, 22.17290496826172, 23.227489471435547, 24.282073974609375, 25.336660385131836, 26.391244888305664, 27.445829391479492]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 10.0, 10.0, 19.0, 18.0, 19.0, 23.0, 36.0, 29.0, 35.0, 24.0, 43.0, 46.0, 43.0, 37.0, 53.0, 44.0, 47.0, 43.0, 51.0, 52.0, 38.0, 34.0, 41.0, 31.0, 28.0, 31.0, 19.0, 18.0, 14.0, 13.0, 10.0, 13.0, 8.0, 6.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.359699249267578, -13.80445671081543, -13.249214172363281, -12.693971633911133, -12.1387300491333, -11.583487510681152, -11.028244972229004, -10.473002433776855, -9.917760848999023, -9.362518310546875, -8.807275772094727, -8.252033233642578, -7.696791648864746, -7.141549110412598, -6.586306571960449, -6.031064033508301, -5.475821495056152, -4.920578956604004, -4.365336894989014, -3.8100943565368652, -3.254852056503296, -2.6996097564697266, -2.144367218017578, -1.5891249179840088, -1.0338826179504395, -0.47864025831222534, 0.07660210132598877, 0.6318445205688477, 1.187086820602417, 1.7423291206359863, 2.2975716590881348, 2.852813959121704, 3.4080562591552734, 3.9632985591888428, 4.518540859222412, 5.0737833976745605, 5.629025459289551, 6.184267997741699, 6.739510536193848, 7.294753074645996, 7.849995136260986, 8.405237197875977, 8.960479736328125, 9.515722274780273, 10.070964813232422, 10.62620735168457, 11.181449890136719, 11.73669147491455, 12.2919340133667, 12.847176551818848, 13.402419090270996, 13.957660675048828, 14.512903213500977, 15.068145751953125, 15.623388290405273, 16.178630828857422, 16.73387336730957, 17.28911590576172, 17.844358444213867, 18.399600982666016, 18.954843521118164, 19.510086059570312, 20.065326690673828, 20.620569229125977, 21.175811767578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 7.0, 4.0, 16.0, 23.0, 39.0, 64.0, 93.0, 144.0, 218.0, 348.0, 598.0, 920.0, 1551.0, 2624.0, 4970.0, 9715.0, 19303.0, 43289.0, 113444.0, 477953.0, 3094251.0, 275891.0, 81923.0, 33351.0, 15476.0, 7841.0, 4169.0, 2325.0, 1360.0, 879.0, 557.0, 324.0, 186.0, 124.0, 89.0, 69.0, 40.0, 32.0, 21.0, 28.0, 8.0, 6.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1875, -2.09381103515625, -2.0001220703125, -1.90643310546875, -1.812744140625, -1.71905517578125, -1.6253662109375, -1.53167724609375, -1.43798828125, -1.34429931640625, -1.2506103515625, -1.15692138671875, -1.063232421875, -0.96954345703125, -0.8758544921875, -0.78216552734375, -0.6884765625, -0.59478759765625, -0.5010986328125, -0.40740966796875, -0.313720703125, -0.22003173828125, -0.1263427734375, -0.03265380859375, 0.06103515625, 0.15472412109375, 0.2484130859375, 0.34210205078125, 0.435791015625, 0.52947998046875, 0.6231689453125, 0.71685791015625, 0.810546875, 0.90423583984375, 0.9979248046875, 1.09161376953125, 1.185302734375, 1.27899169921875, 1.3726806640625, 1.46636962890625, 1.56005859375, 1.65374755859375, 1.7474365234375, 1.84112548828125, 1.934814453125, 2.02850341796875, 2.1221923828125, 2.21588134765625, 2.3095703125, 2.40325927734375, 2.4969482421875, 2.59063720703125, 2.684326171875, 2.77801513671875, 2.8717041015625, 2.96539306640625, 3.05908203125, 3.15277099609375, 3.2464599609375, 3.34014892578125, 3.433837890625, 3.52752685546875, 3.6212158203125, 3.71490478515625, 3.80859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 9.0, 10.0, 11.0, 19.0, 16.0, 17.0, 27.0, 19.0, 23.0, 40.0, 46.0, 37.0, 42.0, 48.0, 47.0, 54.0, 46.0, 41.0, 52.0, 37.0, 42.0, 29.0, 26.0, 32.0, 31.0, 20.0, 26.0, 21.0, 13.0, 12.0, 12.0, 12.0, 8.0, 6.0, 10.0, 7.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.56689453125, -0.548980712890625, -0.53106689453125, -0.513153076171875, -0.4952392578125, -0.477325439453125, -0.45941162109375, -0.441497802734375, -0.423583984375, -0.405670166015625, -0.38775634765625, -0.369842529296875, -0.3519287109375, -0.334014892578125, -0.31610107421875, -0.298187255859375, -0.2802734375, -0.262359619140625, -0.24444580078125, -0.226531982421875, -0.2086181640625, -0.190704345703125, -0.17279052734375, -0.154876708984375, -0.136962890625, -0.119049072265625, -0.10113525390625, -0.083221435546875, -0.0653076171875, -0.047393798828125, -0.02947998046875, -0.011566162109375, 0.00634765625, 0.024261474609375, 0.04217529296875, 0.060089111328125, 0.0780029296875, 0.095916748046875, 0.11383056640625, 0.131744384765625, 0.149658203125, 0.167572021484375, 0.18548583984375, 0.203399658203125, 0.2213134765625, 0.239227294921875, 0.25714111328125, 0.275054931640625, 0.29296875, 0.310882568359375, 0.32879638671875, 0.346710205078125, 0.3646240234375, 0.382537841796875, 0.40045166015625, 0.418365478515625, 0.436279296875, 0.454193115234375, 0.47210693359375, 0.490020751953125, 0.5079345703125, 0.525848388671875, 0.54376220703125, 0.561676025390625, 0.57958984375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 7.0, 7.0, 18.0, 14.0, 28.0, 60.0, 91.0, 196.0, 534.0, 1670.0, 6183.0, 29160.0, 262364.0, 3638139.0, 221885.0, 25750.0, 5711.0, 1482.0, 536.0, 210.0, 107.0, 43.0, 36.0, 28.0, 16.0, 7.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.595703125, -3.377410888671875, -3.15911865234375, -2.940826416015625, -2.7225341796875, -2.504241943359375, -2.28594970703125, -2.067657470703125, -1.849365234375, -1.631072998046875, -1.41278076171875, -1.194488525390625, -0.9761962890625, -0.757904052734375, -0.53961181640625, -0.321319580078125, -0.10302734375, 0.115264892578125, 0.33355712890625, 0.551849365234375, 0.7701416015625, 0.988433837890625, 1.20672607421875, 1.425018310546875, 1.643310546875, 1.861602783203125, 2.07989501953125, 2.298187255859375, 2.5164794921875, 2.734771728515625, 2.95306396484375, 3.171356201171875, 3.3896484375, 3.607940673828125, 3.82623291015625, 4.044525146484375, 4.2628173828125, 4.481109619140625, 4.69940185546875, 4.917694091796875, 5.135986328125, 5.354278564453125, 5.57257080078125, 5.790863037109375, 6.0091552734375, 6.227447509765625, 6.44573974609375, 6.664031982421875, 6.88232421875, 7.100616455078125, 7.31890869140625, 7.537200927734375, 7.7554931640625, 7.973785400390625, 8.19207763671875, 8.410369873046875, 8.628662109375, 8.846954345703125, 9.06524658203125, 9.283538818359375, 9.5018310546875, 9.720123291015625, 9.93841552734375, 10.156707763671875, 10.375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 10.0, 1.0, 3.0, 6.0, 6.0, 7.0, 10.0, 15.0, 18.0, 14.0, 23.0, 36.0, 42.0, 56.0, 83.0, 107.0, 151.0, 273.0, 508.0, 1256.0, 590.0, 279.0, 150.0, 112.0, 84.0, 64.0, 36.0, 30.0, 16.0, 22.0, 7.0, 17.0, 7.0, 11.0, 7.0, 3.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.267578125, -1.2232666015625, -1.178955078125, -1.1346435546875, -1.09033203125, -1.0460205078125, -1.001708984375, -0.9573974609375, -0.9130859375, -0.8687744140625, -0.824462890625, -0.7801513671875, -0.73583984375, -0.6915283203125, -0.647216796875, -0.6029052734375, -0.55859375, -0.5142822265625, -0.469970703125, -0.4256591796875, -0.38134765625, -0.3370361328125, -0.292724609375, -0.2484130859375, -0.2041015625, -0.1597900390625, -0.115478515625, -0.0711669921875, -0.02685546875, 0.0174560546875, 0.061767578125, 0.1060791015625, 0.150390625, 0.1947021484375, 0.239013671875, 0.2833251953125, 0.32763671875, 0.3719482421875, 0.416259765625, 0.4605712890625, 0.5048828125, 0.5491943359375, 0.593505859375, 0.6378173828125, 0.68212890625, 0.7264404296875, 0.770751953125, 0.8150634765625, 0.859375, 0.9036865234375, 0.947998046875, 0.9923095703125, 1.03662109375, 1.0809326171875, 1.125244140625, 1.1695556640625, 1.2138671875, 1.2581787109375, 1.302490234375, 1.3468017578125, 1.39111328125, 1.4354248046875, 1.479736328125, 1.5240478515625, 1.568359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 17.0, 68.0, 157.0, 260.0, 250.0, 148.0, 72.0, 18.0, 6.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.629150390625, -36.75761413574219, -35.88608169555664, -35.01454544067383, -34.143009185791016, -33.2714729309082, -32.399940490722656, -31.528404235839844, -30.65686798095703, -29.78533363342285, -28.91379737854004, -28.04226303100586, -27.170726776123047, -26.299192428588867, -25.427658081054688, -24.556121826171875, -23.684587478637695, -22.813053131103516, -21.941516876220703, -21.069982528686523, -20.19844627380371, -19.32691192626953, -18.45537567138672, -17.58384132385254, -16.71230697631836, -15.840771675109863, -14.969236373901367, -14.097702026367188, -13.226165771484375, -12.354631423950195, -11.4830961227417, -10.611560821533203, -9.74002456665039, -8.868489265441895, -7.996953964233398, -7.1254191398620605, -6.2538838386535645, -5.382348537445068, -4.5108137130737305, -3.6392784118652344, -2.7677431106567383, -1.8962079286575317, -1.0246727466583252, -0.1531376838684082, 0.7183976173400879, 1.589932918548584, 2.461467742919922, 3.333003044128418, 4.204538345336914, 5.07607364654541, 5.947608947753906, 6.819143772125244, 7.69067907333374, 8.562213897705078, 9.433749198913574, 10.30528450012207, 11.176819801330566, 12.048355102539062, 12.919890403747559, 13.791425704956055, 14.662960052490234, 15.534496307373047, 16.406030654907227, 17.277565002441406, 18.14910125732422]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 8.0, 4.0, 14.0, 9.0, 14.0, 15.0, 21.0, 17.0, 25.0, 23.0, 30.0, 26.0, 36.0, 39.0, 46.0, 59.0, 51.0, 37.0, 43.0, 42.0, 51.0, 45.0, 46.0, 34.0, 33.0, 33.0, 38.0, 27.0, 21.0, 24.0, 17.0, 10.0, 16.0, 12.0, 11.0, 10.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.874296188354492, -6.670568466186523, -6.466841220855713, -6.263113498687744, -6.059386253356934, -5.855658531188965, -5.651931285858154, -5.4482035636901855, -5.244476318359375, -5.040748596191406, -4.837021350860596, -4.633293628692627, -4.429566383361816, -4.225838661193848, -4.022111415863037, -3.8183836936950684, -3.6146562099456787, -3.410928726196289, -3.2072012424468994, -3.0034737586975098, -2.79974627494812, -2.5960187911987305, -2.3922910690307617, -2.188563823699951, -1.984836220741272, -1.7811087369918823, -1.5773812532424927, -1.3736536502838135, -1.1699261665344238, -0.9661986827850342, -0.7624711990356445, -0.5587437152862549, -0.35501623153686523, -0.1512887328863144, 0.05243876576423645, 0.2561662793159485, 0.45989376306533813, 0.6636213064193726, 0.8673487901687622, 1.0710762739181519, 1.2748037576675415, 1.4785312414169312, 1.6822587251663208, 1.885986328125, 2.0897138118743896, 2.2934412956237793, 2.497168779373169, 2.7008962631225586, 2.9046237468719482, 3.108351230621338, 3.3120787143707275, 3.515806198120117, 3.719533681869507, 3.9232611656188965, 4.126988887786865, 4.330716133117676, 4.5344438552856445, 4.738171577453613, 4.941898822784424, 5.145626544952393, 5.349353790283203, 5.553081512451172, 5.756808757781982, 5.960536479949951, 6.164263725280762]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 12.0, 7.0, 12.0, 20.0, 29.0, 46.0, 56.0, 68.0, 129.0, 211.0, 367.0, 641.0, 1124.0, 2205.0, 3999.0, 8073.0, 16074.0, 32602.0, 67056.0, 141719.0, 320211.0, 243722.0, 107432.0, 51422.0, 25329.0, 12513.0, 6439.0, 3184.0, 1621.0, 877.0, 520.0, 270.0, 197.0, 113.0, 78.0, 56.0, 43.0, 24.0, 18.0, 9.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.26953125, -3.1728515625, -3.076171875, -2.9794921875, -2.8828125, -2.7861328125, -2.689453125, -2.5927734375, -2.49609375, -2.3994140625, -2.302734375, -2.2060546875, -2.109375, -2.0126953125, -1.916015625, -1.8193359375, -1.72265625, -1.6259765625, -1.529296875, -1.4326171875, -1.3359375, -1.2392578125, -1.142578125, -1.0458984375, -0.94921875, -0.8525390625, -0.755859375, -0.6591796875, -0.5625, -0.4658203125, -0.369140625, -0.2724609375, -0.17578125, -0.0791015625, 0.017578125, 0.1142578125, 0.2109375, 0.3076171875, 0.404296875, 0.5009765625, 0.59765625, 0.6943359375, 0.791015625, 0.8876953125, 0.984375, 1.0810546875, 1.177734375, 1.2744140625, 1.37109375, 1.4677734375, 1.564453125, 1.6611328125, 1.7578125, 1.8544921875, 1.951171875, 2.0478515625, 2.14453125, 2.2412109375, 2.337890625, 2.4345703125, 2.53125, 2.6279296875, 2.724609375, 2.8212890625, 2.91796875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 8.0, 6.0, 7.0, 10.0, 12.0, 14.0, 14.0, 19.0, 23.0, 35.0, 38.0, 39.0, 49.0, 52.0, 44.0, 50.0, 54.0, 46.0, 60.0, 47.0, 39.0, 55.0, 31.0, 37.0, 29.0, 27.0, 28.0, 25.0, 14.0, 17.0, 13.0, 14.0, 11.0, 8.0, 3.0, 6.0, 2.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70068359375, -0.6798629760742188, -0.6590423583984375, -0.6382217407226562, -0.617401123046875, -0.5965805053710938, -0.5757598876953125, -0.5549392700195312, -0.53411865234375, -0.5132980346679688, -0.4924774169921875, -0.47165679931640625, -0.450836181640625, -0.43001556396484375, -0.4091949462890625, -0.38837432861328125, -0.3675537109375, -0.34673309326171875, -0.3259124755859375, -0.30509185791015625, -0.284271240234375, -0.26345062255859375, -0.2426300048828125, -0.22180938720703125, -0.20098876953125, -0.18016815185546875, -0.1593475341796875, -0.13852691650390625, -0.117706298828125, -0.09688568115234375, -0.0760650634765625, -0.05524444580078125, -0.034423828125, -0.01360321044921875, 0.0072174072265625, 0.02803802490234375, 0.048858642578125, 0.06967926025390625, 0.0904998779296875, 0.11132049560546875, 0.13214111328125, 0.15296173095703125, 0.1737823486328125, 0.19460296630859375, 0.215423583984375, 0.23624420166015625, 0.2570648193359375, 0.27788543701171875, 0.2987060546875, 0.31952667236328125, 0.3403472900390625, 0.36116790771484375, 0.381988525390625, 0.40280914306640625, 0.4236297607421875, 0.44445037841796875, 0.46527099609375, 0.48609161376953125, 0.5069122314453125, 0.5277328491210938, 0.548553466796875, 0.5693740844726562, 0.5901947021484375, 0.6110153198242188, 0.6318359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 4.0, 9.0, 8.0, 13.0, 14.0, 25.0, 35.0, 47.0, 67.0, 62.0, 90.0, 153.0, 189.0, 318.0, 515.0, 926.0, 1519.0, 2926.0, 6172.0, 13994.0, 35417.0, 96508.0, 289448.0, 386246.0, 132028.0, 47414.0, 18456.0, 7699.0, 3520.0, 1896.0, 1063.0, 593.0, 336.0, 252.0, 179.0, 99.0, 78.0, 52.0, 35.0, 36.0, 25.0, 15.0, 18.0, 6.0, 10.0, 5.0, 8.0, 5.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0], "bins": [-3.474609375, -3.369781494140625, -3.26495361328125, -3.160125732421875, -3.0552978515625, -2.950469970703125, -2.84564208984375, -2.740814208984375, -2.635986328125, -2.531158447265625, -2.42633056640625, -2.321502685546875, -2.2166748046875, -2.111846923828125, -2.00701904296875, -1.902191162109375, -1.79736328125, -1.692535400390625, -1.58770751953125, -1.482879638671875, -1.3780517578125, -1.273223876953125, -1.16839599609375, -1.063568115234375, -0.958740234375, -0.853912353515625, -0.74908447265625, -0.644256591796875, -0.5394287109375, -0.434600830078125, -0.32977294921875, -0.224945068359375, -0.1201171875, -0.015289306640625, 0.08953857421875, 0.194366455078125, 0.2991943359375, 0.404022216796875, 0.50885009765625, 0.613677978515625, 0.718505859375, 0.823333740234375, 0.92816162109375, 1.032989501953125, 1.1378173828125, 1.242645263671875, 1.34747314453125, 1.452301025390625, 1.55712890625, 1.661956787109375, 1.76678466796875, 1.871612548828125, 1.9764404296875, 2.081268310546875, 2.18609619140625, 2.290924072265625, 2.395751953125, 2.500579833984375, 2.60540771484375, 2.710235595703125, 2.8150634765625, 2.919891357421875, 3.02471923828125, 3.129547119140625, 3.234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 7.0, 12.0, 10.0, 15.0, 14.0, 17.0, 27.0, 40.0, 32.0, 35.0, 46.0, 56.0, 44.0, 43.0, 56.0, 53.0, 42.0, 44.0, 46.0, 48.0, 46.0, 47.0, 36.0, 29.0, 22.0, 26.0, 20.0, 12.0, 9.0, 16.0, 9.0, 4.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017578125, -2.913604736328125, -2.80963134765625, -2.705657958984375, -2.6016845703125, -2.497711181640625, -2.39373779296875, -2.289764404296875, -2.185791015625, -2.081817626953125, -1.97784423828125, -1.873870849609375, -1.7698974609375, -1.665924072265625, -1.56195068359375, -1.457977294921875, -1.35400390625, -1.250030517578125, -1.14605712890625, -1.042083740234375, -0.9381103515625, -0.834136962890625, -0.73016357421875, -0.626190185546875, -0.522216796875, -0.418243408203125, -0.31427001953125, -0.210296630859375, -0.1063232421875, -0.002349853515625, 0.10162353515625, 0.205596923828125, 0.3095703125, 0.413543701171875, 0.51751708984375, 0.621490478515625, 0.7254638671875, 0.829437255859375, 0.93341064453125, 1.037384033203125, 1.141357421875, 1.245330810546875, 1.34930419921875, 1.453277587890625, 1.5572509765625, 1.661224365234375, 1.76519775390625, 1.869171142578125, 1.97314453125, 2.077117919921875, 2.18109130859375, 2.285064697265625, 2.3890380859375, 2.493011474609375, 2.59698486328125, 2.700958251953125, 2.804931640625, 2.908905029296875, 3.01287841796875, 3.116851806640625, 3.2208251953125, 3.324798583984375, 3.42877197265625, 3.532745361328125, 3.63671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 14.0, 12.0, 17.0, 25.0, 62.0, 78.0, 127.0, 195.0, 394.0, 653.0, 1359.0, 3246.0, 8852.0, 30636.0, 168946.0, 662557.0, 132105.0, 26070.0, 7648.0, 2839.0, 1274.0, 636.0, 347.0, 166.0, 102.0, 61.0, 37.0, 34.0, 22.0, 10.0, 6.0, 2.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.890625, -3.77764892578125, -3.6646728515625, -3.55169677734375, -3.438720703125, -3.32574462890625, -3.2127685546875, -3.09979248046875, -2.98681640625, -2.87384033203125, -2.7608642578125, -2.64788818359375, -2.534912109375, -2.42193603515625, -2.3089599609375, -2.19598388671875, -2.0830078125, -1.97003173828125, -1.8570556640625, -1.74407958984375, -1.631103515625, -1.51812744140625, -1.4051513671875, -1.29217529296875, -1.17919921875, -1.06622314453125, -0.9532470703125, -0.84027099609375, -0.727294921875, -0.61431884765625, -0.5013427734375, -0.38836669921875, -0.275390625, -0.16241455078125, -0.0494384765625, 0.06353759765625, 0.176513671875, 0.28948974609375, 0.4024658203125, 0.51544189453125, 0.62841796875, 0.74139404296875, 0.8543701171875, 0.96734619140625, 1.080322265625, 1.19329833984375, 1.3062744140625, 1.41925048828125, 1.5322265625, 1.64520263671875, 1.7581787109375, 1.87115478515625, 1.984130859375, 2.09710693359375, 2.2100830078125, 2.32305908203125, 2.43603515625, 2.54901123046875, 2.6619873046875, 2.77496337890625, 2.887939453125, 3.00091552734375, 3.1138916015625, 3.22686767578125, 3.33984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 8.0, 13.0, 14.0, 18.0, 20.0, 27.0, 35.0, 66.0, 106.0, 268.0, 171.0, 79.0, 50.0, 35.0, 27.0, 18.0, 6.0, 5.0, 7.0, 4.0, 6.0, 4.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007853507995605469, -0.0007588639855384827, -0.0007323771715164185, -0.0007058903574943542, -0.00067940354347229, -0.0006529167294502258, -0.0006264299154281616, -0.0005999431014060974, -0.0005734562873840332, -0.000546969473361969, -0.0005204826593399048, -0.0004939958453178406, -0.00046750903129577637, -0.00044102221727371216, -0.00041453540325164795, -0.00038804858922958374, -0.00036156177520751953, -0.0003350749611854553, -0.0003085881471633911, -0.0002821013331413269, -0.0002556145191192627, -0.00022912770509719849, -0.00020264089107513428, -0.00017615407705307007, -0.00014966726303100586, -0.00012318044900894165, -9.669363498687744e-05, -7.020682096481323e-05, -4.3720006942749023e-05, -1.7233192920684814e-05, 9.253621101379395e-06, 3.5740435123443604e-05, 6.222724914550781e-05, 8.871406316757202e-05, 0.00011520087718963623, 0.00014168769121170044, 0.00016817450523376465, 0.00019466131925582886, 0.00022114813327789307, 0.0002476349472999573, 0.0002741217613220215, 0.0003006085753440857, 0.0003270953893661499, 0.0003535822033882141, 0.0003800690174102783, 0.00040655583143234253, 0.00043304264545440674, 0.00045952945947647095, 0.00048601627349853516, 0.0005125030875205994, 0.0005389899015426636, 0.0005654767155647278, 0.000591963529586792, 0.0006184503436088562, 0.0006449371576309204, 0.0006714239716529846, 0.0006979107856750488, 0.000724397599697113, 0.0007508844137191772, 0.0007773712277412415, 0.0008038580417633057, 0.0008303448557853699, 0.0008568316698074341, 0.0008833184838294983, 0.0009098052978515625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 3.0, 7.0, 9.0, 11.0, 6.0, 21.0, 23.0, 49.0, 59.0, 101.0, 165.0, 251.0, 528.0, 1186.0, 2652.0, 7676.0, 28350.0, 169699.0, 673670.0, 129973.0, 23161.0, 6444.0, 2313.0, 1005.0, 473.0, 268.0, 177.0, 92.0, 58.0, 36.0, 28.0, 13.0, 19.0, 11.0, 3.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.728515625, -3.609893798828125, -3.49127197265625, -3.372650146484375, -3.2540283203125, -3.135406494140625, -3.01678466796875, -2.898162841796875, -2.779541015625, -2.660919189453125, -2.54229736328125, -2.423675537109375, -2.3050537109375, -2.186431884765625, -2.06781005859375, -1.949188232421875, -1.83056640625, -1.711944580078125, -1.59332275390625, -1.474700927734375, -1.3560791015625, -1.237457275390625, -1.11883544921875, -1.000213623046875, -0.881591796875, -0.762969970703125, -0.64434814453125, -0.525726318359375, -0.4071044921875, -0.288482666015625, -0.16986083984375, -0.051239013671875, 0.0673828125, 0.186004638671875, 0.30462646484375, 0.423248291015625, 0.5418701171875, 0.660491943359375, 0.77911376953125, 0.897735595703125, 1.016357421875, 1.134979248046875, 1.25360107421875, 1.372222900390625, 1.4908447265625, 1.609466552734375, 1.72808837890625, 1.846710205078125, 1.96533203125, 2.083953857421875, 2.20257568359375, 2.321197509765625, 2.4398193359375, 2.558441162109375, 2.67706298828125, 2.795684814453125, 2.914306640625, 3.032928466796875, 3.15155029296875, 3.270172119140625, 3.3887939453125, 3.507415771484375, 3.62603759765625, 3.744659423828125, 3.86328125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 4.0, 17.0, 25.0, 22.0, 34.0, 32.0, 51.0, 75.0, 79.0, 100.0, 114.0, 98.0, 73.0, 61.0, 37.0, 38.0, 36.0, 16.0, 13.0, 12.0, 8.0, 6.0, 5.0, 6.0, 2.0, 1.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.47265625, -2.400543212890625, -2.32843017578125, -2.256317138671875, -2.1842041015625, -2.112091064453125, -2.03997802734375, -1.967864990234375, -1.895751953125, -1.823638916015625, -1.75152587890625, -1.679412841796875, -1.6072998046875, -1.535186767578125, -1.46307373046875, -1.390960693359375, -1.31884765625, -1.246734619140625, -1.17462158203125, -1.102508544921875, -1.0303955078125, -0.958282470703125, -0.88616943359375, -0.814056396484375, -0.741943359375, -0.669830322265625, -0.59771728515625, -0.525604248046875, -0.4534912109375, -0.381378173828125, -0.30926513671875, -0.237152099609375, -0.1650390625, -0.092926025390625, -0.02081298828125, 0.051300048828125, 0.1234130859375, 0.195526123046875, 0.26763916015625, 0.339752197265625, 0.411865234375, 0.483978271484375, 0.55609130859375, 0.628204345703125, 0.7003173828125, 0.772430419921875, 0.84454345703125, 0.916656494140625, 0.98876953125, 1.060882568359375, 1.13299560546875, 1.205108642578125, 1.2772216796875, 1.349334716796875, 1.42144775390625, 1.493560791015625, 1.565673828125, 1.637786865234375, 1.70989990234375, 1.782012939453125, 1.8541259765625, 1.926239013671875, 1.99835205078125, 2.070465087890625, 2.142578125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 10.0, 14.0, 14.0, 14.0, 30.0, 31.0, 67.0, 73.0, 117.0, 101.0, 103.0, 104.0, 97.0, 66.0, 57.0, 36.0, 20.0, 14.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.158504486083984, -24.371158599853516, -23.583810806274414, -22.796464920043945, -22.009117126464844, -21.221771240234375, -20.434425354003906, -19.647077560424805, -18.859731674194336, -18.072385787963867, -17.285037994384766, -16.497692108154297, -15.710345268249512, -14.922998428344727, -14.135651588439941, -13.348304748535156, -12.560957908630371, -11.773611068725586, -10.9862642288208, -10.198917388916016, -9.411571502685547, -8.624224662780762, -7.836877822875977, -7.04953145980835, -6.2621846199035645, -5.474837779998779, -4.687491416931152, -3.900144577026367, -3.112797975540161, -2.325451374053955, -1.53810453414917, -0.750758171081543, 0.03658866882324219, 0.823935329914093, 1.6112819910049438, 2.3986287117004395, 3.1859753131866455, 3.9733219146728516, 4.760668754577637, 5.548015117645264, 6.335361957550049, 7.122708797454834, 7.910055160522461, 8.697402000427246, 9.484748840332031, 10.2720947265625, 11.059442520141602, 11.84678840637207, 12.634135246276855, 13.42148208618164, 14.208828926086426, 14.996175765991211, 15.78352165222168, 16.57086944580078, 17.35821533203125, 18.14556121826172, 18.93290901184082, 19.72025489807129, 20.50760269165039, 21.29494857788086, 22.08229637145996, 22.86964225769043, 23.65699005126953, 24.4443359375, 25.23168182373047]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 7.0, 6.0, 6.0, 12.0, 8.0, 12.0, 12.0, 21.0, 17.0, 27.0, 39.0, 29.0, 29.0, 25.0, 40.0, 44.0, 42.0, 34.0, 41.0, 48.0, 34.0, 46.0, 44.0, 49.0, 44.0, 34.0, 42.0, 30.0, 28.0, 21.0, 25.0, 22.0, 16.0, 14.0, 9.0, 9.0, 8.0, 12.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.96186065673828, -17.40020179748535, -16.838544845581055, -16.276885986328125, -15.715227127075195, -15.153569221496582, -14.591911315917969, -14.030252456665039, -13.46859359741211, -12.906935691833496, -12.345276832580566, -11.783618927001953, -11.221960067749023, -10.66030216217041, -10.098644256591797, -9.536985397338867, -8.975327491760254, -8.41366958618164, -7.852010726928711, -7.290352821350098, -6.728693962097168, -6.167036056518555, -5.605377674102783, -5.043719291687012, -4.48206090927124, -3.9204025268554688, -3.3587441444396973, -2.797086000442505, -2.2354276180267334, -1.673769235610962, -1.1121110916137695, -0.550452709197998, 0.011205673217773438, 0.5728639960289001, 1.1345223188400269, 1.6961805820465088, 2.2578389644622803, 2.8194973468780518, 3.381155490875244, 3.9428138732910156, 4.504472255706787, 5.066130638122559, 5.62778902053833, 6.189447402954102, 6.751105308532715, 7.3127641677856445, 7.874422073364258, 8.436080932617188, 8.9977388381958, 9.559396743774414, 10.121055603027344, 10.682713508605957, 11.244372367858887, 11.8060302734375, 12.36768913269043, 12.929347038269043, 13.491004943847656, 14.05266284942627, 14.6143217086792, 15.175979614257812, 15.737638473510742, 16.299297332763672, 16.86095428466797, 17.4226131439209, 17.984272003173828]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 15.0, 4.0, 16.0, 30.0, 31.0, 47.0, 74.0, 110.0, 170.0, 284.0, 396.0, 648.0, 1209.0, 2200.0, 4111.0, 8790.0, 20953.0, 61012.0, 297172.0, 3493686.0, 217471.0, 51015.0, 18319.0, 7910.0, 3721.0, 2009.0, 1071.0, 614.0, 360.0, 270.0, 184.0, 124.0, 70.0, 60.0, 32.0, 18.0, 18.0, 9.0, 10.0, 10.0, 8.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41796875, -3.2933349609375, -3.168701171875, -3.0440673828125, -2.91943359375, -2.7947998046875, -2.670166015625, -2.5455322265625, -2.4208984375, -2.2962646484375, -2.171630859375, -2.0469970703125, -1.92236328125, -1.7977294921875, -1.673095703125, -1.5484619140625, -1.423828125, -1.2991943359375, -1.174560546875, -1.0499267578125, -0.92529296875, -0.8006591796875, -0.676025390625, -0.5513916015625, -0.4267578125, -0.3021240234375, -0.177490234375, -0.0528564453125, 0.07177734375, 0.1964111328125, 0.321044921875, 0.4456787109375, 0.5703125, 0.6949462890625, 0.819580078125, 0.9442138671875, 1.06884765625, 1.1934814453125, 1.318115234375, 1.4427490234375, 1.5673828125, 1.6920166015625, 1.816650390625, 1.9412841796875, 2.06591796875, 2.1905517578125, 2.315185546875, 2.4398193359375, 2.564453125, 2.6890869140625, 2.813720703125, 2.9383544921875, 3.06298828125, 3.1876220703125, 3.312255859375, 3.4368896484375, 3.5615234375, 3.6861572265625, 3.810791015625, 3.9354248046875, 4.06005859375, 4.1846923828125, 4.309326171875, 4.4339599609375, 4.55859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 9.0, 10.0, 4.0, 9.0, 10.0, 13.0, 9.0, 19.0, 20.0, 27.0, 33.0, 37.0, 47.0, 36.0, 47.0, 41.0, 53.0, 40.0, 50.0, 59.0, 36.0, 49.0, 46.0, 43.0, 38.0, 27.0, 35.0, 22.0, 32.0, 18.0, 19.0, 18.0, 9.0, 13.0, 6.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6047134399414062, -0.5819854736328125, -0.5592575073242188, -0.536529541015625, -0.5138015747070312, -0.4910736083984375, -0.46834564208984375, -0.44561767578125, -0.42288970947265625, -0.4001617431640625, -0.37743377685546875, -0.354705810546875, -0.33197784423828125, -0.3092498779296875, -0.28652191162109375, -0.2637939453125, -0.24106597900390625, -0.2183380126953125, -0.19561004638671875, -0.172882080078125, -0.15015411376953125, -0.1274261474609375, -0.10469818115234375, -0.08197021484375, -0.05924224853515625, -0.0365142822265625, -0.01378631591796875, 0.008941650390625, 0.03166961669921875, 0.0543975830078125, 0.07712554931640625, 0.099853515625, 0.12258148193359375, 0.1453094482421875, 0.16803741455078125, 0.190765380859375, 0.21349334716796875, 0.2362213134765625, 0.25894927978515625, 0.28167724609375, 0.30440521240234375, 0.3271331787109375, 0.34986114501953125, 0.372589111328125, 0.39531707763671875, 0.4180450439453125, 0.44077301025390625, 0.4635009765625, 0.48622894287109375, 0.5089569091796875, 0.5316848754882812, 0.554412841796875, 0.5771408081054688, 0.5998687744140625, 0.6225967407226562, 0.64532470703125, 0.6680526733398438, 0.6907806396484375, 0.7135086059570312, 0.736236572265625, 0.7589645385742188, 0.7816925048828125, 0.8044204711914062, 0.8271484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 9.0, 10.0, 27.0, 29.0, 35.0, 75.0, 110.0, 161.0, 242.0, 409.0, 739.0, 1472.0, 3246.0, 7338.0, 17795.0, 53531.0, 228967.0, 3273435.0, 478450.0, 84156.0, 25610.0, 9780.0, 4133.0, 1962.0, 1037.0, 582.0, 315.0, 214.0, 134.0, 81.0, 63.0, 39.0, 29.0, 18.0, 8.0, 10.0, 10.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.96484375, -4.8216552734375, -4.678466796875, -4.5352783203125, -4.39208984375, -4.2489013671875, -4.105712890625, -3.9625244140625, -3.8193359375, -3.6761474609375, -3.532958984375, -3.3897705078125, -3.24658203125, -3.1033935546875, -2.960205078125, -2.8170166015625, -2.673828125, -2.5306396484375, -2.387451171875, -2.2442626953125, -2.10107421875, -1.9578857421875, -1.814697265625, -1.6715087890625, -1.5283203125, -1.3851318359375, -1.241943359375, -1.0987548828125, -0.95556640625, -0.8123779296875, -0.669189453125, -0.5260009765625, -0.3828125, -0.2396240234375, -0.096435546875, 0.0467529296875, 0.18994140625, 0.3331298828125, 0.476318359375, 0.6195068359375, 0.7626953125, 0.9058837890625, 1.049072265625, 1.1922607421875, 1.33544921875, 1.4786376953125, 1.621826171875, 1.7650146484375, 1.908203125, 2.0513916015625, 2.194580078125, 2.3377685546875, 2.48095703125, 2.6241455078125, 2.767333984375, 2.9105224609375, 3.0537109375, 3.1968994140625, 3.340087890625, 3.4832763671875, 3.62646484375, 3.7696533203125, 3.912841796875, 4.0560302734375, 4.19921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 7.0, 6.0, 12.0, 10.0, 12.0, 24.0, 31.0, 45.0, 39.0, 85.0, 123.0, 242.0, 640.0, 1772.0, 457.0, 168.0, 133.0, 81.0, 57.0, 37.0, 22.0, 19.0, 16.0, 8.0, 8.0, 11.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5810546875, -1.5210418701171875, -1.461029052734375, -1.4010162353515625, -1.34100341796875, -1.2809906005859375, -1.220977783203125, -1.1609649658203125, -1.1009521484375, -1.0409393310546875, -0.980926513671875, -0.9209136962890625, -0.86090087890625, -0.8008880615234375, -0.740875244140625, -0.6808624267578125, -0.620849609375, -0.5608367919921875, -0.500823974609375, -0.4408111572265625, -0.38079833984375, -0.3207855224609375, -0.260772705078125, -0.2007598876953125, -0.1407470703125, -0.0807342529296875, -0.020721435546875, 0.0392913818359375, 0.09930419921875, 0.1593170166015625, 0.219329833984375, 0.2793426513671875, 0.33935546875, 0.3993682861328125, 0.459381103515625, 0.5193939208984375, 0.57940673828125, 0.6394195556640625, 0.699432373046875, 0.7594451904296875, 0.8194580078125, 0.8794708251953125, 0.939483642578125, 0.9994964599609375, 1.05950927734375, 1.1195220947265625, 1.179534912109375, 1.2395477294921875, 1.299560546875, 1.3595733642578125, 1.419586181640625, 1.4795989990234375, 1.53961181640625, 1.5996246337890625, 1.659637451171875, 1.7196502685546875, 1.7796630859375, 1.8396759033203125, 1.899688720703125, 1.9597015380859375, 2.01971435546875, 2.0797271728515625, 2.139739990234375, 2.1997528076171875, 2.259765625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 10.0, 4.0, 25.0, 30.0, 73.0, 113.0, 142.0, 160.0, 143.0, 90.0, 101.0, 51.0, 28.0, 20.0, 5.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.641157150268555, -11.145184516906738, -10.649211883544922, -10.153239250183105, -9.657266616821289, -9.161294937133789, -8.665322303771973, -8.169349670410156, -7.67337703704834, -7.177404403686523, -6.681431770324707, -6.185459613800049, -5.689486980438232, -5.193514347076416, -4.697542190551758, -4.201569557189941, -3.705596923828125, -3.2096242904663086, -2.7136518955230713, -2.217679500579834, -1.7217068672180176, -1.2257342338562012, -0.7297618389129639, -0.23378944396972656, 0.26218318939208984, 0.7581557035446167, 1.2541282176971436, 1.7501007318496704, 2.2460732460021973, 2.7420458793640137, 3.238018274307251, 3.7339906692504883, 4.229963302612305, 4.725935935974121, 5.2219085693359375, 5.717880725860596, 6.213853359222412, 6.7098259925842285, 7.205798149108887, 7.701770782470703, 8.19774341583252, 8.693716049194336, 9.189688682556152, 9.685661315917969, 10.181632995605469, 10.677606582641602, 11.173578262329102, 11.669550895690918, 12.165523529052734, 12.66149616241455, 13.157468795776367, 13.653441429138184, 14.1494140625, 14.6453857421875, 15.141358375549316, 15.637331008911133, 16.133304595947266, 16.629276275634766, 17.1252498626709, 17.6212215423584, 18.11719512939453, 18.61316680908203, 19.109140396118164, 19.605112075805664, 20.101083755493164]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 7.0, 7.0, 8.0, 7.0, 10.0, 14.0, 11.0, 18.0, 22.0, 16.0, 25.0, 39.0, 27.0, 32.0, 31.0, 39.0, 43.0, 31.0, 43.0, 35.0, 52.0, 45.0, 35.0, 47.0, 37.0, 47.0, 34.0, 34.0, 30.0, 23.0, 22.0, 23.0, 18.0, 16.0, 9.0, 8.0, 16.0, 3.0, 7.0, 9.0, 5.0, 6.0, 2.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.438998222351074, -5.249924182891846, -5.060850143432617, -4.871776103973389, -4.68270206451416, -4.493628025054932, -4.304553985595703, -4.115479469299316, -3.926405668258667, -3.7373316287994385, -3.54825758934021, -3.3591833114624023, -3.170109272003174, -2.9810352325439453, -2.791961193084717, -2.6028871536254883, -2.4138131141662598, -2.2247390747070312, -2.0356650352478027, -1.8465908765792847, -1.6575168371200562, -1.4684427976608276, -1.2793686389923096, -1.090294599533081, -0.9012205600738525, -0.712146520614624, -0.5230724215507507, -0.33399832248687744, -0.14492428302764893, 0.04414975643157959, 0.23322391510009766, 0.42229795455932617, 0.6113715171813965, 0.800445556640625, 0.9895196557044983, 1.1785937547683716, 1.3676677942276, 1.5567418336868286, 1.7458159923553467, 1.9348900318145752, 2.1239640712738037, 2.3130381107330322, 2.5021121501922607, 2.6911864280700684, 2.880260467529297, 3.0693345069885254, 3.258408546447754, 3.4474825859069824, 3.636556625366211, 3.8256306648254395, 4.014704704284668, 4.2037787437438965, 4.392852783203125, 4.5819268226623535, 4.771000862121582, 4.960075378417969, 5.149148941040039, 5.338222980499268, 5.527297019958496, 5.716371059417725, 5.905445098876953, 6.094519138336182, 6.28359317779541, 6.472667694091797, 6.661741733551025]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 7.0, 12.0, 7.0, 23.0, 35.0, 47.0, 114.0, 164.0, 312.0, 585.0, 1229.0, 2439.0, 5014.0, 11165.0, 24322.0, 54637.0, 121491.0, 274637.0, 306369.0, 134474.0, 61093.0, 27040.0, 12213.0, 5729.0, 2705.0, 1295.0, 645.0, 339.0, 168.0, 98.0, 70.0, 33.0, 21.0, 7.0, 8.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.474609375, -3.355072021484375, -3.23553466796875, -3.115997314453125, -2.9964599609375, -2.876922607421875, -2.75738525390625, -2.637847900390625, -2.518310546875, -2.398773193359375, -2.27923583984375, -2.159698486328125, -2.0401611328125, -1.920623779296875, -1.80108642578125, -1.681549072265625, -1.56201171875, -1.442474365234375, -1.32293701171875, -1.203399658203125, -1.0838623046875, -0.964324951171875, -0.84478759765625, -0.725250244140625, -0.605712890625, -0.486175537109375, -0.36663818359375, -0.247100830078125, -0.1275634765625, -0.008026123046875, 0.11151123046875, 0.231048583984375, 0.3505859375, 0.470123291015625, 0.58966064453125, 0.709197998046875, 0.8287353515625, 0.948272705078125, 1.06781005859375, 1.187347412109375, 1.306884765625, 1.426422119140625, 1.54595947265625, 1.665496826171875, 1.7850341796875, 1.904571533203125, 2.02410888671875, 2.143646240234375, 2.26318359375, 2.382720947265625, 2.50225830078125, 2.621795654296875, 2.7413330078125, 2.860870361328125, 2.98040771484375, 3.099945068359375, 3.219482421875, 3.339019775390625, 3.45855712890625, 3.578094482421875, 3.6976318359375, 3.817169189453125, 3.93670654296875, 4.056243896484375, 4.17578125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 9.0, 11.0, 8.0, 9.0, 11.0, 13.0, 20.0, 13.0, 19.0, 26.0, 22.0, 36.0, 29.0, 31.0, 28.0, 30.0, 33.0, 51.0, 44.0, 40.0, 48.0, 40.0, 36.0, 32.0, 32.0, 33.0, 37.0, 24.0, 30.0, 31.0, 21.0, 19.0, 18.0, 19.0, 17.0, 19.0, 10.0, 14.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.60107421875, -0.5817489624023438, -0.5624237060546875, -0.5430984497070312, -0.523773193359375, -0.5044479370117188, -0.4851226806640625, -0.46579742431640625, -0.44647216796875, -0.42714691162109375, -0.4078216552734375, -0.38849639892578125, -0.369171142578125, -0.34984588623046875, -0.3305206298828125, -0.31119537353515625, -0.2918701171875, -0.27254486083984375, -0.2532196044921875, -0.23389434814453125, -0.214569091796875, -0.19524383544921875, -0.1759185791015625, -0.15659332275390625, -0.13726806640625, -0.11794281005859375, -0.0986175537109375, -0.07929229736328125, -0.059967041015625, -0.04064178466796875, -0.0213165283203125, -0.00199127197265625, 0.017333984375, 0.03665924072265625, 0.0559844970703125, 0.07530975341796875, 0.094635009765625, 0.11396026611328125, 0.1332855224609375, 0.15261077880859375, 0.17193603515625, 0.19126129150390625, 0.2105865478515625, 0.22991180419921875, 0.249237060546875, 0.26856231689453125, 0.2878875732421875, 0.30721282958984375, 0.3265380859375, 0.34586334228515625, 0.3651885986328125, 0.38451385498046875, 0.403839111328125, 0.42316436767578125, 0.4424896240234375, 0.46181488037109375, 0.48114013671875, 0.5004653930664062, 0.5197906494140625, 0.5391159057617188, 0.558441162109375, 0.5777664184570312, 0.5970916748046875, 0.6164169311523438, 0.6357421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 11.0, 11.0, 16.0, 18.0, 29.0, 35.0, 65.0, 69.0, 105.0, 184.0, 280.0, 460.0, 851.0, 1882.0, 5296.0, 21074.0, 114419.0, 563176.0, 275833.0, 48685.0, 10037.0, 3116.0, 1247.0, 631.0, 357.0, 221.0, 140.0, 94.0, 61.0, 38.0, 21.0, 24.0, 13.0, 12.0, 5.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.48968505859375, -5.2918701171875, -5.09405517578125, -4.896240234375, -4.69842529296875, -4.5006103515625, -4.30279541015625, -4.10498046875, -3.90716552734375, -3.7093505859375, -3.51153564453125, -3.313720703125, -3.11590576171875, -2.9180908203125, -2.72027587890625, -2.5224609375, -2.32464599609375, -2.1268310546875, -1.92901611328125, -1.731201171875, -1.53338623046875, -1.3355712890625, -1.13775634765625, -0.93994140625, -0.74212646484375, -0.5443115234375, -0.34649658203125, -0.148681640625, 0.04913330078125, 0.2469482421875, 0.44476318359375, 0.642578125, 0.84039306640625, 1.0382080078125, 1.23602294921875, 1.433837890625, 1.63165283203125, 1.8294677734375, 2.02728271484375, 2.22509765625, 2.42291259765625, 2.6207275390625, 2.81854248046875, 3.016357421875, 3.21417236328125, 3.4119873046875, 3.60980224609375, 3.8076171875, 4.00543212890625, 4.2032470703125, 4.40106201171875, 4.598876953125, 4.79669189453125, 4.9945068359375, 5.19232177734375, 5.39013671875, 5.58795166015625, 5.7857666015625, 5.98358154296875, 6.181396484375, 6.37921142578125, 6.5770263671875, 6.77484130859375, 6.97265625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 7.0, 5.0, 7.0, 7.0, 14.0, 12.0, 14.0, 23.0, 22.0, 37.0, 36.0, 39.0, 38.0, 48.0, 41.0, 49.0, 57.0, 55.0, 44.0, 49.0, 50.0, 53.0, 30.0, 36.0, 34.0, 28.0, 23.0, 23.0, 16.0, 21.0, 14.0, 10.0, 13.0, 11.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.21484375, -4.0980224609375, -3.981201171875, -3.8643798828125, -3.74755859375, -3.6307373046875, -3.513916015625, -3.3970947265625, -3.2802734375, -3.1634521484375, -3.046630859375, -2.9298095703125, -2.81298828125, -2.6961669921875, -2.579345703125, -2.4625244140625, -2.345703125, -2.2288818359375, -2.112060546875, -1.9952392578125, -1.87841796875, -1.7615966796875, -1.644775390625, -1.5279541015625, -1.4111328125, -1.2943115234375, -1.177490234375, -1.0606689453125, -0.94384765625, -0.8270263671875, -0.710205078125, -0.5933837890625, -0.4765625, -0.3597412109375, -0.242919921875, -0.1260986328125, -0.00927734375, 0.1075439453125, 0.224365234375, 0.3411865234375, 0.4580078125, 0.5748291015625, 0.691650390625, 0.8084716796875, 0.92529296875, 1.0421142578125, 1.158935546875, 1.2757568359375, 1.392578125, 1.5093994140625, 1.626220703125, 1.7430419921875, 1.85986328125, 1.9766845703125, 2.093505859375, 2.2103271484375, 2.3271484375, 2.4439697265625, 2.560791015625, 2.6776123046875, 2.79443359375, 2.9112548828125, 3.028076171875, 3.1448974609375, 3.26171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 11.0, 15.0, 14.0, 33.0, 46.0, 84.0, 117.0, 227.0, 387.0, 708.0, 1426.0, 2872.0, 6586.0, 17132.0, 51023.0, 220846.0, 557813.0, 131090.0, 35709.0, 12512.0, 5125.0, 2319.0, 1065.0, 554.0, 338.0, 179.0, 108.0, 77.0, 42.0, 33.0, 19.0, 12.0, 6.0, 4.0, 6.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73046875, -2.630615234375, -2.53076171875, -2.430908203125, -2.3310546875, -2.231201171875, -2.13134765625, -2.031494140625, -1.931640625, -1.831787109375, -1.73193359375, -1.632080078125, -1.5322265625, -1.432373046875, -1.33251953125, -1.232666015625, -1.1328125, -1.032958984375, -0.93310546875, -0.833251953125, -0.7333984375, -0.633544921875, -0.53369140625, -0.433837890625, -0.333984375, -0.234130859375, -0.13427734375, -0.034423828125, 0.0654296875, 0.165283203125, 0.26513671875, 0.364990234375, 0.46484375, 0.564697265625, 0.66455078125, 0.764404296875, 0.8642578125, 0.964111328125, 1.06396484375, 1.163818359375, 1.263671875, 1.363525390625, 1.46337890625, 1.563232421875, 1.6630859375, 1.762939453125, 1.86279296875, 1.962646484375, 2.0625, 2.162353515625, 2.26220703125, 2.362060546875, 2.4619140625, 2.561767578125, 2.66162109375, 2.761474609375, 2.861328125, 2.961181640625, 3.06103515625, 3.160888671875, 3.2607421875, 3.360595703125, 3.46044921875, 3.560302734375, 3.66015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 11.0, 16.0, 8.0, 22.0, 24.0, 41.0, 39.0, 47.0, 78.0, 152.0, 176.0, 98.0, 64.0, 50.0, 28.0, 27.0, 27.0, 20.0, 13.0, 11.0, 6.0, 1.0, 7.0, 7.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0008950233459472656, -0.0008702576160430908, -0.000845491886138916, -0.0008207261562347412, -0.0007959604263305664, -0.0007711946964263916, -0.0007464289665222168, -0.000721663236618042, -0.0006968975067138672, -0.0006721317768096924, -0.0006473660469055176, -0.0006226003170013428, -0.000597834587097168, -0.0005730688571929932, -0.0005483031272888184, -0.0005235373973846436, -0.0004987716674804688, -0.00047400593757629395, -0.00044924020767211914, -0.00042447447776794434, -0.00039970874786376953, -0.0003749430179595947, -0.0003501772880554199, -0.0003254115581512451, -0.0003006458282470703, -0.0002758800983428955, -0.0002511143684387207, -0.0002263486385345459, -0.0002015829086303711, -0.0001768171787261963, -0.00015205144882202148, -0.00012728571891784668, -0.00010251998901367188, -7.775425910949707e-05, -5.2988529205322266e-05, -2.822279930114746e-05, -3.4570693969726562e-06, 2.130866050720215e-05, 4.607439041137695e-05, 7.084012031555176e-05, 9.560585021972656e-05, 0.00012037158012390137, 0.00014513731002807617, 0.00016990303993225098, 0.00019466876983642578, 0.00021943449974060059, 0.0002442002296447754, 0.0002689659595489502, 0.000293731689453125, 0.0003184974193572998, 0.0003432631492614746, 0.0003680288791656494, 0.0003927946090698242, 0.000417560338973999, 0.00044232606887817383, 0.00046709179878234863, 0.0004918575286865234, 0.0005166232585906982, 0.000541388988494873, 0.0005661547183990479, 0.0005909204483032227, 0.0006156861782073975, 0.0006404519081115723, 0.0006652176380157471, 0.0006899833679199219]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 9.0, 10.0, 12.0, 16.0, 16.0, 43.0, 37.0, 69.0, 121.0, 150.0, 258.0, 468.0, 929.0, 2314.0, 6301.0, 22679.0, 103808.0, 660070.0, 200233.0, 35886.0, 9355.0, 3027.0, 1216.0, 590.0, 317.0, 202.0, 123.0, 74.0, 62.0, 44.0, 23.0, 27.0, 13.0, 14.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.53515625, -4.407989501953125, -4.28082275390625, -4.153656005859375, -4.0264892578125, -3.899322509765625, -3.77215576171875, -3.644989013671875, -3.517822265625, -3.390655517578125, -3.26348876953125, -3.136322021484375, -3.0091552734375, -2.881988525390625, -2.75482177734375, -2.627655029296875, -2.50048828125, -2.373321533203125, -2.24615478515625, -2.118988037109375, -1.9918212890625, -1.864654541015625, -1.73748779296875, -1.610321044921875, -1.483154296875, -1.355987548828125, -1.22882080078125, -1.101654052734375, -0.9744873046875, -0.847320556640625, -0.72015380859375, -0.592987060546875, -0.4658203125, -0.338653564453125, -0.21148681640625, -0.084320068359375, 0.0428466796875, 0.170013427734375, 0.29718017578125, 0.424346923828125, 0.551513671875, 0.678680419921875, 0.80584716796875, 0.933013916015625, 1.0601806640625, 1.187347412109375, 1.31451416015625, 1.441680908203125, 1.56884765625, 1.696014404296875, 1.82318115234375, 1.950347900390625, 2.0775146484375, 2.204681396484375, 2.33184814453125, 2.459014892578125, 2.586181640625, 2.713348388671875, 2.84051513671875, 2.967681884765625, 3.0948486328125, 3.222015380859375, 3.34918212890625, 3.476348876953125, 3.603515625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 7.0, 2.0, 2.0, 7.0, 8.0, 11.0, 12.0, 15.0, 11.0, 22.0, 30.0, 39.0, 42.0, 86.0, 90.0, 129.0, 124.0, 94.0, 60.0, 58.0, 36.0, 24.0, 18.0, 9.0, 14.0, 6.0, 4.0, 10.0, 1.0, 7.0, 7.0, 2.0, 6.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.541015625, -2.461456298828125, -2.38189697265625, -2.302337646484375, -2.2227783203125, -2.143218994140625, -2.06365966796875, -1.984100341796875, -1.904541015625, -1.824981689453125, -1.74542236328125, -1.665863037109375, -1.5863037109375, -1.506744384765625, -1.42718505859375, -1.347625732421875, -1.26806640625, -1.188507080078125, -1.10894775390625, -1.029388427734375, -0.9498291015625, -0.870269775390625, -0.79071044921875, -0.711151123046875, -0.631591796875, -0.552032470703125, -0.47247314453125, -0.392913818359375, -0.3133544921875, -0.233795166015625, -0.15423583984375, -0.074676513671875, 0.0048828125, 0.084442138671875, 0.16400146484375, 0.243560791015625, 0.3231201171875, 0.402679443359375, 0.48223876953125, 0.561798095703125, 0.641357421875, 0.720916748046875, 0.80047607421875, 0.880035400390625, 0.9595947265625, 1.039154052734375, 1.11871337890625, 1.198272705078125, 1.27783203125, 1.357391357421875, 1.43695068359375, 1.516510009765625, 1.5960693359375, 1.675628662109375, 1.75518798828125, 1.834747314453125, 1.914306640625, 1.993865966796875, 2.07342529296875, 2.152984619140625, 2.2325439453125, 2.312103271484375, 2.39166259765625, 2.471221923828125, 2.55078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 15.0, 26.0, 56.0, 70.0, 121.0, 145.0, 160.0, 136.0, 97.0, 71.0, 45.0, 17.0, 14.0, 7.0, 7.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.233734130859375, -37.92694854736328, -36.62016296386719, -35.31338119506836, -34.006595611572266, -32.69981002807617, -31.393024444580078, -30.086238861083984, -28.779455184936523, -27.47266960144043, -26.16588592529297, -24.859100341796875, -23.55231475830078, -22.24553108215332, -20.938745498657227, -19.631961822509766, -18.325176239013672, -17.018390655517578, -15.711606979370117, -14.404821395874023, -13.098036766052246, -11.791252136230469, -10.484466552734375, -9.177681922912598, -7.87089729309082, -6.564112663269043, -5.257327556610107, -3.950542688369751, -2.6437578201293945, -1.3369731903076172, -0.03018808364868164, 1.276597023010254, 2.5833816528320312, 3.8901665210723877, 5.196951389312744, 6.50373649597168, 7.810521125793457, 9.117305755615234, 10.424091339111328, 11.730875968933105, 13.037660598754883, 14.34444522857666, 15.651229858398438, 16.95801544189453, 18.264801025390625, 19.571584701538086, 20.87837028503418, 22.18515396118164, 23.491939544677734, 24.798725128173828, 26.10550880432129, 27.412294387817383, 28.719078063964844, 30.025863647460938, 31.33264923095703, 32.639434814453125, 33.94622039794922, 35.25300598144531, 36.559791564941406, 37.866573333740234, 39.17335891723633, 40.48014450073242, 41.786930084228516, 43.09371566772461, 44.40049743652344]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 1.0, 3.0, 5.0, 10.0, 10.0, 11.0, 14.0, 11.0, 15.0, 12.0, 18.0, 22.0, 24.0, 30.0, 41.0, 32.0, 35.0, 38.0, 54.0, 35.0, 31.0, 41.0, 37.0, 38.0, 38.0, 34.0, 32.0, 35.0, 33.0, 33.0, 25.0, 24.0, 27.0, 19.0, 17.0, 22.0, 16.0, 12.0, 10.0, 14.0, 15.0, 7.0, 6.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.692367553710938, -16.12466812133789, -15.556970596313477, -14.989272117614746, -14.421573638916016, -13.853874206542969, -13.286175727844238, -12.718477249145508, -12.150778770446777, -11.583080291748047, -11.015381813049316, -10.447683334350586, -9.879983901977539, -9.312286376953125, -8.744586944580078, -8.176888465881348, -7.609189987182617, -7.041491508483887, -6.473793029785156, -5.906094074249268, -5.338395595550537, -4.770697116851807, -4.202998161315918, -3.6352996826171875, -3.067601203918457, -2.4999027252197266, -1.932204008102417, -1.364505410194397, -0.796806812286377, -0.22910833358764648, 0.3385903835296631, 0.9062891006469727, 1.473989486694336, 2.0416879653930664, 2.609386682510376, 3.1770853996276855, 3.744783878326416, 4.3124823570251465, 4.880181312561035, 5.447879791259766, 6.015578269958496, 6.583276748657227, 7.150975227355957, 7.718674182891846, 8.286373138427734, 8.854070663452148, 9.421770095825195, 9.989468574523926, 10.557167053222656, 11.124865531921387, 11.692564010620117, 12.260262489318848, 12.827960968017578, 13.395660400390625, 13.963358879089355, 14.531057357788086, 15.098755836486816, 15.666454315185547, 16.234153747558594, 16.801851272583008, 17.369550704956055, 17.93724822998047, 18.504947662353516, 19.072647094726562, 19.640344619750977]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 9.0, 16.0, 28.0, 30.0, 36.0, 42.0, 68.0, 146.0, 195.0, 337.0, 563.0, 984.0, 1718.0, 3140.0, 6187.0, 12422.0, 27368.0, 69743.0, 236498.0, 2974015.0, 650680.0, 127733.0, 44492.0, 18598.0, 8748.0, 4578.0, 2435.0, 1397.0, 811.0, 460.0, 294.0, 163.0, 129.0, 65.0, 48.0, 25.0, 24.0, 20.0, 13.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.890625, -3.7818603515625, -3.673095703125, -3.5643310546875, -3.45556640625, -3.3468017578125, -3.238037109375, -3.1292724609375, -3.0205078125, -2.9117431640625, -2.802978515625, -2.6942138671875, -2.58544921875, -2.4766845703125, -2.367919921875, -2.2591552734375, -2.150390625, -2.0416259765625, -1.932861328125, -1.8240966796875, -1.71533203125, -1.6065673828125, -1.497802734375, -1.3890380859375, -1.2802734375, -1.1715087890625, -1.062744140625, -0.9539794921875, -0.84521484375, -0.7364501953125, -0.627685546875, -0.5189208984375, -0.41015625, -0.3013916015625, -0.192626953125, -0.0838623046875, 0.02490234375, 0.1336669921875, 0.242431640625, 0.3511962890625, 0.4599609375, 0.5687255859375, 0.677490234375, 0.7862548828125, 0.89501953125, 1.0037841796875, 1.112548828125, 1.2213134765625, 1.330078125, 1.4388427734375, 1.547607421875, 1.6563720703125, 1.76513671875, 1.8739013671875, 1.982666015625, 2.0914306640625, 2.2001953125, 2.3089599609375, 2.417724609375, 2.5264892578125, 2.63525390625, 2.7440185546875, 2.852783203125, 2.9615478515625, 3.0703125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 12.0, 9.0, 4.0, 12.0, 8.0, 27.0, 19.0, 23.0, 23.0, 43.0, 31.0, 39.0, 37.0, 41.0, 52.0, 46.0, 45.0, 68.0, 46.0, 39.0, 49.0, 54.0, 32.0, 29.0, 38.0, 35.0, 26.0, 21.0, 16.0, 15.0, 11.0, 8.0, 16.0, 6.0, 10.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 4.0], "bins": [-1.005859375, -0.9802932739257812, -0.9547271728515625, -0.9291610717773438, -0.903594970703125, -0.8780288696289062, -0.8524627685546875, -0.8268966674804688, -0.80133056640625, -0.7757644653320312, -0.7501983642578125, -0.7246322631835938, -0.699066162109375, -0.6735000610351562, -0.6479339599609375, -0.6223678588867188, -0.5968017578125, -0.5712356567382812, -0.5456695556640625, -0.5201034545898438, -0.494537353515625, -0.46897125244140625, -0.4434051513671875, -0.41783905029296875, -0.39227294921875, -0.36670684814453125, -0.3411407470703125, -0.31557464599609375, -0.290008544921875, -0.26444244384765625, -0.2388763427734375, -0.21331024169921875, -0.187744140625, -0.16217803955078125, -0.1366119384765625, -0.11104583740234375, -0.085479736328125, -0.05991363525390625, -0.0343475341796875, -0.00878143310546875, 0.01678466796875, 0.04235076904296875, 0.0679168701171875, 0.09348297119140625, 0.119049072265625, 0.14461517333984375, 0.1701812744140625, 0.19574737548828125, 0.2213134765625, 0.24687957763671875, 0.2724456787109375, 0.29801177978515625, 0.323577880859375, 0.34914398193359375, 0.3747100830078125, 0.40027618408203125, 0.42584228515625, 0.45140838623046875, 0.4769744873046875, 0.5025405883789062, 0.528106689453125, 0.5536727905273438, 0.5792388916015625, 0.6048049926757812, 0.63037109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 7.0, 8.0, 15.0, 13.0, 16.0, 49.0, 41.0, 90.0, 111.0, 177.0, 325.0, 553.0, 1022.0, 1914.0, 3922.0, 8206.0, 18898.0, 49706.0, 160709.0, 1159068.0, 2475854.0, 211784.0, 60969.0, 22244.0, 9350.0, 4393.0, 2086.0, 1166.0, 646.0, 344.0, 205.0, 136.0, 91.0, 59.0, 36.0, 25.0, 13.0, 13.0, 5.0, 3.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.223876953125, -4.09228515625, -3.960693359375, -3.8291015625, -3.697509765625, -3.56591796875, -3.434326171875, -3.302734375, -3.171142578125, -3.03955078125, -2.907958984375, -2.7763671875, -2.644775390625, -2.51318359375, -2.381591796875, -2.25, -2.118408203125, -1.98681640625, -1.855224609375, -1.7236328125, -1.592041015625, -1.46044921875, -1.328857421875, -1.197265625, -1.065673828125, -0.93408203125, -0.802490234375, -0.6708984375, -0.539306640625, -0.40771484375, -0.276123046875, -0.14453125, -0.012939453125, 0.11865234375, 0.250244140625, 0.3818359375, 0.513427734375, 0.64501953125, 0.776611328125, 0.908203125, 1.039794921875, 1.17138671875, 1.302978515625, 1.4345703125, 1.566162109375, 1.69775390625, 1.829345703125, 1.9609375, 2.092529296875, 2.22412109375, 2.355712890625, 2.4873046875, 2.618896484375, 2.75048828125, 2.882080078125, 3.013671875, 3.145263671875, 3.27685546875, 3.408447265625, 3.5400390625, 3.671630859375, 3.80322265625, 3.934814453125, 4.06640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 10.0, 11.0, 17.0, 13.0, 26.0, 38.0, 35.0, 59.0, 87.0, 125.0, 234.0, 472.0, 1502.0, 700.0, 265.0, 149.0, 102.0, 68.0, 40.0, 32.0, 22.0, 24.0, 7.0, 9.0, 4.0, 7.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.603515625, -2.52386474609375, -2.4442138671875, -2.36456298828125, -2.284912109375, -2.20526123046875, -2.1256103515625, -2.04595947265625, -1.96630859375, -1.88665771484375, -1.8070068359375, -1.72735595703125, -1.647705078125, -1.56805419921875, -1.4884033203125, -1.40875244140625, -1.3291015625, -1.24945068359375, -1.1697998046875, -1.09014892578125, -1.010498046875, -0.93084716796875, -0.8511962890625, -0.77154541015625, -0.69189453125, -0.61224365234375, -0.5325927734375, -0.45294189453125, -0.373291015625, -0.29364013671875, -0.2139892578125, -0.13433837890625, -0.0546875, 0.02496337890625, 0.1046142578125, 0.18426513671875, 0.263916015625, 0.34356689453125, 0.4232177734375, 0.50286865234375, 0.58251953125, 0.66217041015625, 0.7418212890625, 0.82147216796875, 0.901123046875, 0.98077392578125, 1.0604248046875, 1.14007568359375, 1.2197265625, 1.29937744140625, 1.3790283203125, 1.45867919921875, 1.538330078125, 1.61798095703125, 1.6976318359375, 1.77728271484375, 1.85693359375, 1.93658447265625, 2.0162353515625, 2.09588623046875, 2.175537109375, 2.25518798828125, 2.3348388671875, 2.41448974609375, 2.494140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 12.0, 28.0, 45.0, 117.0, 193.0, 235.0, 176.0, 119.0, 42.0, 17.0, 7.0, 4.0, 3.0], "bins": [-53.71420669555664, -52.76578903198242, -51.8173713684082, -50.868953704833984, -49.920536041259766, -48.97211837768555, -48.02370071411133, -47.075279235839844, -46.126861572265625, -45.178443908691406, -44.23002624511719, -43.28160858154297, -42.33319091796875, -41.38477325439453, -40.43635559082031, -39.487937927246094, -38.539520263671875, -37.591102600097656, -36.64268493652344, -35.69426727294922, -34.745849609375, -33.79743194580078, -32.84901428222656, -31.90059471130371, -30.952177047729492, -30.003759384155273, -29.055341720581055, -28.106924057006836, -27.158504486083984, -26.210086822509766, -25.261669158935547, -24.313251495361328, -23.364835739135742, -22.416418075561523, -21.468000411987305, -20.519582748413086, -19.571163177490234, -18.622745513916016, -17.674327850341797, -16.725910186767578, -15.77749252319336, -14.82907485961914, -13.880657196044922, -12.932238578796387, -11.983820915222168, -11.03540325164795, -10.086984634399414, -9.138566970825195, -8.190149307250977, -7.241731643676758, -6.293313503265381, -5.344895362854004, -4.396477699279785, -3.4480600357055664, -2.4996418952941895, -1.5512237548828125, -0.6028060913085938, 0.3456118106842041, 1.294029712677002, 2.2424476146698, 3.1908655166625977, 4.139283180236816, 5.087701320648193, 6.03611946105957, 6.984537124633789]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 6.0, 11.0, 10.0, 16.0, 12.0, 25.0, 18.0, 35.0, 28.0, 36.0, 40.0, 27.0, 32.0, 53.0, 37.0, 33.0, 42.0, 44.0, 45.0, 39.0, 44.0, 38.0, 18.0, 42.0, 28.0, 30.0, 28.0, 22.0, 28.0, 22.0, 15.0, 15.0, 18.0, 6.0, 6.0, 7.0, 6.0, 4.0, 7.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0], "bins": [-9.243200302124023, -8.972718238830566, -8.70223617553711, -8.431754112243652, -8.161272048950195, -7.890789985656738, -7.620307922363281, -7.349825859069824, -7.079343795776367, -6.80886173248291, -6.538379669189453, -6.267897605895996, -5.997415542602539, -5.726933479309082, -5.456451416015625, -5.185969352722168, -4.915487289428711, -4.645005226135254, -4.374523162841797, -4.10404109954834, -3.833559036254883, -3.563076972961426, -3.2925949096679688, -3.0221128463745117, -2.7516307830810547, -2.4811487197875977, -2.2106666564941406, -1.9401845932006836, -1.6697025299072266, -1.3992204666137695, -1.1287384033203125, -0.8582563400268555, -0.5877742767333984, -0.3172922134399414, -0.046810150146484375, 0.22367191314697266, 0.4941539764404297, 0.7646360397338867, 1.0351181030273438, 1.3056001663208008, 1.5760822296142578, 1.8465642929077148, 2.117046356201172, 2.387528419494629, 2.658010482788086, 2.928492546081543, 3.198974609375, 3.469456672668457, 3.739938735961914, 4.010420799255371, 4.280902862548828, 4.551384925842285, 4.821866989135742, 5.092349052429199, 5.362831115722656, 5.633313179016113, 5.90379524230957, 6.174277305603027, 6.444759368896484, 6.715241432189941, 6.985723495483398, 7.2562055587768555, 7.5266876220703125, 7.7971696853637695, 8.067651748657227]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 9.0, 20.0, 32.0, 66.0, 101.0, 165.0, 280.0, 539.0, 1011.0, 1978.0, 3785.0, 8280.0, 18004.0, 41274.0, 102778.0, 408723.0, 310527.0, 85766.0, 34968.0, 15714.0, 7211.0, 3553.0, 1742.0, 915.0, 475.0, 273.0, 165.0, 75.0, 51.0, 27.0, 14.0, 9.0, 8.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.8804931640625, -3.741455078125, -3.6024169921875, -3.46337890625, -3.3243408203125, -3.185302734375, -3.0462646484375, -2.9072265625, -2.7681884765625, -2.629150390625, -2.4901123046875, -2.35107421875, -2.2120361328125, -2.072998046875, -1.9339599609375, -1.794921875, -1.6558837890625, -1.516845703125, -1.3778076171875, -1.23876953125, -1.0997314453125, -0.960693359375, -0.8216552734375, -0.6826171875, -0.5435791015625, -0.404541015625, -0.2655029296875, -0.12646484375, 0.0125732421875, 0.151611328125, 0.2906494140625, 0.4296875, 0.5687255859375, 0.707763671875, 0.8468017578125, 0.98583984375, 1.1248779296875, 1.263916015625, 1.4029541015625, 1.5419921875, 1.6810302734375, 1.820068359375, 1.9591064453125, 2.09814453125, 2.2371826171875, 2.376220703125, 2.5152587890625, 2.654296875, 2.7933349609375, 2.932373046875, 3.0714111328125, 3.21044921875, 3.3494873046875, 3.488525390625, 3.6275634765625, 3.7666015625, 3.9056396484375, 4.044677734375, 4.1837158203125, 4.32275390625, 4.4617919921875, 4.600830078125, 4.7398681640625, 4.87890625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 4.0, 5.0, 18.0, 9.0, 14.0, 22.0, 28.0, 24.0, 41.0, 29.0, 55.0, 37.0, 45.0, 56.0, 64.0, 46.0, 50.0, 49.0, 52.0, 61.0, 41.0, 40.0, 50.0, 22.0, 29.0, 27.0, 17.0, 14.0, 13.0, 11.0, 11.0, 1.0, 3.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.083984375, -1.053802490234375, -1.02362060546875, -0.993438720703125, -0.9632568359375, -0.933074951171875, -0.90289306640625, -0.872711181640625, -0.842529296875, -0.812347412109375, -0.78216552734375, -0.751983642578125, -0.7218017578125, -0.691619873046875, -0.66143798828125, -0.631256103515625, -0.60107421875, -0.570892333984375, -0.54071044921875, -0.510528564453125, -0.4803466796875, -0.450164794921875, -0.41998291015625, -0.389801025390625, -0.359619140625, -0.329437255859375, -0.29925537109375, -0.269073486328125, -0.2388916015625, -0.208709716796875, -0.17852783203125, -0.148345947265625, -0.1181640625, -0.087982177734375, -0.05780029296875, -0.027618408203125, 0.0025634765625, 0.032745361328125, 0.06292724609375, 0.093109130859375, 0.123291015625, 0.153472900390625, 0.18365478515625, 0.213836669921875, 0.2440185546875, 0.274200439453125, 0.30438232421875, 0.334564208984375, 0.36474609375, 0.394927978515625, 0.42510986328125, 0.455291748046875, 0.4854736328125, 0.515655517578125, 0.54583740234375, 0.576019287109375, 0.606201171875, 0.636383056640625, 0.66656494140625, 0.696746826171875, 0.7269287109375, 0.757110595703125, 0.78729248046875, 0.817474365234375, 0.84765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 3.0, 13.0, 11.0, 11.0, 16.0, 16.0, 21.0, 32.0, 39.0, 49.0, 60.0, 103.0, 123.0, 150.0, 234.0, 353.0, 563.0, 950.0, 2043.0, 5101.0, 16533.0, 75812.0, 621845.0, 264882.0, 41826.0, 10288.0, 3543.0, 1575.0, 767.0, 475.0, 329.0, 199.0, 125.0, 119.0, 71.0, 59.0, 35.0, 35.0, 25.0, 26.0, 16.0, 19.0, 15.0, 12.0, 10.0, 3.0, 4.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.66015625, -6.44403076171875, -6.2279052734375, -6.01177978515625, -5.795654296875, -5.57952880859375, -5.3634033203125, -5.14727783203125, -4.93115234375, -4.71502685546875, -4.4989013671875, -4.28277587890625, -4.066650390625, -3.85052490234375, -3.6343994140625, -3.41827392578125, -3.2021484375, -2.98602294921875, -2.7698974609375, -2.55377197265625, -2.337646484375, -2.12152099609375, -1.9053955078125, -1.68927001953125, -1.47314453125, -1.25701904296875, -1.0408935546875, -0.82476806640625, -0.608642578125, -0.39251708984375, -0.1763916015625, 0.03973388671875, 0.255859375, 0.47198486328125, 0.6881103515625, 0.90423583984375, 1.120361328125, 1.33648681640625, 1.5526123046875, 1.76873779296875, 1.98486328125, 2.20098876953125, 2.4171142578125, 2.63323974609375, 2.849365234375, 3.06549072265625, 3.2816162109375, 3.49774169921875, 3.7138671875, 3.92999267578125, 4.1461181640625, 4.36224365234375, 4.578369140625, 4.79449462890625, 5.0106201171875, 5.22674560546875, 5.44287109375, 5.65899658203125, 5.8751220703125, 6.09124755859375, 6.307373046875, 6.52349853515625, 6.7396240234375, 6.95574951171875, 7.171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 9.0, 7.0, 13.0, 21.0, 24.0, 26.0, 26.0, 38.0, 32.0, 43.0, 44.0, 62.0, 60.0, 58.0, 64.0, 42.0, 66.0, 53.0, 49.0, 35.0, 37.0, 36.0, 28.0, 30.0, 20.0, 11.0, 10.0, 14.0, 7.0, 4.0, 4.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.3687744140625, -4.214111328125, -4.0594482421875, -3.90478515625, -3.7501220703125, -3.595458984375, -3.4407958984375, -3.2861328125, -3.1314697265625, -2.976806640625, -2.8221435546875, -2.66748046875, -2.5128173828125, -2.358154296875, -2.2034912109375, -2.048828125, -1.8941650390625, -1.739501953125, -1.5848388671875, -1.43017578125, -1.2755126953125, -1.120849609375, -0.9661865234375, -0.8115234375, -0.6568603515625, -0.502197265625, -0.3475341796875, -0.19287109375, -0.0382080078125, 0.116455078125, 0.2711181640625, 0.42578125, 0.5804443359375, 0.735107421875, 0.8897705078125, 1.04443359375, 1.1990966796875, 1.353759765625, 1.5084228515625, 1.6630859375, 1.8177490234375, 1.972412109375, 2.1270751953125, 2.28173828125, 2.4364013671875, 2.591064453125, 2.7457275390625, 2.900390625, 3.0550537109375, 3.209716796875, 3.3643798828125, 3.51904296875, 3.6737060546875, 3.828369140625, 3.9830322265625, 4.1376953125, 4.2923583984375, 4.447021484375, 4.6016845703125, 4.75634765625, 4.9110107421875, 5.065673828125, 5.2203369140625, 5.375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 6.0, 4.0, 9.0, 4.0, 24.0, 31.0, 44.0, 58.0, 95.0, 167.0, 293.0, 637.0, 1312.0, 3446.0, 11239.0, 57034.0, 812786.0, 133025.0, 19608.0, 5139.0, 1831.0, 861.0, 358.0, 191.0, 131.0, 61.0, 49.0, 32.0, 25.0, 17.0, 9.0, 4.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.4140625, -5.218505859375, -5.02294921875, -4.827392578125, -4.6318359375, -4.436279296875, -4.24072265625, -4.045166015625, -3.849609375, -3.654052734375, -3.45849609375, -3.262939453125, -3.0673828125, -2.871826171875, -2.67626953125, -2.480712890625, -2.28515625, -2.089599609375, -1.89404296875, -1.698486328125, -1.5029296875, -1.307373046875, -1.11181640625, -0.916259765625, -0.720703125, -0.525146484375, -0.32958984375, -0.134033203125, 0.0615234375, 0.257080078125, 0.45263671875, 0.648193359375, 0.84375, 1.039306640625, 1.23486328125, 1.430419921875, 1.6259765625, 1.821533203125, 2.01708984375, 2.212646484375, 2.408203125, 2.603759765625, 2.79931640625, 2.994873046875, 3.1904296875, 3.385986328125, 3.58154296875, 3.777099609375, 3.97265625, 4.168212890625, 4.36376953125, 4.559326171875, 4.7548828125, 4.950439453125, 5.14599609375, 5.341552734375, 5.537109375, 5.732666015625, 5.92822265625, 6.123779296875, 6.3193359375, 6.514892578125, 6.71044921875, 6.906005859375, 7.1015625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 5.0, 7.0, 3.0, 5.0, 19.0, 18.0, 31.0, 48.0, 178.0, 532.0, 66.0, 40.0, 14.0, 13.0, 15.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015134811401367188, -0.0014388710260391235, -0.0013642609119415283, -0.001289650797843933, -0.0012150406837463379, -0.0011404305696487427, -0.0010658204555511475, -0.0009912103414535522, -0.000916600227355957, -0.0008419901132583618, -0.0007673799991607666, -0.0006927698850631714, -0.0006181597709655762, -0.000543549656867981, -0.00046893954277038574, -0.00039432942867279053, -0.0003197193145751953, -0.0002451092004776001, -0.00017049908638000488, -9.588897228240967e-05, -2.1278858184814453e-05, 5.333125591278076e-05, 0.00012794137001037598, 0.0002025514841079712, 0.0002771615982055664, 0.0003517717123031616, 0.00042638182640075684, 0.000500991940498352, 0.0005756020545959473, 0.0006502121686935425, 0.0007248222827911377, 0.0007994323968887329, 0.0008740425109863281, 0.0009486526250839233, 0.0010232627391815186, 0.0010978728532791138, 0.001172482967376709, 0.0012470930814743042, 0.0013217031955718994, 0.0013963133096694946, 0.0014709234237670898, 0.001545533537864685, 0.0016201436519622803, 0.0016947537660598755, 0.0017693638801574707, 0.001843973994255066, 0.0019185841083526611, 0.0019931942224502563, 0.0020678043365478516, 0.0021424144506454468, 0.002217024564743042, 0.002291634678840637, 0.0023662447929382324, 0.0024408549070358276, 0.002515465021133423, 0.002590075135231018, 0.0026646852493286133, 0.0027392953634262085, 0.0028139054775238037, 0.002888515591621399, 0.002963125705718994, 0.0030377358198165894, 0.0031123459339141846, 0.00318695604801178, 0.003261566162109375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 6.0, 1.0, 4.0, 7.0, 15.0, 16.0, 32.0, 33.0, 71.0, 111.0, 157.0, 279.0, 581.0, 1397.0, 4379.0, 25905.0, 686775.0, 303488.0, 19081.0, 3786.0, 1199.0, 532.0, 269.0, 137.0, 94.0, 61.0, 40.0, 25.0, 21.0, 12.0, 7.0, 9.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3125, -7.0760498046875, -6.839599609375, -6.6031494140625, -6.36669921875, -6.1302490234375, -5.893798828125, -5.6573486328125, -5.4208984375, -5.1844482421875, -4.947998046875, -4.7115478515625, -4.47509765625, -4.2386474609375, -4.002197265625, -3.7657470703125, -3.529296875, -3.2928466796875, -3.056396484375, -2.8199462890625, -2.58349609375, -2.3470458984375, -2.110595703125, -1.8741455078125, -1.6376953125, -1.4012451171875, -1.164794921875, -0.9283447265625, -0.69189453125, -0.4554443359375, -0.218994140625, 0.0174560546875, 0.25390625, 0.4903564453125, 0.726806640625, 0.9632568359375, 1.19970703125, 1.4361572265625, 1.672607421875, 1.9090576171875, 2.1455078125, 2.3819580078125, 2.618408203125, 2.8548583984375, 3.09130859375, 3.3277587890625, 3.564208984375, 3.8006591796875, 4.037109375, 4.2735595703125, 4.510009765625, 4.7464599609375, 4.98291015625, 5.2193603515625, 5.455810546875, 5.6922607421875, 5.9287109375, 6.1651611328125, 6.401611328125, 6.6380615234375, 6.87451171875, 7.1109619140625, 7.347412109375, 7.5838623046875, 7.8203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 3.0, 12.0, 15.0, 16.0, 20.0, 65.0, 103.0, 264.0, 249.0, 100.0, 46.0, 28.0, 14.0, 13.0, 13.0, 13.0, 8.0, 2.0, 2.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.4674072265625, -4.302001953125, -4.1365966796875, -3.97119140625, -3.8057861328125, -3.640380859375, -3.4749755859375, -3.3095703125, -3.1441650390625, -2.978759765625, -2.8133544921875, -2.64794921875, -2.4825439453125, -2.317138671875, -2.1517333984375, -1.986328125, -1.8209228515625, -1.655517578125, -1.4901123046875, -1.32470703125, -1.1593017578125, -0.993896484375, -0.8284912109375, -0.6630859375, -0.4976806640625, -0.332275390625, -0.1668701171875, -0.00146484375, 0.1639404296875, 0.329345703125, 0.4947509765625, 0.66015625, 0.8255615234375, 0.990966796875, 1.1563720703125, 1.32177734375, 1.4871826171875, 1.652587890625, 1.8179931640625, 1.9833984375, 2.1488037109375, 2.314208984375, 2.4796142578125, 2.64501953125, 2.8104248046875, 2.975830078125, 3.1412353515625, 3.306640625, 3.4720458984375, 3.637451171875, 3.8028564453125, 3.96826171875, 4.1336669921875, 4.299072265625, 4.4644775390625, 4.6298828125, 4.7952880859375, 4.960693359375, 5.1260986328125, 5.29150390625, 5.4569091796875, 5.622314453125, 5.7877197265625, 5.953125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 36.0, 66.0, 150.0, 221.0, 200.0, 151.0, 82.0, 42.0, 23.0, 11.0, 5.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-73.78518676757812, -71.61172485351562, -69.43827056884766, -67.26480865478516, -65.09134674072266, -62.91788864135742, -60.74443054199219, -58.57096862792969, -56.39751052856445, -54.22405242919922, -52.05059051513672, -49.877132415771484, -47.70367431640625, -45.53021240234375, -43.356754302978516, -41.18329620361328, -39.00983428955078, -36.83637619018555, -34.66291427612305, -32.48945617675781, -30.315996170043945, -28.142536163330078, -25.969078063964844, -23.795618057250977, -21.62215805053711, -19.448698043823242, -17.275238037109375, -15.10177993774414, -12.928319931030273, -10.754859924316406, -8.581400871276855, -6.407941818237305, -4.2344818115234375, -2.0610222816467285, 0.11243724822998047, 2.2858967781066895, 4.459356307983398, 6.632816314697266, 8.806275367736816, 10.979734420776367, 13.153194427490234, 15.326654434204102, 17.50011444091797, 19.673572540283203, 21.84703254699707, 24.020492553710938, 26.193950653076172, 28.36741065979004, 30.540870666503906, 32.71432876586914, 34.88779067993164, 37.061248779296875, 39.234710693359375, 41.40816879272461, 43.581626892089844, 45.755088806152344, 47.92854690551758, 50.10200500488281, 52.27546691894531, 54.44892501831055, 56.62238311767578, 58.79584503173828, 60.969303131103516, 63.14276123046875, 65.31622314453125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 2.0, 12.0, 7.0, 10.0, 19.0, 16.0, 18.0, 15.0, 26.0, 24.0, 30.0, 41.0, 34.0, 38.0, 46.0, 40.0, 50.0, 46.0, 49.0, 52.0, 41.0, 34.0, 42.0, 39.0, 37.0, 37.0, 24.0, 29.0, 26.0, 16.0, 17.0, 11.0, 9.0, 10.0, 14.0, 8.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.82617950439453, -19.105825424194336, -18.38547134399414, -17.665115356445312, -16.944761276245117, -16.224407196044922, -15.50405216217041, -14.783697128295898, -14.063343048095703, -13.342988967895508, -12.622633934020996, -11.902278900146484, -11.181924819946289, -10.461570739746094, -9.741215705871582, -9.02086067199707, -8.300506591796875, -7.5801520347595215, -6.859797477722168, -6.1394429206848145, -5.419088363647461, -4.698733806610107, -3.978379249572754, -3.2580246925354004, -2.537670135498047, -1.8173155784606934, -1.0969610214233398, -0.37660646438598633, 0.3437480926513672, 1.0641026496887207, 1.7844572067260742, 2.5048117637634277, 3.2251663208007812, 3.9455208778381348, 4.665875434875488, 5.386229991912842, 6.106584548950195, 6.826939105987549, 7.547293663024902, 8.267648696899414, 8.98800277709961, 9.708356857299805, 10.428711891174316, 11.149066925048828, 11.869421005249023, 12.589775085449219, 13.31013011932373, 14.030485153198242, 14.750839233398438, 15.471193313598633, 16.191547393798828, 16.911903381347656, 17.63225746154785, 18.352611541748047, 19.072967529296875, 19.79332160949707, 20.513675689697266, 21.23402976989746, 21.954383850097656, 22.674739837646484, 23.39509391784668, 24.115447998046875, 24.835803985595703, 25.5561580657959, 26.276512145996094]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 5.0, 6.0, 13.0, 13.0, 27.0, 35.0, 59.0, 88.0, 119.0, 193.0, 334.0, 576.0, 970.0, 1548.0, 2970.0, 5428.0, 11193.0, 24925.0, 66247.0, 283285.0, 3373917.0, 301901.0, 69620.0, 26109.0, 11705.0, 5708.0, 3090.0, 1712.0, 975.0, 565.0, 333.0, 212.0, 144.0, 77.0, 55.0, 45.0, 21.0, 12.0, 9.0, 12.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.06219482421875, -3.9290771484375, -3.79595947265625, -3.662841796875, -3.52972412109375, -3.3966064453125, -3.26348876953125, -3.13037109375, -2.99725341796875, -2.8641357421875, -2.73101806640625, -2.597900390625, -2.46478271484375, -2.3316650390625, -2.19854736328125, -2.0654296875, -1.93231201171875, -1.7991943359375, -1.66607666015625, -1.532958984375, -1.39984130859375, -1.2667236328125, -1.13360595703125, -1.00048828125, -0.86737060546875, -0.7342529296875, -0.60113525390625, -0.468017578125, -0.33489990234375, -0.2017822265625, -0.06866455078125, 0.064453125, 0.19757080078125, 0.3306884765625, 0.46380615234375, 0.596923828125, 0.73004150390625, 0.8631591796875, 0.99627685546875, 1.12939453125, 1.26251220703125, 1.3956298828125, 1.52874755859375, 1.661865234375, 1.79498291015625, 1.9281005859375, 2.06121826171875, 2.1943359375, 2.32745361328125, 2.4605712890625, 2.59368896484375, 2.726806640625, 2.85992431640625, 2.9930419921875, 3.12615966796875, 3.25927734375, 3.39239501953125, 3.5255126953125, 3.65863037109375, 3.791748046875, 3.92486572265625, 4.0579833984375, 4.19110107421875, 4.32421875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 4.0, 7.0, 17.0, 15.0, 19.0, 33.0, 25.0, 37.0, 48.0, 55.0, 60.0, 61.0, 63.0, 74.0, 61.0, 64.0, 62.0, 52.0, 46.0, 45.0, 32.0, 28.0, 28.0, 13.0, 12.0, 20.0, 9.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.46875, -1.4263916015625, -1.384033203125, -1.3416748046875, -1.29931640625, -1.2569580078125, -1.214599609375, -1.1722412109375, -1.1298828125, -1.0875244140625, -1.045166015625, -1.0028076171875, -0.96044921875, -0.9180908203125, -0.875732421875, -0.8333740234375, -0.791015625, -0.7486572265625, -0.706298828125, -0.6639404296875, -0.62158203125, -0.5792236328125, -0.536865234375, -0.4945068359375, -0.4521484375, -0.4097900390625, -0.367431640625, -0.3250732421875, -0.28271484375, -0.2403564453125, -0.197998046875, -0.1556396484375, -0.11328125, -0.0709228515625, -0.028564453125, 0.0137939453125, 0.05615234375, 0.0985107421875, 0.140869140625, 0.1832275390625, 0.2255859375, 0.2679443359375, 0.310302734375, 0.3526611328125, 0.39501953125, 0.4373779296875, 0.479736328125, 0.5220947265625, 0.564453125, 0.6068115234375, 0.649169921875, 0.6915283203125, 0.73388671875, 0.7762451171875, 0.818603515625, 0.8609619140625, 0.9033203125, 0.9456787109375, 0.988037109375, 1.0303955078125, 1.07275390625, 1.1151123046875, 1.157470703125, 1.1998291015625, 1.2421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 5.0, 14.0, 16.0, 29.0, 25.0, 51.0, 72.0, 115.0, 188.0, 314.0, 636.0, 1165.0, 2561.0, 6046.0, 17154.0, 63119.0, 471361.0, 3403998.0, 172809.0, 35105.0, 11042.0, 4269.0, 1927.0, 951.0, 522.0, 295.0, 172.0, 113.0, 65.0, 55.0, 29.0, 14.0, 10.0, 15.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.578125, -7.3634033203125, -7.148681640625, -6.9339599609375, -6.71923828125, -6.5045166015625, -6.289794921875, -6.0750732421875, -5.8603515625, -5.6456298828125, -5.430908203125, -5.2161865234375, -5.00146484375, -4.7867431640625, -4.572021484375, -4.3572998046875, -4.142578125, -3.9278564453125, -3.713134765625, -3.4984130859375, -3.28369140625, -3.0689697265625, -2.854248046875, -2.6395263671875, -2.4248046875, -2.2100830078125, -1.995361328125, -1.7806396484375, -1.56591796875, -1.3511962890625, -1.136474609375, -0.9217529296875, -0.70703125, -0.4923095703125, -0.277587890625, -0.0628662109375, 0.15185546875, 0.3665771484375, 0.581298828125, 0.7960205078125, 1.0107421875, 1.2254638671875, 1.440185546875, 1.6549072265625, 1.86962890625, 2.0843505859375, 2.299072265625, 2.5137939453125, 2.728515625, 2.9432373046875, 3.157958984375, 3.3726806640625, 3.58740234375, 3.8021240234375, 4.016845703125, 4.2315673828125, 4.4462890625, 4.6610107421875, 4.875732421875, 5.0904541015625, 5.30517578125, 5.5198974609375, 5.734619140625, 5.9493408203125, 6.1640625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 3.0, 7.0, 6.0, 13.0, 13.0, 19.0, 23.0, 28.0, 52.0, 72.0, 109.0, 198.0, 431.0, 1647.0, 700.0, 278.0, 171.0, 84.0, 68.0, 42.0, 25.0, 11.0, 14.0, 12.0, 10.0, 11.0, 4.0, 3.0, 6.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.357421875, -2.278076171875, -2.19873046875, -2.119384765625, -2.0400390625, -1.960693359375, -1.88134765625, -1.802001953125, -1.72265625, -1.643310546875, -1.56396484375, -1.484619140625, -1.4052734375, -1.325927734375, -1.24658203125, -1.167236328125, -1.087890625, -1.008544921875, -0.92919921875, -0.849853515625, -0.7705078125, -0.691162109375, -0.61181640625, -0.532470703125, -0.453125, -0.373779296875, -0.29443359375, -0.215087890625, -0.1357421875, -0.056396484375, 0.02294921875, 0.102294921875, 0.181640625, 0.260986328125, 0.34033203125, 0.419677734375, 0.4990234375, 0.578369140625, 0.65771484375, 0.737060546875, 0.81640625, 0.895751953125, 0.97509765625, 1.054443359375, 1.1337890625, 1.213134765625, 1.29248046875, 1.371826171875, 1.451171875, 1.530517578125, 1.60986328125, 1.689208984375, 1.7685546875, 1.847900390625, 1.92724609375, 2.006591796875, 2.0859375, 2.165283203125, 2.24462890625, 2.323974609375, 2.4033203125, 2.482666015625, 2.56201171875, 2.641357421875, 2.720703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 23.0, 50.0, 81.0, 155.0, 204.0, 199.0, 121.0, 88.0, 38.0, 20.0, 8.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.287099838256836, -16.440752029418945, -15.594403266906738, -14.748054504394531, -13.90170669555664, -13.055357933044434, -12.209009170532227, -11.362661361694336, -10.516312599182129, -9.669963836669922, -8.823616027832031, -7.977267265319824, -7.130918979644775, -6.284570693969727, -5.4382219314575195, -4.591873645782471, -3.745525360107422, -2.899177074432373, -2.052828550338745, -1.2064800262451172, -0.36013174057006836, 0.48621654510498047, 1.3325653076171875, 2.1789135932922363, 3.025261878967285, 3.871610164642334, 4.717958450317383, 5.56430721282959, 6.410655498504639, 7.2570037841796875, 8.103352546691895, 8.949701309204102, 9.796051025390625, 10.642399787902832, 11.488747596740723, 12.33509635925293, 13.18144416809082, 14.027792930603027, 14.874141693115234, 15.720489501953125, 16.566837310791016, 17.413185119628906, 18.25953483581543, 19.10588264465332, 19.95223045349121, 20.798580169677734, 21.644927978515625, 22.491275787353516, 23.33762550354004, 24.18397331237793, 25.030323028564453, 25.876670837402344, 26.723018646240234, 27.569366455078125, 28.41571617126465, 29.26206398010254, 30.108413696289062, 30.954761505126953, 31.801111221313477, 32.6474609375, 33.49380874633789, 34.34015655517578, 35.18650436401367, 36.03285217285156, 36.87919998168945]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 10.0, 11.0, 11.0, 13.0, 10.0, 17.0, 24.0, 22.0, 30.0, 24.0, 34.0, 34.0, 39.0, 30.0, 35.0, 41.0, 54.0, 45.0, 38.0, 50.0, 32.0, 42.0, 32.0, 31.0, 34.0, 30.0, 31.0, 21.0, 19.0, 23.0, 17.0, 20.0, 14.0, 15.0, 11.0, 3.0, 14.0, 7.0, 3.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.798599243164062, -8.536223411560059, -8.273846626281738, -8.011470794677734, -7.7490949630737305, -7.486718654632568, -7.224342346191406, -6.961966514587402, -6.69959020614624, -6.437213897705078, -6.174838066101074, -5.912461757659912, -5.65008544921875, -5.387709617614746, -5.125333309173584, -4.862957000732422, -4.600581169128418, -4.338204860687256, -4.075829029083252, -3.81345272064209, -3.551076650619507, -3.288700580596924, -3.0263242721557617, -2.7639482021331787, -2.5015721321105957, -2.2391960620880127, -1.9768198728561401, -1.7144436836242676, -1.4520676136016846, -1.1896915435791016, -0.927315354347229, -0.6649391651153564, -0.40256309509277344, -0.14018696546554565, 0.12218916416168213, 0.3845652937889099, 0.6469414234161377, 0.9093174934387207, 1.1716936826705933, 1.4340698719024658, 1.6964459419250488, 1.9588220119476318, 2.221198081970215, 2.483574390411377, 2.74595046043396, 3.008326530456543, 3.270702838897705, 3.533078908920288, 3.795454978942871, 4.057831287384033, 4.320207118988037, 4.582583427429199, 4.844959259033203, 5.107335567474365, 5.369711875915527, 5.632087707519531, 5.894464015960693, 6.1568403244018555, 6.419216156005859, 6.6815924644470215, 6.943968772888184, 7.2063446044921875, 7.46872091293335, 7.731097221374512, 7.993473052978516]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 12.0, 6.0, 12.0, 14.0, 25.0, 34.0, 33.0, 49.0, 76.0, 148.0, 197.0, 299.0, 653.0, 1145.0, 2017.0, 4024.0, 8199.0, 16944.0, 35223.0, 82275.0, 268100.0, 413132.0, 123307.0, 48305.0, 22216.0, 10794.0, 5313.0, 2685.0, 1382.0, 743.0, 439.0, 240.0, 173.0, 106.0, 66.0, 44.0, 30.0, 25.0, 16.0, 18.0, 7.0, 6.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.412109375, -3.299102783203125, -3.18609619140625, -3.073089599609375, -2.9600830078125, -2.847076416015625, -2.73406982421875, -2.621063232421875, -2.508056640625, -2.395050048828125, -2.28204345703125, -2.169036865234375, -2.0560302734375, -1.943023681640625, -1.83001708984375, -1.717010498046875, -1.60400390625, -1.490997314453125, -1.37799072265625, -1.264984130859375, -1.1519775390625, -1.038970947265625, -0.92596435546875, -0.812957763671875, -0.699951171875, -0.586944580078125, -0.47393798828125, -0.360931396484375, -0.2479248046875, -0.134918212890625, -0.02191162109375, 0.091094970703125, 0.2041015625, 0.317108154296875, 0.43011474609375, 0.543121337890625, 0.6561279296875, 0.769134521484375, 0.88214111328125, 0.995147705078125, 1.108154296875, 1.221160888671875, 1.33416748046875, 1.447174072265625, 1.5601806640625, 1.673187255859375, 1.78619384765625, 1.899200439453125, 2.01220703125, 2.125213623046875, 2.23822021484375, 2.351226806640625, 2.4642333984375, 2.577239990234375, 2.69024658203125, 2.803253173828125, 2.916259765625, 3.029266357421875, 3.14227294921875, 3.255279541015625, 3.3682861328125, 3.481292724609375, 3.59429931640625, 3.707305908203125, 3.8203125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 3.0, 8.0, 7.0, 10.0, 16.0, 19.0, 13.0, 17.0, 29.0, 24.0, 41.0, 34.0, 48.0, 49.0, 49.0, 46.0, 42.0, 42.0, 43.0, 51.0, 43.0, 43.0, 40.0, 49.0, 33.0, 28.0, 25.0, 28.0, 23.0, 22.0, 14.0, 14.0, 11.0, 13.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.009765625, -0.9746551513671875, -0.939544677734375, -0.9044342041015625, -0.86932373046875, -0.8342132568359375, -0.799102783203125, -0.7639923095703125, -0.7288818359375, -0.6937713623046875, -0.658660888671875, -0.6235504150390625, -0.58843994140625, -0.5533294677734375, -0.518218994140625, -0.4831085205078125, -0.447998046875, -0.4128875732421875, -0.377777099609375, -0.3426666259765625, -0.30755615234375, -0.2724456787109375, -0.237335205078125, -0.2022247314453125, -0.1671142578125, -0.1320037841796875, -0.096893310546875, -0.0617828369140625, -0.02667236328125, 0.0084381103515625, 0.043548583984375, 0.0786590576171875, 0.11376953125, 0.1488800048828125, 0.183990478515625, 0.2191009521484375, 0.25421142578125, 0.2893218994140625, 0.324432373046875, 0.3595428466796875, 0.3946533203125, 0.4297637939453125, 0.464874267578125, 0.4999847412109375, 0.53509521484375, 0.5702056884765625, 0.605316162109375, 0.6404266357421875, 0.675537109375, 0.7106475830078125, 0.745758056640625, 0.7808685302734375, 0.81597900390625, 0.8510894775390625, 0.886199951171875, 0.9213104248046875, 0.9564208984375, 0.9915313720703125, 1.026641845703125, 1.0617523193359375, 1.09686279296875, 1.1319732666015625, 1.167083740234375, 1.2021942138671875, 1.2373046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 11.0, 10.0, 19.0, 8.0, 14.0, 22.0, 27.0, 36.0, 62.0, 74.0, 122.0, 193.0, 363.0, 646.0, 1346.0, 3338.0, 9880.0, 33989.0, 221214.0, 696570.0, 56613.0, 15175.0, 4879.0, 1957.0, 808.0, 429.0, 238.0, 134.0, 105.0, 56.0, 43.0, 45.0, 23.0, 14.0, 15.0, 16.0, 13.0, 15.0, 6.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.2421875, -7.986083984375, -7.72998046875, -7.473876953125, -7.2177734375, -6.961669921875, -6.70556640625, -6.449462890625, -6.193359375, -5.937255859375, -5.68115234375, -5.425048828125, -5.1689453125, -4.912841796875, -4.65673828125, -4.400634765625, -4.14453125, -3.888427734375, -3.63232421875, -3.376220703125, -3.1201171875, -2.864013671875, -2.60791015625, -2.351806640625, -2.095703125, -1.839599609375, -1.58349609375, -1.327392578125, -1.0712890625, -0.815185546875, -0.55908203125, -0.302978515625, -0.046875, 0.209228515625, 0.46533203125, 0.721435546875, 0.9775390625, 1.233642578125, 1.48974609375, 1.745849609375, 2.001953125, 2.258056640625, 2.51416015625, 2.770263671875, 3.0263671875, 3.282470703125, 3.53857421875, 3.794677734375, 4.05078125, 4.306884765625, 4.56298828125, 4.819091796875, 5.0751953125, 5.331298828125, 5.58740234375, 5.843505859375, 6.099609375, 6.355712890625, 6.61181640625, 6.867919921875, 7.1240234375, 7.380126953125, 7.63623046875, 7.892333984375, 8.1484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 9.0, 5.0, 14.0, 20.0, 17.0, 31.0, 41.0, 46.0, 44.0, 51.0, 61.0, 67.0, 75.0, 79.0, 60.0, 65.0, 59.0, 56.0, 43.0, 31.0, 20.0, 18.0, 20.0, 8.0, 6.0, 8.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.421875, -7.20159912109375, -6.9813232421875, -6.76104736328125, -6.540771484375, -6.32049560546875, -6.1002197265625, -5.87994384765625, -5.65966796875, -5.43939208984375, -5.2191162109375, -4.99884033203125, -4.778564453125, -4.55828857421875, -4.3380126953125, -4.11773681640625, -3.8974609375, -3.67718505859375, -3.4569091796875, -3.23663330078125, -3.016357421875, -2.79608154296875, -2.5758056640625, -2.35552978515625, -2.13525390625, -1.91497802734375, -1.6947021484375, -1.47442626953125, -1.254150390625, -1.03387451171875, -0.8135986328125, -0.59332275390625, -0.373046875, -0.15277099609375, 0.0675048828125, 0.28778076171875, 0.508056640625, 0.72833251953125, 0.9486083984375, 1.16888427734375, 1.38916015625, 1.60943603515625, 1.8297119140625, 2.04998779296875, 2.270263671875, 2.49053955078125, 2.7108154296875, 2.93109130859375, 3.1513671875, 3.37164306640625, 3.5919189453125, 3.81219482421875, 4.032470703125, 4.25274658203125, 4.4730224609375, 4.69329833984375, 4.91357421875, 5.13385009765625, 5.3541259765625, 5.57440185546875, 5.794677734375, 6.01495361328125, 6.2352294921875, 6.45550537109375, 6.67578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 8.0, 4.0, 6.0, 7.0, 18.0, 31.0, 39.0, 61.0, 98.0, 193.0, 260.0, 464.0, 779.0, 1475.0, 2886.0, 6302.0, 14328.0, 34447.0, 107750.0, 667517.0, 141860.0, 39901.0, 16291.0, 6964.0, 3158.0, 1582.0, 876.0, 520.0, 282.0, 159.0, 118.0, 49.0, 39.0, 27.0, 16.0, 15.0, 10.0, 8.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.0625, -2.978759765625, -2.89501953125, -2.811279296875, -2.7275390625, -2.643798828125, -2.56005859375, -2.476318359375, -2.392578125, -2.308837890625, -2.22509765625, -2.141357421875, -2.0576171875, -1.973876953125, -1.89013671875, -1.806396484375, -1.72265625, -1.638916015625, -1.55517578125, -1.471435546875, -1.3876953125, -1.303955078125, -1.22021484375, -1.136474609375, -1.052734375, -0.968994140625, -0.88525390625, -0.801513671875, -0.7177734375, -0.634033203125, -0.55029296875, -0.466552734375, -0.3828125, -0.299072265625, -0.21533203125, -0.131591796875, -0.0478515625, 0.035888671875, 0.11962890625, 0.203369140625, 0.287109375, 0.370849609375, 0.45458984375, 0.538330078125, 0.6220703125, 0.705810546875, 0.78955078125, 0.873291015625, 0.95703125, 1.040771484375, 1.12451171875, 1.208251953125, 1.2919921875, 1.375732421875, 1.45947265625, 1.543212890625, 1.626953125, 1.710693359375, 1.79443359375, 1.878173828125, 1.9619140625, 2.045654296875, 2.12939453125, 2.213134765625, 2.296875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 10.0, 6.0, 9.0, 10.0, 12.0, 24.0, 38.0, 35.0, 327.0, 379.0, 52.0, 18.0, 11.0, 11.0, 13.0, 11.0, 6.0, 6.0, 8.0, 4.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015039443969726562, -0.0014584660530090332, -0.0014129877090454102, -0.0013675093650817871, -0.001322031021118164, -0.001276552677154541, -0.001231074333190918, -0.001185595989227295, -0.0011401176452636719, -0.0010946393013000488, -0.0010491609573364258, -0.0010036826133728027, -0.0009582042694091797, -0.0009127259254455566, -0.0008672475814819336, -0.0008217692375183105, -0.0007762908935546875, -0.0007308125495910645, -0.0006853342056274414, -0.0006398558616638184, -0.0005943775177001953, -0.0005488991737365723, -0.0005034208297729492, -0.00045794248580932617, -0.0004124641418457031, -0.0003669857978820801, -0.00032150745391845703, -0.000276029109954834, -0.00023055076599121094, -0.0001850724220275879, -0.00013959407806396484, -9.41157341003418e-05, -4.863739013671875e-05, -3.159046173095703e-06, 4.2319297790527344e-05, 8.779764175415039e-05, 0.00013327598571777344, 0.00017875432968139648, 0.00022423267364501953, 0.0002697110176086426, 0.0003151893615722656, 0.00036066770553588867, 0.0004061460494995117, 0.00045162439346313477, 0.0004971027374267578, 0.0005425810813903809, 0.0005880594253540039, 0.000633537769317627, 0.00067901611328125, 0.000724494457244873, 0.0007699728012084961, 0.0008154511451721191, 0.0008609294891357422, 0.0009064078330993652, 0.0009518861770629883, 0.0009973645210266113, 0.0010428428649902344, 0.0010883212089538574, 0.0011337995529174805, 0.0011792778968811035, 0.0012247562408447266, 0.0012702345848083496, 0.0013157129287719727, 0.0013611912727355957, 0.0014066696166992188]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 8.0, 12.0, 9.0, 18.0, 33.0, 27.0, 49.0, 51.0, 78.0, 149.0, 255.0, 441.0, 881.0, 2072.0, 5581.0, 17403.0, 61838.0, 585617.0, 307635.0, 45444.0, 13133.0, 4440.0, 1632.0, 750.0, 373.0, 206.0, 115.0, 80.0, 57.0, 51.0, 29.0, 26.0, 14.0, 11.0, 7.0, 9.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.109375, -2.99786376953125, -2.8863525390625, -2.77484130859375, -2.663330078125, -2.55181884765625, -2.4403076171875, -2.32879638671875, -2.21728515625, -2.10577392578125, -1.9942626953125, -1.88275146484375, -1.771240234375, -1.65972900390625, -1.5482177734375, -1.43670654296875, -1.3251953125, -1.21368408203125, -1.1021728515625, -0.99066162109375, -0.879150390625, -0.76763916015625, -0.6561279296875, -0.54461669921875, -0.43310546875, -0.32159423828125, -0.2100830078125, -0.09857177734375, 0.012939453125, 0.12445068359375, 0.2359619140625, 0.34747314453125, 0.458984375, 0.57049560546875, 0.6820068359375, 0.79351806640625, 0.905029296875, 1.01654052734375, 1.1280517578125, 1.23956298828125, 1.35107421875, 1.46258544921875, 1.5740966796875, 1.68560791015625, 1.797119140625, 1.90863037109375, 2.0201416015625, 2.13165283203125, 2.2431640625, 2.35467529296875, 2.4661865234375, 2.57769775390625, 2.689208984375, 2.80072021484375, 2.9122314453125, 3.02374267578125, 3.13525390625, 3.24676513671875, 3.3582763671875, 3.46978759765625, 3.581298828125, 3.69281005859375, 3.8043212890625, 3.91583251953125, 4.02734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 3.0, 4.0, 3.0, 5.0, 11.0, 13.0, 12.0, 18.0, 30.0, 40.0, 54.0, 80.0, 128.0, 134.0, 122.0, 110.0, 64.0, 26.0, 22.0, 17.0, 16.0, 10.0, 10.0, 5.0, 6.0, 6.0, 6.0, 6.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9375, -1.864715576171875, -1.79193115234375, -1.719146728515625, -1.6463623046875, -1.573577880859375, -1.50079345703125, -1.428009033203125, -1.355224609375, -1.282440185546875, -1.20965576171875, -1.136871337890625, -1.0640869140625, -0.991302490234375, -0.91851806640625, -0.845733642578125, -0.77294921875, -0.700164794921875, -0.62738037109375, -0.554595947265625, -0.4818115234375, -0.409027099609375, -0.33624267578125, -0.263458251953125, -0.190673828125, -0.117889404296875, -0.04510498046875, 0.027679443359375, 0.1004638671875, 0.173248291015625, 0.24603271484375, 0.318817138671875, 0.3916015625, 0.464385986328125, 0.53717041015625, 0.609954833984375, 0.6827392578125, 0.755523681640625, 0.82830810546875, 0.901092529296875, 0.973876953125, 1.046661376953125, 1.11944580078125, 1.192230224609375, 1.2650146484375, 1.337799072265625, 1.41058349609375, 1.483367919921875, 1.55615234375, 1.628936767578125, 1.70172119140625, 1.774505615234375, 1.8472900390625, 1.920074462890625, 1.99285888671875, 2.065643310546875, 2.138427734375, 2.211212158203125, 2.28399658203125, 2.356781005859375, 2.4295654296875, 2.502349853515625, 2.57513427734375, 2.647918701171875, 2.720703125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 19.0, 50.0, 126.0, 284.0, 272.0, 150.0, 69.0, 18.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.29727554321289, -34.63749694824219, -31.977718353271484, -29.31793975830078, -26.658161163330078, -23.998382568359375, -21.33860206604004, -18.678823471069336, -16.019044876098633, -13.35926628112793, -10.699487686157227, -8.039708137512207, -5.379929542541504, -2.720150947570801, -0.06037139892578125, 2.599407196044922, 5.259185791015625, 7.918964385986328, 10.578742980957031, 13.23852252960205, 15.898301124572754, 18.55807876586914, 21.217859268188477, 23.87763786315918, 26.537416458129883, 29.197195053100586, 31.85697364807129, 34.516754150390625, 37.17653274536133, 39.83631134033203, 42.496089935302734, 45.15586853027344, 47.815650939941406, 50.47542953491211, 53.13520812988281, 55.794986724853516, 58.45476531982422, 61.11454391479492, 63.774322509765625, 66.4341049194336, 69.09387969970703, 71.753662109375, 74.41343688964844, 77.0732192993164, 79.73299407958984, 82.39277648925781, 85.05255126953125, 87.71233367919922, 90.37211608886719, 93.03189849853516, 95.6916732788086, 98.35145568847656, 101.01123046875, 103.67101287841797, 106.3307876586914, 108.99057006835938, 111.65034484863281, 114.31012725830078, 116.96990203857422, 119.62968444824219, 122.28945922851562, 124.9492416381836, 127.60901641845703, 130.268798828125, 132.92857360839844]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 11.0, 11.0, 6.0, 9.0, 8.0, 11.0, 15.0, 27.0, 22.0, 30.0, 29.0, 23.0, 40.0, 47.0, 36.0, 40.0, 42.0, 47.0, 46.0, 41.0, 35.0, 36.0, 44.0, 49.0, 24.0, 33.0, 32.0, 18.0, 19.0, 21.0, 30.0, 21.0, 12.0, 14.0, 15.0, 8.0, 9.0, 7.0, 9.0, 2.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0], "bins": [-25.008899688720703, -24.302413940429688, -23.595928192138672, -22.889442443847656, -22.18295669555664, -21.476470947265625, -20.76998519897461, -20.063499450683594, -19.357013702392578, -18.650527954101562, -17.944042205810547, -17.23755645751953, -16.531070709228516, -15.8245849609375, -15.118099212646484, -14.411613464355469, -13.705127716064453, -12.998641967773438, -12.292156219482422, -11.585670471191406, -10.87918472290039, -10.172698974609375, -9.46621322631836, -8.759727478027344, -8.053241729736328, -7.3467559814453125, -6.640270233154297, -5.933784484863281, -5.227298736572266, -4.52081298828125, -3.8143272399902344, -3.1078414916992188, -2.401357650756836, -1.6948719024658203, -0.9883861541748047, -0.28190040588378906, 0.42458534240722656, 1.1310710906982422, 1.8375568389892578, 2.5440425872802734, 3.250528335571289, 3.9570140838623047, 4.66349983215332, 5.369985580444336, 6.076471328735352, 6.782957077026367, 7.489442825317383, 8.195928573608398, 8.902414321899414, 9.60890007019043, 10.315385818481445, 11.021871566772461, 11.728357315063477, 12.434843063354492, 13.141328811645508, 13.847814559936523, 14.554300308227539, 15.260786056518555, 15.96727180480957, 16.673757553100586, 17.3802433013916, 18.086729049682617, 18.793214797973633, 19.49970054626465, 20.206186294555664]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 8.0, 10.0, 17.0, 23.0, 29.0, 42.0, 76.0, 103.0, 178.0, 252.0, 414.0, 698.0, 1082.0, 2115.0, 3834.0, 7715.0, 16405.0, 39471.0, 124688.0, 1178317.0, 2602306.0, 138785.0, 42860.0, 17659.0, 7966.0, 3991.0, 2128.0, 1201.0, 681.0, 437.0, 280.0, 140.0, 125.0, 76.0, 48.0, 31.0, 31.0, 14.0, 12.0, 10.0, 4.0, 8.0, 6.0, 4.0, 0.0, 0.0, 2.0], "bins": [-6.19921875, -6.0318603515625, -5.864501953125, -5.6971435546875, -5.52978515625, -5.3624267578125, -5.195068359375, -5.0277099609375, -4.8603515625, -4.6929931640625, -4.525634765625, -4.3582763671875, -4.19091796875, -4.0235595703125, -3.856201171875, -3.6888427734375, -3.521484375, -3.3541259765625, -3.186767578125, -3.0194091796875, -2.85205078125, -2.6846923828125, -2.517333984375, -2.3499755859375, -2.1826171875, -2.0152587890625, -1.847900390625, -1.6805419921875, -1.51318359375, -1.3458251953125, -1.178466796875, -1.0111083984375, -0.84375, -0.6763916015625, -0.509033203125, -0.3416748046875, -0.17431640625, -0.0069580078125, 0.160400390625, 0.3277587890625, 0.4951171875, 0.6624755859375, 0.829833984375, 0.9971923828125, 1.16455078125, 1.3319091796875, 1.499267578125, 1.6666259765625, 1.833984375, 2.0013427734375, 2.168701171875, 2.3360595703125, 2.50341796875, 2.6707763671875, 2.838134765625, 3.0054931640625, 3.1728515625, 3.3402099609375, 3.507568359375, 3.6749267578125, 3.84228515625, 4.0096435546875, 4.177001953125, 4.3443603515625, 4.51171875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 7.0, 5.0, 5.0, 9.0, 11.0, 8.0, 17.0, 28.0, 21.0, 23.0, 24.0, 29.0, 32.0, 33.0, 33.0, 36.0, 34.0, 54.0, 47.0, 55.0, 47.0, 42.0, 43.0, 57.0, 31.0, 42.0, 27.0, 37.0, 30.0, 15.0, 26.0, 15.0, 16.0, 10.0, 13.0, 12.0, 10.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.2783203125, -1.2425537109375, -1.206787109375, -1.1710205078125, -1.13525390625, -1.0994873046875, -1.063720703125, -1.0279541015625, -0.9921875, -0.9564208984375, -0.920654296875, -0.8848876953125, -0.84912109375, -0.8133544921875, -0.777587890625, -0.7418212890625, -0.7060546875, -0.6702880859375, -0.634521484375, -0.5987548828125, -0.56298828125, -0.5272216796875, -0.491455078125, -0.4556884765625, -0.419921875, -0.3841552734375, -0.348388671875, -0.3126220703125, -0.27685546875, -0.2410888671875, -0.205322265625, -0.1695556640625, -0.1337890625, -0.0980224609375, -0.062255859375, -0.0264892578125, 0.00927734375, 0.0450439453125, 0.080810546875, 0.1165771484375, 0.15234375, 0.1881103515625, 0.223876953125, 0.2596435546875, 0.29541015625, 0.3311767578125, 0.366943359375, 0.4027099609375, 0.4384765625, 0.4742431640625, 0.510009765625, 0.5457763671875, 0.58154296875, 0.6173095703125, 0.653076171875, 0.6888427734375, 0.724609375, 0.7603759765625, 0.796142578125, 0.8319091796875, 0.86767578125, 0.9034423828125, 0.939208984375, 0.9749755859375, 1.0107421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 6.0, 7.0, 10.0, 15.0, 34.0, 32.0, 50.0, 86.0, 116.0, 150.0, 216.0, 465.0, 735.0, 1392.0, 2673.0, 6130.0, 15262.0, 47248.0, 212564.0, 3422532.0, 381729.0, 67211.0, 20591.0, 7778.0, 3424.0, 1619.0, 851.0, 468.0, 319.0, 172.0, 120.0, 74.0, 48.0, 50.0, 21.0, 28.0, 14.0, 12.0, 7.0, 2.0, 9.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.65625, -9.37744140625, -9.0986328125, -8.81982421875, -8.541015625, -8.26220703125, -7.9833984375, -7.70458984375, -7.42578125, -7.14697265625, -6.8681640625, -6.58935546875, -6.310546875, -6.03173828125, -5.7529296875, -5.47412109375, -5.1953125, -4.91650390625, -4.6376953125, -4.35888671875, -4.080078125, -3.80126953125, -3.5224609375, -3.24365234375, -2.96484375, -2.68603515625, -2.4072265625, -2.12841796875, -1.849609375, -1.57080078125, -1.2919921875, -1.01318359375, -0.734375, -0.45556640625, -0.1767578125, 0.10205078125, 0.380859375, 0.65966796875, 0.9384765625, 1.21728515625, 1.49609375, 1.77490234375, 2.0537109375, 2.33251953125, 2.611328125, 2.89013671875, 3.1689453125, 3.44775390625, 3.7265625, 4.00537109375, 4.2841796875, 4.56298828125, 4.841796875, 5.12060546875, 5.3994140625, 5.67822265625, 5.95703125, 6.23583984375, 6.5146484375, 6.79345703125, 7.072265625, 7.35107421875, 7.6298828125, 7.90869140625, 8.1875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 9.0, 8.0, 12.0, 23.0, 31.0, 34.0, 53.0, 78.0, 132.0, 225.0, 750.0, 1878.0, 365.0, 157.0, 96.0, 49.0, 47.0, 19.0, 29.0, 18.0, 12.0, 9.0, 6.0, 6.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.265625, -4.140869140625, -4.01611328125, -3.891357421875, -3.7666015625, -3.641845703125, -3.51708984375, -3.392333984375, -3.267578125, -3.142822265625, -3.01806640625, -2.893310546875, -2.7685546875, -2.643798828125, -2.51904296875, -2.394287109375, -2.26953125, -2.144775390625, -2.02001953125, -1.895263671875, -1.7705078125, -1.645751953125, -1.52099609375, -1.396240234375, -1.271484375, -1.146728515625, -1.02197265625, -0.897216796875, -0.7724609375, -0.647705078125, -0.52294921875, -0.398193359375, -0.2734375, -0.148681640625, -0.02392578125, 0.100830078125, 0.2255859375, 0.350341796875, 0.47509765625, 0.599853515625, 0.724609375, 0.849365234375, 0.97412109375, 1.098876953125, 1.2236328125, 1.348388671875, 1.47314453125, 1.597900390625, 1.72265625, 1.847412109375, 1.97216796875, 2.096923828125, 2.2216796875, 2.346435546875, 2.47119140625, 2.595947265625, 2.720703125, 2.845458984375, 2.97021484375, 3.094970703125, 3.2197265625, 3.344482421875, 3.46923828125, 3.593994140625, 3.71875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 17.0, 43.0, 89.0, 140.0, 188.0, 197.0, 166.0, 82.0, 32.0, 19.0, 10.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.91409683227539, -26.752471923828125, -25.59084701538086, -24.429222106933594, -23.26759910583496, -22.105974197387695, -20.94434928894043, -19.782726287841797, -18.62110137939453, -17.459476470947266, -16.2978515625, -15.13622760772705, -13.974603652954102, -12.812978744506836, -11.65135383605957, -10.489729881286621, -9.328104019165039, -8.166479110717773, -7.004855155944824, -5.843230247497559, -4.681605815887451, -3.5199813842773438, -2.358356475830078, -1.196732521057129, -0.03510761260986328, 1.1265169382095337, 2.2881414890289307, 3.449766159057617, 4.611390590667725, 5.773015022277832, 6.934639930725098, 8.096263885498047, 9.257888793945312, 10.419513702392578, 11.581137657165527, 12.742762565612793, 13.904386520385742, 15.066011428833008, 16.227636337280273, 17.389259338378906, 18.550884246826172, 19.712509155273438, 20.874134063720703, 22.03575897216797, 23.1973819732666, 24.359006881713867, 25.520631790161133, 26.682254791259766, 27.843881607055664, 29.00550651550293, 30.167131423950195, 31.328754425048828, 32.490379333496094, 33.65200424194336, 34.813629150390625, 35.97525405883789, 37.136878967285156, 38.29850387573242, 39.46012878417969, 40.62175369262695, 41.78337860107422, 42.94499969482422, 44.10662841796875, 45.26824951171875, 46.429874420166016]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 5.0, 10.0, 12.0, 10.0, 11.0, 16.0, 12.0, 18.0, 23.0, 23.0, 22.0, 24.0, 37.0, 28.0, 37.0, 40.0, 44.0, 29.0, 52.0, 37.0, 57.0, 47.0, 34.0, 31.0, 46.0, 18.0, 37.0, 33.0, 26.0, 24.0, 14.0, 22.0, 18.0, 11.0, 17.0, 19.0, 13.0, 8.0, 6.0, 7.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-12.07717514038086, -11.72433090209961, -11.371485710144043, -11.018640518188477, -10.665796279907227, -10.312952041625977, -9.96010684967041, -9.607261657714844, -9.254417419433594, -8.901573181152344, -8.548727989196777, -8.195882797241211, -7.843038558959961, -7.490193843841553, -7.1373491287231445, -6.784504413604736, -6.431659698486328, -6.07881498336792, -5.725970268249512, -5.3731255531311035, -5.020280838012695, -4.667436122894287, -4.314591407775879, -3.9617466926574707, -3.6089019775390625, -3.2560572624206543, -2.903212547302246, -2.550367832183838, -2.1975231170654297, -1.8446784019470215, -1.4918336868286133, -1.138988971710205, -0.7861442565917969, -0.43329954147338867, -0.08045482635498047, 0.27238988876342773, 0.6252346038818359, 0.9780793190002441, 1.3309240341186523, 1.6837687492370605, 2.0366134643554688, 2.389458179473877, 2.742302894592285, 3.0951476097106934, 3.4479923248291016, 3.8008370399475098, 4.153681755065918, 4.506526470184326, 4.859371185302734, 5.212215900421143, 5.565060615539551, 5.917905330657959, 6.270750045776367, 6.623594760894775, 6.976439476013184, 7.329284191131592, 7.68212890625, 8.03497314453125, 8.387818336486816, 8.740663528442383, 9.093507766723633, 9.446352005004883, 9.79919719696045, 10.152042388916016, 10.504886627197266]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 11.0, 9.0, 22.0, 15.0, 26.0, 44.0, 61.0, 102.0, 167.0, 241.0, 370.0, 579.0, 929.0, 1605.0, 2827.0, 5153.0, 10032.0, 19765.0, 39167.0, 78925.0, 170233.0, 356681.0, 188589.0, 85079.0, 42894.0, 21075.0, 10930.0, 5501.0, 3165.0, 1720.0, 1002.0, 603.0, 383.0, 209.0, 140.0, 87.0, 60.0, 51.0, 32.0, 19.0, 15.0, 13.0, 9.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.02734375, -3.89971923828125, -3.7720947265625, -3.64447021484375, -3.516845703125, -3.38922119140625, -3.2615966796875, -3.13397216796875, -3.00634765625, -2.87872314453125, -2.7510986328125, -2.62347412109375, -2.495849609375, -2.36822509765625, -2.2406005859375, -2.11297607421875, -1.9853515625, -1.85772705078125, -1.7301025390625, -1.60247802734375, -1.474853515625, -1.34722900390625, -1.2196044921875, -1.09197998046875, -0.96435546875, -0.83673095703125, -0.7091064453125, -0.58148193359375, -0.453857421875, -0.32623291015625, -0.1986083984375, -0.07098388671875, 0.056640625, 0.18426513671875, 0.3118896484375, 0.43951416015625, 0.567138671875, 0.69476318359375, 0.8223876953125, 0.95001220703125, 1.07763671875, 1.20526123046875, 1.3328857421875, 1.46051025390625, 1.588134765625, 1.71575927734375, 1.8433837890625, 1.97100830078125, 2.0986328125, 2.22625732421875, 2.3538818359375, 2.48150634765625, 2.609130859375, 2.73675537109375, 2.8643798828125, 2.99200439453125, 3.11962890625, 3.24725341796875, 3.3748779296875, 3.50250244140625, 3.630126953125, 3.75775146484375, 3.8853759765625, 4.01300048828125, 4.140625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 11.0, 5.0, 10.0, 7.0, 13.0, 11.0, 16.0, 11.0, 24.0, 22.0, 27.0, 29.0, 43.0, 30.0, 35.0, 27.0, 40.0, 32.0, 37.0, 36.0, 47.0, 35.0, 55.0, 47.0, 37.0, 33.0, 38.0, 29.0, 23.0, 33.0, 17.0, 25.0, 23.0, 13.0, 9.0, 18.0, 3.0, 11.0, 6.0, 6.0, 4.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0385284423828125, -1.001861572265625, -0.9651947021484375, -0.92852783203125, -0.8918609619140625, -0.855194091796875, -0.8185272216796875, -0.7818603515625, -0.7451934814453125, -0.708526611328125, -0.6718597412109375, -0.63519287109375, -0.5985260009765625, -0.561859130859375, -0.5251922607421875, -0.488525390625, -0.4518585205078125, -0.415191650390625, -0.3785247802734375, -0.34185791015625, -0.3051910400390625, -0.268524169921875, -0.2318572998046875, -0.1951904296875, -0.1585235595703125, -0.121856689453125, -0.0851898193359375, -0.04852294921875, -0.0118560791015625, 0.024810791015625, 0.0614776611328125, 0.09814453125, 0.1348114013671875, 0.171478271484375, 0.2081451416015625, 0.24481201171875, 0.2814788818359375, 0.318145751953125, 0.3548126220703125, 0.3914794921875, 0.4281463623046875, 0.464813232421875, 0.5014801025390625, 0.53814697265625, 0.5748138427734375, 0.611480712890625, 0.6481475830078125, 0.684814453125, 0.7214813232421875, 0.758148193359375, 0.7948150634765625, 0.83148193359375, 0.8681488037109375, 0.904815673828125, 0.9414825439453125, 0.9781494140625, 1.0148162841796875, 1.051483154296875, 1.0881500244140625, 1.12481689453125, 1.1614837646484375, 1.198150634765625, 1.2348175048828125, 1.271484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 5.0, 8.0, 7.0, 11.0, 15.0, 22.0, 26.0, 39.0, 38.0, 65.0, 73.0, 134.0, 197.0, 284.0, 476.0, 883.0, 2172.0, 6267.0, 27112.0, 198569.0, 715330.0, 76554.0, 13301.0, 3633.0, 1446.0, 720.0, 401.0, 214.0, 145.0, 125.0, 67.0, 57.0, 46.0, 28.0, 22.0, 8.0, 10.0, 16.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.828125, -12.4306640625, -12.033203125, -11.6357421875, -11.23828125, -10.8408203125, -10.443359375, -10.0458984375, -9.6484375, -9.2509765625, -8.853515625, -8.4560546875, -8.05859375, -7.6611328125, -7.263671875, -6.8662109375, -6.46875, -6.0712890625, -5.673828125, -5.2763671875, -4.87890625, -4.4814453125, -4.083984375, -3.6865234375, -3.2890625, -2.8916015625, -2.494140625, -2.0966796875, -1.69921875, -1.3017578125, -0.904296875, -0.5068359375, -0.109375, 0.2880859375, 0.685546875, 1.0830078125, 1.48046875, 1.8779296875, 2.275390625, 2.6728515625, 3.0703125, 3.4677734375, 3.865234375, 4.2626953125, 4.66015625, 5.0576171875, 5.455078125, 5.8525390625, 6.25, 6.6474609375, 7.044921875, 7.4423828125, 7.83984375, 8.2373046875, 8.634765625, 9.0322265625, 9.4296875, 9.8271484375, 10.224609375, 10.6220703125, 11.01953125, 11.4169921875, 11.814453125, 12.2119140625, 12.609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 5.0, 10.0, 14.0, 12.0, 13.0, 17.0, 18.0, 27.0, 37.0, 40.0, 43.0, 41.0, 53.0, 56.0, 45.0, 47.0, 73.0, 62.0, 65.0, 52.0, 40.0, 43.0, 28.0, 27.0, 21.0, 17.0, 16.0, 18.0, 10.0, 9.0, 4.0, 9.0, 5.0, 6.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.927734375, -7.66015625, -7.392578125, -7.125, -6.857421875, -6.58984375, -6.322265625, -6.0546875, -5.787109375, -5.51953125, -5.251953125, -4.984375, -4.716796875, -4.44921875, -4.181640625, -3.9140625, -3.646484375, -3.37890625, -3.111328125, -2.84375, -2.576171875, -2.30859375, -2.041015625, -1.7734375, -1.505859375, -1.23828125, -0.970703125, -0.703125, -0.435546875, -0.16796875, 0.099609375, 0.3671875, 0.634765625, 0.90234375, 1.169921875, 1.4375, 1.705078125, 1.97265625, 2.240234375, 2.5078125, 2.775390625, 3.04296875, 3.310546875, 3.578125, 3.845703125, 4.11328125, 4.380859375, 4.6484375, 4.916015625, 5.18359375, 5.451171875, 5.71875, 5.986328125, 6.25390625, 6.521484375, 6.7890625, 7.056640625, 7.32421875, 7.591796875, 7.859375, 8.126953125, 8.39453125, 8.662109375, 8.9296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 7.0, 11.0, 15.0, 24.0, 30.0, 59.0, 82.0, 150.0, 237.0, 444.0, 709.0, 1492.0, 3216.0, 8825.0, 29916.0, 144431.0, 673657.0, 140756.0, 29325.0, 8674.0, 3169.0, 1511.0, 757.0, 434.0, 257.0, 132.0, 106.0, 50.0, 28.0, 16.0, 11.0, 12.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.6153564453125, -4.453369140625, -4.2913818359375, -4.12939453125, -3.9674072265625, -3.805419921875, -3.6434326171875, -3.4814453125, -3.3194580078125, -3.157470703125, -2.9954833984375, -2.83349609375, -2.6715087890625, -2.509521484375, -2.3475341796875, -2.185546875, -2.0235595703125, -1.861572265625, -1.6995849609375, -1.53759765625, -1.3756103515625, -1.213623046875, -1.0516357421875, -0.8896484375, -0.7276611328125, -0.565673828125, -0.4036865234375, -0.24169921875, -0.0797119140625, 0.082275390625, 0.2442626953125, 0.40625, 0.5682373046875, 0.730224609375, 0.8922119140625, 1.05419921875, 1.2161865234375, 1.378173828125, 1.5401611328125, 1.7021484375, 1.8641357421875, 2.026123046875, 2.1881103515625, 2.35009765625, 2.5120849609375, 2.674072265625, 2.8360595703125, 2.998046875, 3.1600341796875, 3.322021484375, 3.4840087890625, 3.64599609375, 3.8079833984375, 3.969970703125, 4.1319580078125, 4.2939453125, 4.4559326171875, 4.617919921875, 4.7799072265625, 4.94189453125, 5.1038818359375, 5.265869140625, 5.4278564453125, 5.58984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 16.0, 18.0, 20.0, 30.0, 39.0, 58.0, 104.0, 272.0, 182.0, 74.0, 52.0, 39.0, 29.0, 13.0, 14.0, 7.0, 10.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0020694732666015625, -0.002014830708503723, -0.001960188150405884, -0.0019055455923080444, -0.001850903034210205, -0.0017962604761123657, -0.0017416179180145264, -0.001686975359916687, -0.0016323328018188477, -0.0015776902437210083, -0.001523047685623169, -0.0014684051275253296, -0.0014137625694274902, -0.0013591200113296509, -0.0013044774532318115, -0.0012498348951339722, -0.0011951923370361328, -0.0011405497789382935, -0.001085907220840454, -0.0010312646627426147, -0.0009766221046447754, -0.000921979546546936, -0.0008673369884490967, -0.0008126944303512573, -0.000758051872253418, -0.0007034093141555786, -0.0006487667560577393, -0.0005941241979598999, -0.0005394816398620605, -0.0004848390817642212, -0.00043019652366638184, -0.0003755539655685425, -0.0003209114074707031, -0.00026626884937286377, -0.00021162629127502441, -0.00015698373317718506, -0.0001023411750793457, -4.769861698150635e-05, 6.943941116333008e-06, 6.158649921417236e-05, 0.00011622905731201172, 0.00017087161540985107, 0.00022551417350769043, 0.0002801567316055298, 0.00033479928970336914, 0.0003894418478012085, 0.00044408440589904785, 0.0004987269639968872, 0.0005533695220947266, 0.0006080120801925659, 0.0006626546382904053, 0.0007172971963882446, 0.000771939754486084, 0.0008265823125839233, 0.0008812248706817627, 0.000935867428779602, 0.0009905099868774414, 0.0010451525449752808, 0.0010997951030731201, 0.0011544376611709595, 0.0012090802192687988, 0.0012637227773666382, 0.0013183653354644775, 0.001373007893562317, 0.0014276504516601562]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 5.0, 15.0, 14.0, 16.0, 26.0, 32.0, 45.0, 65.0, 95.0, 164.0, 277.0, 522.0, 1093.0, 2539.0, 8650.0, 49037.0, 546548.0, 390344.0, 37357.0, 7257.0, 2305.0, 941.0, 445.0, 266.0, 158.0, 112.0, 62.0, 39.0, 27.0, 22.0, 15.0, 20.0, 8.0, 7.0, 2.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.03125, -6.8299560546875, -6.628662109375, -6.4273681640625, -6.22607421875, -6.0247802734375, -5.823486328125, -5.6221923828125, -5.4208984375, -5.2196044921875, -5.018310546875, -4.8170166015625, -4.61572265625, -4.4144287109375, -4.213134765625, -4.0118408203125, -3.810546875, -3.6092529296875, -3.407958984375, -3.2066650390625, -3.00537109375, -2.8040771484375, -2.602783203125, -2.4014892578125, -2.2001953125, -1.9989013671875, -1.797607421875, -1.5963134765625, -1.39501953125, -1.1937255859375, -0.992431640625, -0.7911376953125, -0.58984375, -0.3885498046875, -0.187255859375, 0.0140380859375, 0.21533203125, 0.4166259765625, 0.617919921875, 0.8192138671875, 1.0205078125, 1.2218017578125, 1.423095703125, 1.6243896484375, 1.82568359375, 2.0269775390625, 2.228271484375, 2.4295654296875, 2.630859375, 2.8321533203125, 3.033447265625, 3.2347412109375, 3.43603515625, 3.6373291015625, 3.838623046875, 4.0399169921875, 4.2412109375, 4.4425048828125, 4.643798828125, 4.8450927734375, 5.04638671875, 5.2476806640625, 5.448974609375, 5.6502685546875, 5.8515625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 5.0, 8.0, 10.0, 4.0, 10.0, 24.0, 11.0, 23.0, 47.0, 41.0, 49.0, 84.0, 139.0, 155.0, 109.0, 47.0, 42.0, 40.0, 35.0, 23.0, 17.0, 21.0, 14.0, 11.0, 6.0, 6.0, 9.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.779296875, -3.644256591796875, -3.50921630859375, -3.374176025390625, -3.2391357421875, -3.104095458984375, -2.96905517578125, -2.834014892578125, -2.698974609375, -2.563934326171875, -2.42889404296875, -2.293853759765625, -2.1588134765625, -2.023773193359375, -1.88873291015625, -1.753692626953125, -1.61865234375, -1.483612060546875, -1.34857177734375, -1.213531494140625, -1.0784912109375, -0.943450927734375, -0.80841064453125, -0.673370361328125, -0.538330078125, -0.403289794921875, -0.26824951171875, -0.133209228515625, 0.0018310546875, 0.136871337890625, 0.27191162109375, 0.406951904296875, 0.5419921875, 0.677032470703125, 0.81207275390625, 0.947113037109375, 1.0821533203125, 1.217193603515625, 1.35223388671875, 1.487274169921875, 1.622314453125, 1.757354736328125, 1.89239501953125, 2.027435302734375, 2.1624755859375, 2.297515869140625, 2.43255615234375, 2.567596435546875, 2.70263671875, 2.837677001953125, 2.97271728515625, 3.107757568359375, 3.2427978515625, 3.377838134765625, 3.51287841796875, 3.647918701171875, 3.782958984375, 3.917999267578125, 4.05303955078125, 4.188079833984375, 4.3231201171875, 4.458160400390625, 4.59320068359375, 4.728240966796875, 4.86328125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 13.0, 8.0, 32.0, 67.0, 105.0, 112.0, 150.0, 165.0, 133.0, 96.0, 53.0, 39.0, 14.0, 7.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-117.06661224365234, -114.57801055908203, -112.08941650390625, -109.60081481933594, -107.11222076416016, -104.62361907958984, -102.13502502441406, -99.64642333984375, -97.15782928466797, -94.66922760009766, -92.18063354492188, -89.69203186035156, -87.20343780517578, -84.71483612060547, -82.22624206542969, -79.73764038085938, -77.24903869628906, -74.76043701171875, -72.27184295654297, -69.78324127197266, -67.29464721679688, -64.80604553222656, -62.31745147705078, -59.82884979248047, -57.34025573730469, -54.85165786743164, -52.363059997558594, -49.87446212768555, -47.3858642578125, -44.89726638793945, -42.408668518066406, -39.920066833496094, -37.43147659301758, -34.94287872314453, -32.454280853271484, -29.965682983398438, -27.47708511352539, -24.988487243652344, -22.499887466430664, -20.011289596557617, -17.52269172668457, -15.034093856811523, -12.545495986938477, -10.056897163391113, -7.568299293518066, -5.0797014236450195, -2.5911026000976562, -0.10250473022460938, 2.3860931396484375, 4.874691009521484, 7.3632893562316895, 9.851887702941895, 12.340485572814941, 14.829083442687988, 17.31768226623535, 19.8062801361084, 22.294878005981445, 24.783475875854492, 27.27207374572754, 29.76067352294922, 32.249271392822266, 34.73786926269531, 37.22646713256836, 39.715065002441406, 42.20366287231445]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 3.0, 8.0, 9.0, 7.0, 5.0, 7.0, 10.0, 16.0, 23.0, 20.0, 25.0, 23.0, 31.0, 31.0, 42.0, 35.0, 63.0, 43.0, 41.0, 51.0, 31.0, 45.0, 40.0, 38.0, 37.0, 45.0, 37.0, 22.0, 33.0, 23.0, 34.0, 17.0, 18.0, 13.0, 10.0, 17.0, 17.0, 6.0, 9.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.286705017089844, -39.012107849121094, -37.73751449584961, -36.46291732788086, -35.188323974609375, -33.913726806640625, -32.63913345336914, -31.36453628540039, -30.089942932128906, -28.81534767150879, -27.540752410888672, -26.266157150268555, -24.991561889648438, -23.71696662902832, -22.442371368408203, -21.167774200439453, -19.893178939819336, -18.61858367919922, -17.3439884185791, -16.069393157958984, -14.794797897338867, -13.52020263671875, -12.245606422424316, -10.9710111618042, -9.696415901184082, -8.421820640563965, -7.147225379943848, -5.872629642486572, -4.598034381866455, -3.323439121246338, -2.0488433837890625, -0.7742481231689453, 0.5003471374511719, 1.7749425172805786, 3.0495378971099854, 4.324133396148682, 5.598728656768799, 6.873323917388916, 8.147919654846191, 9.422514915466309, 10.697110176086426, 11.971705436706543, 13.24630069732666, 14.520896911621094, 15.795492172241211, 17.070087432861328, 18.344682693481445, 19.619277954101562, 20.89387321472168, 22.168468475341797, 23.443063735961914, 24.71765899658203, 25.99225425720215, 27.266849517822266, 28.541446685791016, 29.8160400390625, 31.09063720703125, 32.365234375, 33.639827728271484, 34.914424896240234, 36.18901824951172, 37.46361541748047, 38.73820877075195, 40.0128059387207, 41.28739929199219]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 11.0, 15.0, 29.0, 27.0, 42.0, 93.0, 159.0, 288.0, 531.0, 1058.0, 2435.0, 5516.0, 14161.0, 42572.0, 198254.0, 3472985.0, 366118.0, 58931.0, 18097.0, 6902.0, 3003.0, 1449.0, 703.0, 373.0, 213.0, 124.0, 70.0, 49.0, 24.0, 19.0, 6.0, 7.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.78515625, -7.54656982421875, -7.3079833984375, -7.06939697265625, -6.830810546875, -6.59222412109375, -6.3536376953125, -6.11505126953125, -5.87646484375, -5.63787841796875, -5.3992919921875, -5.16070556640625, -4.922119140625, -4.68353271484375, -4.4449462890625, -4.20635986328125, -3.9677734375, -3.72918701171875, -3.4906005859375, -3.25201416015625, -3.013427734375, -2.77484130859375, -2.5362548828125, -2.29766845703125, -2.05908203125, -1.82049560546875, -1.5819091796875, -1.34332275390625, -1.104736328125, -0.86614990234375, -0.6275634765625, -0.38897705078125, -0.150390625, 0.08819580078125, 0.3267822265625, 0.56536865234375, 0.803955078125, 1.04254150390625, 1.2811279296875, 1.51971435546875, 1.75830078125, 1.99688720703125, 2.2354736328125, 2.47406005859375, 2.712646484375, 2.95123291015625, 3.1898193359375, 3.42840576171875, 3.6669921875, 3.90557861328125, 4.1441650390625, 4.38275146484375, 4.621337890625, 4.85992431640625, 5.0985107421875, 5.33709716796875, 5.57568359375, 5.81427001953125, 6.0528564453125, 6.29144287109375, 6.530029296875, 6.76861572265625, 7.0072021484375, 7.24578857421875, 7.484375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 6.0, 10.0, 10.0, 15.0, 19.0, 23.0, 25.0, 30.0, 40.0, 40.0, 42.0, 42.0, 58.0, 58.0, 43.0, 49.0, 60.0, 47.0, 49.0, 42.0, 40.0, 33.0, 38.0, 33.0, 33.0, 19.0, 10.0, 20.0, 10.0, 13.0, 5.0, 9.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.51171875, -1.4586944580078125, -1.405670166015625, -1.3526458740234375, -1.29962158203125, -1.2465972900390625, -1.193572998046875, -1.1405487060546875, -1.0875244140625, -1.0345001220703125, -0.981475830078125, -0.9284515380859375, -0.87542724609375, -0.8224029541015625, -0.769378662109375, -0.7163543701171875, -0.663330078125, -0.6103057861328125, -0.557281494140625, -0.5042572021484375, -0.45123291015625, -0.3982086181640625, -0.345184326171875, -0.2921600341796875, -0.2391357421875, -0.1861114501953125, -0.133087158203125, -0.0800628662109375, -0.02703857421875, 0.0259857177734375, 0.079010009765625, 0.1320343017578125, 0.18505859375, 0.2380828857421875, 0.291107177734375, 0.3441314697265625, 0.39715576171875, 0.4501800537109375, 0.503204345703125, 0.5562286376953125, 0.6092529296875, 0.6622772216796875, 0.715301513671875, 0.7683258056640625, 0.82135009765625, 0.8743743896484375, 0.927398681640625, 0.9804229736328125, 1.033447265625, 1.0864715576171875, 1.139495849609375, 1.1925201416015625, 1.24554443359375, 1.2985687255859375, 1.351593017578125, 1.4046173095703125, 1.4576416015625, 1.5106658935546875, 1.563690185546875, 1.6167144775390625, 1.66973876953125, 1.7227630615234375, 1.775787353515625, 1.8288116455078125, 1.8818359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 11.0, 9.0, 6.0, 13.0, 24.0, 31.0, 31.0, 70.0, 111.0, 190.0, 260.0, 426.0, 739.0, 1358.0, 2632.0, 5420.0, 12130.0, 30316.0, 91830.0, 464357.0, 3191971.0, 279980.0, 68906.0, 23912.0, 9891.0, 4490.0, 2240.0, 1200.0, 659.0, 392.0, 244.0, 150.0, 94.0, 56.0, 48.0, 28.0, 24.0, 12.0, 3.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0546875, -7.780517578125, -7.50634765625, -7.232177734375, -6.9580078125, -6.683837890625, -6.40966796875, -6.135498046875, -5.861328125, -5.587158203125, -5.31298828125, -5.038818359375, -4.7646484375, -4.490478515625, -4.21630859375, -3.942138671875, -3.66796875, -3.393798828125, -3.11962890625, -2.845458984375, -2.5712890625, -2.297119140625, -2.02294921875, -1.748779296875, -1.474609375, -1.200439453125, -0.92626953125, -0.652099609375, -0.3779296875, -0.103759765625, 0.17041015625, 0.444580078125, 0.71875, 0.992919921875, 1.26708984375, 1.541259765625, 1.8154296875, 2.089599609375, 2.36376953125, 2.637939453125, 2.912109375, 3.186279296875, 3.46044921875, 3.734619140625, 4.0087890625, 4.282958984375, 4.55712890625, 4.831298828125, 5.10546875, 5.379638671875, 5.65380859375, 5.927978515625, 6.2021484375, 6.476318359375, 6.75048828125, 7.024658203125, 7.298828125, 7.572998046875, 7.84716796875, 8.121337890625, 8.3955078125, 8.669677734375, 8.94384765625, 9.218017578125, 9.4921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 7.0, 9.0, 21.0, 33.0, 25.0, 46.0, 63.0, 101.0, 187.0, 298.0, 984.0, 1461.0, 346.0, 184.0, 92.0, 59.0, 37.0, 33.0, 18.0, 15.0, 15.0, 8.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.625, -4.4476318359375, -4.270263671875, -4.0928955078125, -3.91552734375, -3.7381591796875, -3.560791015625, -3.3834228515625, -3.2060546875, -3.0286865234375, -2.851318359375, -2.6739501953125, -2.49658203125, -2.3192138671875, -2.141845703125, -1.9644775390625, -1.787109375, -1.6097412109375, -1.432373046875, -1.2550048828125, -1.07763671875, -0.9002685546875, -0.722900390625, -0.5455322265625, -0.3681640625, -0.1907958984375, -0.013427734375, 0.1639404296875, 0.34130859375, 0.5186767578125, 0.696044921875, 0.8734130859375, 1.05078125, 1.2281494140625, 1.405517578125, 1.5828857421875, 1.76025390625, 1.9376220703125, 2.114990234375, 2.2923583984375, 2.4697265625, 2.6470947265625, 2.824462890625, 3.0018310546875, 3.17919921875, 3.3565673828125, 3.533935546875, 3.7113037109375, 3.888671875, 4.0660400390625, 4.243408203125, 4.4207763671875, 4.59814453125, 4.7755126953125, 4.952880859375, 5.1302490234375, 5.3076171875, 5.4849853515625, 5.662353515625, 5.8397216796875, 6.01708984375, 6.1944580078125, 6.371826171875, 6.5491943359375, 6.7265625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 16.0, 20.0, 36.0, 75.0, 111.0, 138.0, 157.0, 152.0, 110.0, 93.0, 43.0, 21.0, 12.0, 10.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-69.02073669433594, -67.64192962646484, -66.26313018798828, -64.88432312011719, -63.50551986694336, -62.12671661376953, -60.74790954589844, -59.36910629272461, -57.99030303955078, -56.61149978637695, -55.232696533203125, -53.85388946533203, -52.4750862121582, -51.096282958984375, -49.71747589111328, -48.33867263793945, -46.959869384765625, -45.5810661315918, -44.20226287841797, -42.823455810546875, -41.44465255737305, -40.06584930419922, -38.687042236328125, -37.3082389831543, -35.92943572998047, -34.55063247680664, -33.17182922363281, -31.79302215576172, -30.41421890258789, -29.035415649414062, -27.6566104888916, -26.27780532836914, -24.898998260498047, -23.52019500732422, -22.141389846801758, -20.762584686279297, -19.38378143310547, -18.00497817993164, -16.62617301940918, -15.247368812561035, -13.86856460571289, -12.489760398864746, -11.110956192016602, -9.732151985168457, -8.353347778320312, -6.974543571472168, -5.595739364624023, -4.216935157775879, -2.8381309509277344, -1.4593267440795898, -0.08052253723144531, 1.2982816696166992, 2.6770858764648438, 4.055890083312988, 5.434694290161133, 6.813498497009277, 8.192302703857422, 9.571106910705566, 10.949911117553711, 12.328715324401855, 13.70751953125, 15.086323738098145, 16.46512794494629, 17.84393310546875, 19.222736358642578]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 1.0, 6.0, 8.0, 8.0, 9.0, 13.0, 13.0, 13.0, 19.0, 22.0, 32.0, 34.0, 29.0, 25.0, 52.0, 30.0, 49.0, 36.0, 50.0, 45.0, 33.0, 44.0, 53.0, 47.0, 51.0, 39.0, 37.0, 30.0, 27.0, 18.0, 16.0, 18.0, 14.0, 17.0, 16.0, 15.0, 8.0, 4.0, 6.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.01418685913086, -18.439294815063477, -17.864402770996094, -17.28951072692871, -16.714618682861328, -16.139726638793945, -15.564833641052246, -14.989941596984863, -14.41504955291748, -13.840157508850098, -13.265265464782715, -12.690373420715332, -12.115480422973633, -11.54058837890625, -10.965696334838867, -10.390804290771484, -9.815912246704102, -9.241020202636719, -8.666128158569336, -8.091236114501953, -7.516343593597412, -6.941451549530029, -6.366559028625488, -5.7916669845581055, -5.216774940490723, -4.64188289642334, -4.066990852355957, -3.492098331451416, -2.917206287384033, -2.3423142433166504, -1.7674219608306885, -1.1925296783447266, -0.6176376342773438, -0.04274547100067139, 0.532146692276001, 1.1070388555526733, 1.6819310188293457, 2.2568230628967285, 2.8317153453826904, 3.4066076278686523, 3.981499671936035, 4.556391716003418, 5.131283760070801, 5.706176280975342, 6.281068325042725, 6.855960369110107, 7.430852890014648, 8.005744934082031, 8.580636978149414, 9.155529022216797, 9.73042106628418, 10.305313110351562, 10.880205154418945, 11.455097198486328, 12.029990196228027, 12.60488224029541, 13.179774284362793, 13.754666328430176, 14.329558372497559, 14.904450416564941, 15.47934341430664, 16.054235458374023, 16.629127502441406, 17.20401954650879, 17.778911590576172]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 3.0, 10.0, 10.0, 9.0, 16.0, 31.0, 34.0, 51.0, 80.0, 107.0, 159.0, 222.0, 337.0, 497.0, 773.0, 1161.0, 1914.0, 2994.0, 5040.0, 8717.0, 15362.0, 28149.0, 54392.0, 106811.0, 202733.0, 259168.0, 170865.0, 88174.0, 44937.0, 23545.0, 13155.0, 7251.0, 4364.0, 2658.0, 1609.0, 1081.0, 704.0, 448.0, 302.0, 224.0, 152.0, 104.0, 52.0, 39.0, 34.0, 19.0, 11.0, 19.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0], "bins": [-3.671875, -3.561798095703125, -3.45172119140625, -3.341644287109375, -3.2315673828125, -3.121490478515625, -3.01141357421875, -2.901336669921875, -2.791259765625, -2.681182861328125, -2.57110595703125, -2.461029052734375, -2.3509521484375, -2.240875244140625, -2.13079833984375, -2.020721435546875, -1.91064453125, -1.800567626953125, -1.69049072265625, -1.580413818359375, -1.4703369140625, -1.360260009765625, -1.25018310546875, -1.140106201171875, -1.030029296875, -0.919952392578125, -0.80987548828125, -0.699798583984375, -0.5897216796875, -0.479644775390625, -0.36956787109375, -0.259490966796875, -0.1494140625, -0.039337158203125, 0.07073974609375, 0.180816650390625, 0.2908935546875, 0.400970458984375, 0.51104736328125, 0.621124267578125, 0.731201171875, 0.841278076171875, 0.95135498046875, 1.061431884765625, 1.1715087890625, 1.281585693359375, 1.39166259765625, 1.501739501953125, 1.61181640625, 1.721893310546875, 1.83197021484375, 1.942047119140625, 2.0521240234375, 2.162200927734375, 2.27227783203125, 2.382354736328125, 2.492431640625, 2.602508544921875, 2.71258544921875, 2.822662353515625, 2.9327392578125, 3.042816162109375, 3.15289306640625, 3.262969970703125, 3.373046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 3.0, 8.0, 12.0, 10.0, 9.0, 20.0, 20.0, 15.0, 29.0, 34.0, 28.0, 34.0, 40.0, 45.0, 40.0, 36.0, 43.0, 42.0, 54.0, 56.0, 41.0, 48.0, 30.0, 52.0, 34.0, 24.0, 23.0, 22.0, 25.0, 23.0, 14.0, 19.0, 11.0, 9.0, 12.0, 8.0, 7.0, 3.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.78515625, -1.7300567626953125, -1.674957275390625, -1.6198577880859375, -1.56475830078125, -1.5096588134765625, -1.454559326171875, -1.3994598388671875, -1.3443603515625, -1.2892608642578125, -1.234161376953125, -1.1790618896484375, -1.12396240234375, -1.0688629150390625, -1.013763427734375, -0.9586639404296875, -0.903564453125, -0.8484649658203125, -0.793365478515625, -0.7382659912109375, -0.68316650390625, -0.6280670166015625, -0.572967529296875, -0.5178680419921875, -0.4627685546875, -0.4076690673828125, -0.352569580078125, -0.2974700927734375, -0.24237060546875, -0.1872711181640625, -0.132171630859375, -0.0770721435546875, -0.02197265625, 0.0331268310546875, 0.088226318359375, 0.1433258056640625, 0.19842529296875, 0.2535247802734375, 0.308624267578125, 0.3637237548828125, 0.4188232421875, 0.4739227294921875, 0.529022216796875, 0.5841217041015625, 0.63922119140625, 0.6943206787109375, 0.749420166015625, 0.8045196533203125, 0.859619140625, 0.9147186279296875, 0.969818115234375, 1.0249176025390625, 1.08001708984375, 1.1351165771484375, 1.190216064453125, 1.2453155517578125, 1.3004150390625, 1.3555145263671875, 1.410614013671875, 1.4657135009765625, 1.52081298828125, 1.5759124755859375, 1.631011962890625, 1.6861114501953125, 1.7412109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 7.0, 9.0, 10.0, 15.0, 14.0, 32.0, 40.0, 60.0, 98.0, 154.0, 199.0, 307.0, 522.0, 1015.0, 2385.0, 8382.0, 47656.0, 475984.0, 453388.0, 45276.0, 8101.0, 2403.0, 1017.0, 521.0, 307.0, 202.0, 141.0, 78.0, 67.0, 44.0, 28.0, 28.0, 18.0, 17.0, 10.0, 7.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.59375, -14.188232421875, -13.78271484375, -13.377197265625, -12.9716796875, -12.566162109375, -12.16064453125, -11.755126953125, -11.349609375, -10.944091796875, -10.53857421875, -10.133056640625, -9.7275390625, -9.322021484375, -8.91650390625, -8.510986328125, -8.10546875, -7.699951171875, -7.29443359375, -6.888916015625, -6.4833984375, -6.077880859375, -5.67236328125, -5.266845703125, -4.861328125, -4.455810546875, -4.05029296875, -3.644775390625, -3.2392578125, -2.833740234375, -2.42822265625, -2.022705078125, -1.6171875, -1.211669921875, -0.80615234375, -0.400634765625, 0.0048828125, 0.410400390625, 0.81591796875, 1.221435546875, 1.626953125, 2.032470703125, 2.43798828125, 2.843505859375, 3.2490234375, 3.654541015625, 4.06005859375, 4.465576171875, 4.87109375, 5.276611328125, 5.68212890625, 6.087646484375, 6.4931640625, 6.898681640625, 7.30419921875, 7.709716796875, 8.115234375, 8.520751953125, 8.92626953125, 9.331787109375, 9.7373046875, 10.142822265625, 10.54833984375, 10.953857421875, 11.359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 8.0, 12.0, 8.0, 7.0, 14.0, 12.0, 18.0, 20.0, 17.0, 25.0, 26.0, 22.0, 33.0, 38.0, 36.0, 36.0, 39.0, 37.0, 38.0, 32.0, 39.0, 44.0, 43.0, 40.0, 41.0, 39.0, 33.0, 34.0, 26.0, 21.0, 32.0, 20.0, 19.0, 18.0, 13.0, 9.0, 11.0, 7.0, 8.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.859375, -9.5584716796875, -9.257568359375, -8.9566650390625, -8.65576171875, -8.3548583984375, -8.053955078125, -7.7530517578125, -7.4521484375, -7.1512451171875, -6.850341796875, -6.5494384765625, -6.24853515625, -5.9476318359375, -5.646728515625, -5.3458251953125, -5.044921875, -4.7440185546875, -4.443115234375, -4.1422119140625, -3.84130859375, -3.5404052734375, -3.239501953125, -2.9385986328125, -2.6376953125, -2.3367919921875, -2.035888671875, -1.7349853515625, -1.43408203125, -1.1331787109375, -0.832275390625, -0.5313720703125, -0.23046875, 0.0704345703125, 0.371337890625, 0.6722412109375, 0.97314453125, 1.2740478515625, 1.574951171875, 1.8758544921875, 2.1767578125, 2.4776611328125, 2.778564453125, 3.0794677734375, 3.38037109375, 3.6812744140625, 3.982177734375, 4.2830810546875, 4.583984375, 4.8848876953125, 5.185791015625, 5.4866943359375, 5.78759765625, 6.0885009765625, 6.389404296875, 6.6903076171875, 6.9912109375, 7.2921142578125, 7.593017578125, 7.8939208984375, 8.19482421875, 8.4957275390625, 8.796630859375, 9.0975341796875, 9.3984375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 9.0, 12.0, 12.0, 30.0, 60.0, 73.0, 145.0, 336.0, 822.0, 2184.0, 7560.0, 36856.0, 349532.0, 575371.0, 60246.0, 10453.0, 2860.0, 1060.0, 459.0, 229.0, 99.0, 48.0, 34.0, 16.0, 17.0, 7.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.828125, -6.5667724609375, -6.305419921875, -6.0440673828125, -5.78271484375, -5.5213623046875, -5.260009765625, -4.9986572265625, -4.7373046875, -4.4759521484375, -4.214599609375, -3.9532470703125, -3.69189453125, -3.4305419921875, -3.169189453125, -2.9078369140625, -2.646484375, -2.3851318359375, -2.123779296875, -1.8624267578125, -1.60107421875, -1.3397216796875, -1.078369140625, -0.8170166015625, -0.5556640625, -0.2943115234375, -0.032958984375, 0.2283935546875, 0.48974609375, 0.7510986328125, 1.012451171875, 1.2738037109375, 1.53515625, 1.7965087890625, 2.057861328125, 2.3192138671875, 2.58056640625, 2.8419189453125, 3.103271484375, 3.3646240234375, 3.6259765625, 3.8873291015625, 4.148681640625, 4.4100341796875, 4.67138671875, 4.9327392578125, 5.194091796875, 5.4554443359375, 5.716796875, 5.9781494140625, 6.239501953125, 6.5008544921875, 6.76220703125, 7.0235595703125, 7.284912109375, 7.5462646484375, 7.8076171875, 8.0689697265625, 8.330322265625, 8.5916748046875, 8.85302734375, 9.1143798828125, 9.375732421875, 9.6370849609375, 9.8984375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 8.0, 7.0, 7.0, 6.0, 9.0, 12.0, 16.0, 16.0, 24.0, 30.0, 21.0, 45.0, 68.0, 78.0, 91.0, 108.0, 99.0, 93.0, 55.0, 47.0, 39.0, 37.0, 18.0, 14.0, 12.0, 11.0, 6.0, 2.0, 5.0, 2.0, 2.0, 7.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011138916015625, -0.0010773837566375732, -0.0010408759117126465, -0.0010043680667877197, -0.000967860221862793, -0.0009313523769378662, -0.0008948445320129395, -0.0008583366870880127, -0.0008218288421630859, -0.0007853209972381592, -0.0007488131523132324, -0.0007123053073883057, -0.0006757974624633789, -0.0006392896175384521, -0.0006027817726135254, -0.0005662739276885986, -0.0005297660827636719, -0.0004932582378387451, -0.00045675039291381836, -0.0004202425479888916, -0.00038373470306396484, -0.0003472268581390381, -0.00031071901321411133, -0.00027421116828918457, -0.0002377033233642578, -0.00020119547843933105, -0.0001646876335144043, -0.00012817978858947754, -9.167194366455078e-05, -5.5164098739624023e-05, -1.8656253814697266e-05, 1.7851591110229492e-05, 5.435943603515625e-05, 9.086728096008301e-05, 0.00012737512588500977, 0.00016388297080993652, 0.00020039081573486328, 0.00023689866065979004, 0.0002734065055847168, 0.00030991435050964355, 0.0003464221954345703, 0.00038293004035949707, 0.00041943788528442383, 0.0004559457302093506, 0.0004924535751342773, 0.0005289614200592041, 0.0005654692649841309, 0.0006019771099090576, 0.0006384849548339844, 0.0006749927997589111, 0.0007115006446838379, 0.0007480084896087646, 0.0007845163345336914, 0.0008210241794586182, 0.0008575320243835449, 0.0008940398693084717, 0.0009305477142333984, 0.0009670555591583252, 0.001003563404083252, 0.0010400712490081787, 0.0010765790939331055, 0.0011130869388580322, 0.001149594783782959, 0.0011861026287078857, 0.0012226104736328125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 10.0, 13.0, 14.0, 25.0, 37.0, 64.0, 102.0, 174.0, 325.0, 653.0, 1608.0, 5055.0, 25011.0, 284417.0, 659419.0, 58442.0, 8799.0, 2386.0, 960.0, 448.0, 219.0, 126.0, 68.0, 51.0, 33.0, 24.0, 18.0, 11.0, 7.0, 9.0, 4.0, 1.0, 1.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.78125, -9.4952392578125, -9.209228515625, -8.9232177734375, -8.63720703125, -8.3511962890625, -8.065185546875, -7.7791748046875, -7.4931640625, -7.2071533203125, -6.921142578125, -6.6351318359375, -6.34912109375, -6.0631103515625, -5.777099609375, -5.4910888671875, -5.205078125, -4.9190673828125, -4.633056640625, -4.3470458984375, -4.06103515625, -3.7750244140625, -3.489013671875, -3.2030029296875, -2.9169921875, -2.6309814453125, -2.344970703125, -2.0589599609375, -1.77294921875, -1.4869384765625, -1.200927734375, -0.9149169921875, -0.62890625, -0.3428955078125, -0.056884765625, 0.2291259765625, 0.51513671875, 0.8011474609375, 1.087158203125, 1.3731689453125, 1.6591796875, 1.9451904296875, 2.231201171875, 2.5172119140625, 2.80322265625, 3.0892333984375, 3.375244140625, 3.6612548828125, 3.947265625, 4.2332763671875, 4.519287109375, 4.8052978515625, 5.09130859375, 5.3773193359375, 5.663330078125, 5.9493408203125, 6.2353515625, 6.5213623046875, 6.807373046875, 7.0933837890625, 7.37939453125, 7.6654052734375, 7.951416015625, 8.2374267578125, 8.5234375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 5.0, 11.0, 11.0, 16.0, 24.0, 28.0, 42.0, 59.0, 84.0, 115.0, 115.0, 104.0, 94.0, 73.0, 58.0, 46.0, 34.0, 18.0, 20.0, 6.0, 9.0, 10.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8828125, -5.677978515625, -5.47314453125, -5.268310546875, -5.0634765625, -4.858642578125, -4.65380859375, -4.448974609375, -4.244140625, -4.039306640625, -3.83447265625, -3.629638671875, -3.4248046875, -3.219970703125, -3.01513671875, -2.810302734375, -2.60546875, -2.400634765625, -2.19580078125, -1.990966796875, -1.7861328125, -1.581298828125, -1.37646484375, -1.171630859375, -0.966796875, -0.761962890625, -0.55712890625, -0.352294921875, -0.1474609375, 0.057373046875, 0.26220703125, 0.467041015625, 0.671875, 0.876708984375, 1.08154296875, 1.286376953125, 1.4912109375, 1.696044921875, 1.90087890625, 2.105712890625, 2.310546875, 2.515380859375, 2.72021484375, 2.925048828125, 3.1298828125, 3.334716796875, 3.53955078125, 3.744384765625, 3.94921875, 4.154052734375, 4.35888671875, 4.563720703125, 4.7685546875, 4.973388671875, 5.17822265625, 5.383056640625, 5.587890625, 5.792724609375, 5.99755859375, 6.202392578125, 6.4072265625, 6.612060546875, 6.81689453125, 7.021728515625, 7.2265625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 10.0, 19.0, 39.0, 65.0, 152.0, 220.0, 251.0, 145.0, 64.0, 24.0, 10.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.026180267333984, -52.307796478271484, -48.58940887451172, -44.87102508544922, -41.15264129638672, -37.43425750732422, -33.71587371826172, -29.997486114501953, -26.279102325439453, -22.560718536376953, -18.84233283996582, -15.123948097229004, -11.405563354492188, -7.6871795654296875, -3.9687938690185547, -0.2504081726074219, 3.467975616455078, 7.1863603591918945, 10.904745101928711, 14.623129844665527, 18.341514587402344, 22.059898376464844, 25.778284072875977, 29.49666976928711, 33.21505355834961, 36.93343734741211, 40.651824951171875, 44.370208740234375, 48.088592529296875, 51.806976318359375, 55.525360107421875, 59.24374771118164, 62.962127685546875, 66.68051147460938, 70.39889526367188, 74.11727905273438, 77.83566284179688, 81.55404663085938, 85.2724380493164, 88.9908218383789, 92.7092056274414, 96.4275894165039, 100.1459732055664, 103.8643569946289, 107.58274841308594, 111.30113220214844, 115.01951599121094, 118.73789978027344, 122.45628356933594, 126.17466735839844, 129.89305114746094, 133.61143493652344, 137.32981872558594, 141.04820251464844, 144.76658630371094, 148.4849853515625, 152.203369140625, 155.9217529296875, 159.64013671875, 163.3585205078125, 167.076904296875, 170.7952880859375, 174.513671875, 178.2320556640625, 181.950439453125]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 7.0, 11.0, 10.0, 11.0, 17.0, 14.0, 11.0, 20.0, 22.0, 25.0, 40.0, 29.0, 35.0, 47.0, 38.0, 45.0, 53.0, 43.0, 41.0, 52.0, 42.0, 35.0, 48.0, 42.0, 36.0, 36.0, 32.0, 21.0, 25.0, 18.0, 14.0, 14.0, 9.0, 9.0, 8.0, 6.0, 4.0, 4.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-51.45598602294922, -49.82484436035156, -48.19369888305664, -46.562557220458984, -44.93141555786133, -43.300270080566406, -41.66912841796875, -40.037986755371094, -38.40684509277344, -36.77570343017578, -35.14455795288086, -33.5134162902832, -31.882274627685547, -30.251131057739258, -28.61998748779297, -26.988845825195312, -25.35770034790039, -23.7265567779541, -22.095415115356445, -20.464271545410156, -18.8331298828125, -17.20198631286621, -15.570842742919922, -13.93970012664795, -12.308557510375977, -10.677414894104004, -9.046272277832031, -7.415128707885742, -5.7839860916137695, -4.152843475341797, -2.521699905395508, -0.8905572891235352, 0.7405853271484375, 2.3717281818389893, 4.002871036529541, 5.634014129638672, 7.2651567459106445, 8.896299362182617, 10.527442932128906, 12.158585548400879, 13.789728164672852, 15.420870780944824, 17.052013397216797, 18.683156967163086, 20.314300537109375, 21.94544219970703, 23.57658576965332, 25.20772933959961, 26.838871002197266, 28.470014572143555, 30.10115623474121, 31.7322998046875, 33.363441467285156, 34.99458312988281, 36.625728607177734, 38.25687026977539, 39.88801574707031, 41.51915740966797, 43.15030288696289, 44.78144454956055, 46.4125862121582, 48.043731689453125, 49.67487335205078, 51.30601501464844, 52.937156677246094]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 3.0, 5.0, 10.0, 9.0, 11.0, 23.0, 24.0, 32.0, 45.0, 53.0, 59.0, 87.0, 152.0, 305.0, 559.0, 1346.0, 3558.0, 12590.0, 180951.0, 3965638.0, 20656.0, 4710.0, 1795.0, 704.0, 325.0, 177.0, 136.0, 71.0, 57.0, 41.0, 35.0, 24.0, 23.0, 13.0, 14.0, 6.0, 9.0, 4.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0], "bins": [-19.09375, -18.5931396484375, -18.092529296875, -17.5919189453125, -17.09130859375, -16.5906982421875, -16.090087890625, -15.5894775390625, -15.0888671875, -14.5882568359375, -14.087646484375, -13.5870361328125, -13.08642578125, -12.5858154296875, -12.085205078125, -11.5845947265625, -11.083984375, -10.5833740234375, -10.082763671875, -9.5821533203125, -9.08154296875, -8.5809326171875, -8.080322265625, -7.5797119140625, -7.0791015625, -6.5784912109375, -6.077880859375, -5.5772705078125, -5.07666015625, -4.5760498046875, -4.075439453125, -3.5748291015625, -3.07421875, -2.5736083984375, -2.072998046875, -1.5723876953125, -1.07177734375, -0.5711669921875, -0.070556640625, 0.4300537109375, 0.9306640625, 1.4312744140625, 1.931884765625, 2.4324951171875, 2.93310546875, 3.4337158203125, 3.934326171875, 4.4349365234375, 4.935546875, 5.4361572265625, 5.936767578125, 6.4373779296875, 6.93798828125, 7.4385986328125, 7.939208984375, 8.4398193359375, 8.9404296875, 9.4410400390625, 9.941650390625, 10.4422607421875, 10.94287109375, 11.4434814453125, 11.944091796875, 12.4447021484375, 12.9453125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 14.0, 17.0, 18.0, 25.0, 27.0, 41.0, 41.0, 38.0, 60.0, 50.0, 56.0, 63.0, 76.0, 40.0, 52.0, 53.0, 58.0, 41.0, 38.0, 31.0, 28.0, 35.0, 20.0, 12.0, 16.0, 7.0, 10.0, 8.0, 3.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.595703125, -2.514190673828125, -2.43267822265625, -2.351165771484375, -2.2696533203125, -2.188140869140625, -2.10662841796875, -2.025115966796875, -1.943603515625, -1.862091064453125, -1.78057861328125, -1.699066162109375, -1.6175537109375, -1.536041259765625, -1.45452880859375, -1.373016357421875, -1.29150390625, -1.209991455078125, -1.12847900390625, -1.046966552734375, -0.9654541015625, -0.883941650390625, -0.80242919921875, -0.720916748046875, -0.639404296875, -0.557891845703125, -0.47637939453125, -0.394866943359375, -0.3133544921875, -0.231842041015625, -0.15032958984375, -0.068817138671875, 0.0126953125, 0.094207763671875, 0.17572021484375, 0.257232666015625, 0.3387451171875, 0.420257568359375, 0.50177001953125, 0.583282470703125, 0.664794921875, 0.746307373046875, 0.82781982421875, 0.909332275390625, 0.9908447265625, 1.072357177734375, 1.15386962890625, 1.235382080078125, 1.31689453125, 1.398406982421875, 1.47991943359375, 1.561431884765625, 1.6429443359375, 1.724456787109375, 1.80596923828125, 1.887481689453125, 1.968994140625, 2.050506591796875, 2.13201904296875, 2.213531494140625, 2.2950439453125, 2.376556396484375, 2.45806884765625, 2.539581298828125, 2.62109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 12.0, 20.0, 23.0, 49.0, 75.0, 75.0, 145.0, 191.0, 327.0, 558.0, 1138.0, 2645.0, 7967.0, 40917.0, 4060695.0, 63017.0, 10274.0, 3144.0, 1317.0, 663.0, 352.0, 237.0, 153.0, 88.0, 62.0, 46.0, 40.0, 20.0, 7.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.703125, -21.880126953125, -21.05712890625, -20.234130859375, -19.4111328125, -18.588134765625, -17.76513671875, -16.942138671875, -16.119140625, -15.296142578125, -14.47314453125, -13.650146484375, -12.8271484375, -12.004150390625, -11.18115234375, -10.358154296875, -9.53515625, -8.712158203125, -7.88916015625, -7.066162109375, -6.2431640625, -5.420166015625, -4.59716796875, -3.774169921875, -2.951171875, -2.128173828125, -1.30517578125, -0.482177734375, 0.3408203125, 1.163818359375, 1.98681640625, 2.809814453125, 3.6328125, 4.455810546875, 5.27880859375, 6.101806640625, 6.9248046875, 7.747802734375, 8.57080078125, 9.393798828125, 10.216796875, 11.039794921875, 11.86279296875, 12.685791015625, 13.5087890625, 14.331787109375, 15.15478515625, 15.977783203125, 16.80078125, 17.623779296875, 18.44677734375, 19.269775390625, 20.0927734375, 20.915771484375, 21.73876953125, 22.561767578125, 23.384765625, 24.207763671875, 25.03076171875, 25.853759765625, 26.6767578125, 27.499755859375, 28.32275390625, 29.145751953125, 29.96875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 10.0, 5.0, 22.0, 9.0, 27.0, 44.0, 190.0, 3329.0, 255.0, 61.0, 30.0, 25.0, 14.0, 8.0, 12.0, 6.0, 6.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.375, -3.260955810546875, -3.14691162109375, -3.032867431640625, -2.9188232421875, -2.804779052734375, -2.69073486328125, -2.576690673828125, -2.462646484375, -2.348602294921875, -2.23455810546875, -2.120513916015625, -2.0064697265625, -1.892425537109375, -1.77838134765625, -1.664337158203125, -1.55029296875, -1.436248779296875, -1.32220458984375, -1.208160400390625, -1.0941162109375, -0.980072021484375, -0.86602783203125, -0.751983642578125, -0.637939453125, -0.523895263671875, -0.40985107421875, -0.295806884765625, -0.1817626953125, -0.067718505859375, 0.04632568359375, 0.160369873046875, 0.2744140625, 0.388458251953125, 0.50250244140625, 0.616546630859375, 0.7305908203125, 0.844635009765625, 0.95867919921875, 1.072723388671875, 1.186767578125, 1.300811767578125, 1.41485595703125, 1.528900146484375, 1.6429443359375, 1.756988525390625, 1.87103271484375, 1.985076904296875, 2.09912109375, 2.213165283203125, 2.32720947265625, 2.441253662109375, 2.5552978515625, 2.669342041015625, 2.78338623046875, 2.897430419921875, 3.011474609375, 3.125518798828125, 3.23956298828125, 3.353607177734375, 3.4676513671875, 3.581695556640625, 3.69573974609375, 3.809783935546875, 3.923828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 6.0, 13.0, 18.0, 24.0, 25.0, 44.0, 55.0, 72.0, 114.0, 102.0, 121.0, 103.0, 81.0, 67.0, 51.0, 35.0, 21.0, 18.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.147695541381836, -15.703191757202148, -15.258687973022461, -14.814184188842773, -14.369681358337402, -13.925177574157715, -13.480673789978027, -13.03617000579834, -12.591666221618652, -12.147162437438965, -11.702658653259277, -11.258155822753906, -10.813652038574219, -10.369148254394531, -9.924644470214844, -9.480140686035156, -9.035636901855469, -8.591133117675781, -8.146629333496094, -7.7021260261535645, -7.257622241973877, -6.813118934631348, -6.36861515045166, -5.924111366271973, -5.479608535766602, -5.035104751586914, -4.590601444244385, -4.146097660064697, -3.7015938758850098, -3.2570903301239014, -2.812586784362793, -2.3680830001831055, -1.923579216003418, -1.47907555103302, -1.034571886062622, -0.5900683403015137, -0.14556467533111572, 0.2989389896392822, 0.7434425354003906, 1.1879463195800781, 1.6324498653411865, 2.076953411102295, 2.5214571952819824, 2.965960741043091, 3.410464286804199, 3.8549680709838867, 4.299471855163574, 4.743975639343262, 5.188478946685791, 5.6329827308654785, 6.077486038208008, 6.521989822387695, 6.966493606567383, 7.41099739074707, 7.8555006980896, 8.300004959106445, 8.744507789611816, 9.189011573791504, 9.633515357971191, 10.078018188476562, 10.52252197265625, 10.967025756835938, 11.411529541015625, 11.856033325195312, 12.300537109375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 5.0, 13.0, 10.0, 13.0, 17.0, 23.0, 24.0, 24.0, 33.0, 34.0, 31.0, 56.0, 54.0, 68.0, 42.0, 54.0, 54.0, 38.0, 41.0, 50.0, 50.0, 40.0, 42.0, 31.0, 31.0, 22.0, 21.0, 17.0, 8.0, 10.0, 11.0, 9.0, 9.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.020988464355469, -10.693446159362793, -10.3659029006958, -10.038360595703125, -9.71081829071045, -9.383275985717773, -9.055732727050781, -8.728190422058105, -8.40064811706543, -8.073105812072754, -7.74556303024292, -7.418020248413086, -7.09047794342041, -6.762935161590576, -6.435392379760742, -6.107850074768066, -5.780307292938232, -5.452764511108398, -5.125222206115723, -4.797679424285889, -4.470137119293213, -4.142594337463379, -3.815051794052124, -3.487509250640869, -3.1599667072296143, -2.8324241638183594, -2.5048816204071045, -2.1773390769958496, -1.8497964143753052, -1.5222538709640503, -1.1947112083435059, -0.867168664932251, -0.5396261215209961, -0.21208354830741882, 0.11545902490615845, 0.4430016279220581, 0.770544171333313, 1.0980867147445679, 1.4256293773651123, 1.7531719207763672, 2.080714464187622, 2.408257007598877, 2.735799551010132, 3.0633420944213867, 3.3908848762512207, 3.7184271812438965, 4.0459699630737305, 4.373512268066406, 4.70105504989624, 5.028597831726074, 5.35614013671875, 5.683682918548584, 6.01122522354126, 6.338768005371094, 6.6663103103637695, 6.9938530921936035, 7.3213958740234375, 7.6489386558532715, 7.976480960845947, 8.304023742675781, 8.631566047668457, 8.959108352661133, 9.286651611328125, 9.6141939163208, 9.941736221313477]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 5.0, 13.0, 10.0, 14.0, 19.0, 28.0, 42.0, 62.0, 99.0, 171.0, 286.0, 559.0, 1132.0, 2317.0, 4870.0, 11467.0, 28511.0, 72834.0, 183030.0, 337588.0, 239718.0, 99289.0, 38618.0, 15360.0, 6470.0, 2957.0, 1429.0, 707.0, 392.0, 225.0, 117.0, 63.0, 57.0, 28.0, 15.0, 14.0, 14.0, 7.0, 9.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.3671875, -6.18865966796875, -6.0101318359375, -5.83160400390625, -5.653076171875, -5.47454833984375, -5.2960205078125, -5.11749267578125, -4.93896484375, -4.76043701171875, -4.5819091796875, -4.40338134765625, -4.224853515625, -4.04632568359375, -3.8677978515625, -3.68927001953125, -3.5107421875, -3.33221435546875, -3.1536865234375, -2.97515869140625, -2.796630859375, -2.61810302734375, -2.4395751953125, -2.26104736328125, -2.08251953125, -1.90399169921875, -1.7254638671875, -1.54693603515625, -1.368408203125, -1.18988037109375, -1.0113525390625, -0.83282470703125, -0.654296875, -0.47576904296875, -0.2972412109375, -0.11871337890625, 0.059814453125, 0.23834228515625, 0.4168701171875, 0.59539794921875, 0.77392578125, 0.95245361328125, 1.1309814453125, 1.30950927734375, 1.488037109375, 1.66656494140625, 1.8450927734375, 2.02362060546875, 2.2021484375, 2.38067626953125, 2.5592041015625, 2.73773193359375, 2.916259765625, 3.09478759765625, 3.2733154296875, 3.45184326171875, 3.63037109375, 3.80889892578125, 3.9874267578125, 4.16595458984375, 4.344482421875, 4.52301025390625, 4.7015380859375, 4.88006591796875, 5.05859375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 11.0, 10.0, 9.0, 12.0, 11.0, 11.0, 19.0, 21.0, 16.0, 22.0, 30.0, 30.0, 30.0, 33.0, 47.0, 43.0, 46.0, 50.0, 40.0, 39.0, 41.0, 42.0, 48.0, 36.0, 44.0, 50.0, 33.0, 32.0, 30.0, 23.0, 11.0, 20.0, 15.0, 7.0, 8.0, 6.0, 10.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.76953125, -2.694366455078125, -2.61920166015625, -2.544036865234375, -2.4688720703125, -2.393707275390625, -2.31854248046875, -2.243377685546875, -2.168212890625, -2.093048095703125, -2.01788330078125, -1.942718505859375, -1.8675537109375, -1.792388916015625, -1.71722412109375, -1.642059326171875, -1.56689453125, -1.491729736328125, -1.41656494140625, -1.341400146484375, -1.2662353515625, -1.191070556640625, -1.11590576171875, -1.040740966796875, -0.965576171875, -0.890411376953125, -0.81524658203125, -0.740081787109375, -0.6649169921875, -0.589752197265625, -0.51458740234375, -0.439422607421875, -0.3642578125, -0.289093017578125, -0.21392822265625, -0.138763427734375, -0.0635986328125, 0.011566162109375, 0.08673095703125, 0.161895751953125, 0.237060546875, 0.312225341796875, 0.38739013671875, 0.462554931640625, 0.5377197265625, 0.612884521484375, 0.68804931640625, 0.763214111328125, 0.83837890625, 0.913543701171875, 0.98870849609375, 1.063873291015625, 1.1390380859375, 1.214202880859375, 1.28936767578125, 1.364532470703125, 1.439697265625, 1.514862060546875, 1.59002685546875, 1.665191650390625, 1.7403564453125, 1.815521240234375, 1.89068603515625, 1.965850830078125, 2.041015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 4.0, 6.0, 9.0, 15.0, 20.0, 29.0, 31.0, 45.0, 73.0, 92.0, 169.0, 237.0, 388.0, 667.0, 1276.0, 3546.0, 15360.0, 133641.0, 730466.0, 139660.0, 16295.0, 3528.0, 1234.0, 620.0, 384.0, 268.0, 160.0, 101.0, 76.0, 43.0, 33.0, 20.0, 15.0, 10.0, 12.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.8125, -16.3253173828125, -15.838134765625, -15.3509521484375, -14.86376953125, -14.3765869140625, -13.889404296875, -13.4022216796875, -12.9150390625, -12.4278564453125, -11.940673828125, -11.4534912109375, -10.96630859375, -10.4791259765625, -9.991943359375, -9.5047607421875, -9.017578125, -8.5303955078125, -8.043212890625, -7.5560302734375, -7.06884765625, -6.5816650390625, -6.094482421875, -5.6072998046875, -5.1201171875, -4.6329345703125, -4.145751953125, -3.6585693359375, -3.17138671875, -2.6842041015625, -2.197021484375, -1.7098388671875, -1.22265625, -0.7354736328125, -0.248291015625, 0.2388916015625, 0.72607421875, 1.2132568359375, 1.700439453125, 2.1876220703125, 2.6748046875, 3.1619873046875, 3.649169921875, 4.1363525390625, 4.62353515625, 5.1107177734375, 5.597900390625, 6.0850830078125, 6.572265625, 7.0594482421875, 7.546630859375, 8.0338134765625, 8.52099609375, 9.0081787109375, 9.495361328125, 9.9825439453125, 10.4697265625, 10.9569091796875, 11.444091796875, 11.9312744140625, 12.41845703125, 12.9056396484375, 13.392822265625, 13.8800048828125, 14.3671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 3.0, 2.0, 8.0, 8.0, 10.0, 9.0, 14.0, 18.0, 15.0, 18.0, 20.0, 21.0, 40.0, 31.0, 22.0, 43.0, 46.0, 50.0, 43.0, 41.0, 33.0, 28.0, 41.0, 43.0, 35.0, 42.0, 45.0, 25.0, 32.0, 32.0, 20.0, 25.0, 25.0, 17.0, 11.0, 19.0, 11.0, 15.0, 10.0, 7.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.9609375, -11.5943603515625, -11.227783203125, -10.8612060546875, -10.49462890625, -10.1280517578125, -9.761474609375, -9.3948974609375, -9.0283203125, -8.6617431640625, -8.295166015625, -7.9285888671875, -7.56201171875, -7.1954345703125, -6.828857421875, -6.4622802734375, -6.095703125, -5.7291259765625, -5.362548828125, -4.9959716796875, -4.62939453125, -4.2628173828125, -3.896240234375, -3.5296630859375, -3.1630859375, -2.7965087890625, -2.429931640625, -2.0633544921875, -1.69677734375, -1.3302001953125, -0.963623046875, -0.5970458984375, -0.23046875, 0.1361083984375, 0.502685546875, 0.8692626953125, 1.23583984375, 1.6024169921875, 1.968994140625, 2.3355712890625, 2.7021484375, 3.0687255859375, 3.435302734375, 3.8018798828125, 4.16845703125, 4.5350341796875, 4.901611328125, 5.2681884765625, 5.634765625, 6.0013427734375, 6.367919921875, 6.7344970703125, 7.10107421875, 7.4676513671875, 7.834228515625, 8.2008056640625, 8.5673828125, 8.9339599609375, 9.300537109375, 9.6671142578125, 10.03369140625, 10.4002685546875, 10.766845703125, 11.1334228515625, 11.5]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 2.0, 10.0, 12.0, 13.0, 27.0, 48.0, 93.0, 118.0, 272.0, 524.0, 1137.0, 3618.0, 15450.0, 195186.0, 775202.0, 46052.0, 7158.0, 2078.0, 753.0, 371.0, 160.0, 96.0, 73.0, 35.0, 23.0, 13.0, 8.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1796875, -12.805908203125, -12.43212890625, -12.058349609375, -11.6845703125, -11.310791015625, -10.93701171875, -10.563232421875, -10.189453125, -9.815673828125, -9.44189453125, -9.068115234375, -8.6943359375, -8.320556640625, -7.94677734375, -7.572998046875, -7.19921875, -6.825439453125, -6.45166015625, -6.077880859375, -5.7041015625, -5.330322265625, -4.95654296875, -4.582763671875, -4.208984375, -3.835205078125, -3.46142578125, -3.087646484375, -2.7138671875, -2.340087890625, -1.96630859375, -1.592529296875, -1.21875, -0.844970703125, -0.47119140625, -0.097412109375, 0.2763671875, 0.650146484375, 1.02392578125, 1.397705078125, 1.771484375, 2.145263671875, 2.51904296875, 2.892822265625, 3.2666015625, 3.640380859375, 4.01416015625, 4.387939453125, 4.76171875, 5.135498046875, 5.50927734375, 5.883056640625, 6.2568359375, 6.630615234375, 7.00439453125, 7.378173828125, 7.751953125, 8.125732421875, 8.49951171875, 8.873291015625, 9.2470703125, 9.620849609375, 9.99462890625, 10.368408203125, 10.7421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 3.0, 7.0, 9.0, 6.0, 15.0, 11.0, 18.0, 21.0, 36.0, 43.0, 53.0, 79.0, 91.0, 86.0, 85.0, 88.0, 77.0, 53.0, 55.0, 34.0, 32.0, 25.0, 14.0, 15.0, 13.0, 9.0, 7.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013427734375, -0.001309424638748169, -0.0012760758399963379, -0.0012427270412445068, -0.0012093782424926758, -0.0011760294437408447, -0.0011426806449890137, -0.0011093318462371826, -0.0010759830474853516, -0.0010426342487335205, -0.0010092854499816895, -0.0009759366512298584, -0.0009425878524780273, -0.0009092390537261963, -0.0008758902549743652, -0.0008425414562225342, -0.0008091926574707031, -0.0007758438587188721, -0.000742495059967041, -0.00070914626121521, -0.0006757974624633789, -0.0006424486637115479, -0.0006090998649597168, -0.0005757510662078857, -0.0005424022674560547, -0.0005090534687042236, -0.0004757046699523926, -0.0004423558712005615, -0.00040900707244873047, -0.0003756582736968994, -0.00034230947494506836, -0.0003089606761932373, -0.00027561187744140625, -0.0002422630786895752, -0.00020891427993774414, -0.00017556548118591309, -0.00014221668243408203, -0.00010886788368225098, -7.551908493041992e-05, -4.217028617858887e-05, -8.821487426757812e-06, 2.4527311325073242e-05, 5.78761100769043e-05, 9.122490882873535e-05, 0.0001245737075805664, 0.00015792250633239746, 0.00019127130508422852, 0.00022462010383605957, 0.0002579689025878906, 0.0002913177013397217, 0.00032466650009155273, 0.0003580152988433838, 0.00039136409759521484, 0.0004247128963470459, 0.00045806169509887695, 0.000491410493850708, 0.0005247592926025391, 0.0005581080913543701, 0.0005914568901062012, 0.0006248056888580322, 0.0006581544876098633, 0.0006915032863616943, 0.0007248520851135254, 0.0007582008838653564, 0.0007915496826171875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 3.0, 3.0, 13.0, 13.0, 14.0, 20.0, 21.0, 39.0, 44.0, 100.0, 147.0, 289.0, 485.0, 1202.0, 3474.0, 13564.0, 114702.0, 806603.0, 90341.0, 12098.0, 3102.0, 1156.0, 498.0, 235.0, 116.0, 71.0, 44.0, 32.0, 29.0, 17.0, 12.0, 12.0, 7.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.7734375, -10.4415283203125, -10.109619140625, -9.7777099609375, -9.44580078125, -9.1138916015625, -8.781982421875, -8.4500732421875, -8.1181640625, -7.7862548828125, -7.454345703125, -7.1224365234375, -6.79052734375, -6.4586181640625, -6.126708984375, -5.7947998046875, -5.462890625, -5.1309814453125, -4.799072265625, -4.4671630859375, -4.13525390625, -3.8033447265625, -3.471435546875, -3.1395263671875, -2.8076171875, -2.4757080078125, -2.143798828125, -1.8118896484375, -1.47998046875, -1.1480712890625, -0.816162109375, -0.4842529296875, -0.15234375, 0.1795654296875, 0.511474609375, 0.8433837890625, 1.17529296875, 1.5072021484375, 1.839111328125, 2.1710205078125, 2.5029296875, 2.8348388671875, 3.166748046875, 3.4986572265625, 3.83056640625, 4.1624755859375, 4.494384765625, 4.8262939453125, 5.158203125, 5.4901123046875, 5.822021484375, 6.1539306640625, 6.48583984375, 6.8177490234375, 7.149658203125, 7.4815673828125, 7.8134765625, 8.1453857421875, 8.477294921875, 8.8092041015625, 9.14111328125, 9.4730224609375, 9.804931640625, 10.1368408203125, 10.46875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 1.0, 6.0, 13.0, 12.0, 11.0, 19.0, 34.0, 46.0, 59.0, 78.0, 103.0, 118.0, 131.0, 80.0, 74.0, 60.0, 44.0, 22.0, 19.0, 13.0, 10.0, 7.0, 5.0, 3.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.3125, -8.0809326171875, -7.849365234375, -7.6177978515625, -7.38623046875, -7.1546630859375, -6.923095703125, -6.6915283203125, -6.4599609375, -6.2283935546875, -5.996826171875, -5.7652587890625, -5.53369140625, -5.3021240234375, -5.070556640625, -4.8389892578125, -4.607421875, -4.3758544921875, -4.144287109375, -3.9127197265625, -3.68115234375, -3.4495849609375, -3.218017578125, -2.9864501953125, -2.7548828125, -2.5233154296875, -2.291748046875, -2.0601806640625, -1.82861328125, -1.5970458984375, -1.365478515625, -1.1339111328125, -0.90234375, -0.6707763671875, -0.439208984375, -0.2076416015625, 0.02392578125, 0.2554931640625, 0.487060546875, 0.7186279296875, 0.9501953125, 1.1817626953125, 1.413330078125, 1.6448974609375, 1.87646484375, 2.1080322265625, 2.339599609375, 2.5711669921875, 2.802734375, 3.0343017578125, 3.265869140625, 3.4974365234375, 3.72900390625, 3.9605712890625, 4.192138671875, 4.4237060546875, 4.6552734375, 4.8868408203125, 5.118408203125, 5.3499755859375, 5.58154296875, 5.8131103515625, 6.044677734375, 6.2762451171875, 6.5078125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 12.0, 22.0, 40.0, 75.0, 110.0, 156.0, 169.0, 155.0, 104.0, 85.0, 32.0, 11.0, 15.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-180.37681579589844, -176.47836303710938, -172.5799102783203, -168.68145751953125, -164.7830047607422, -160.88455200195312, -156.98611450195312, -153.08766174316406, -149.189208984375, -145.29075622558594, -141.39230346679688, -137.4938507080078, -133.59539794921875, -129.69696044921875, -125.79850006103516, -121.9000473022461, -118.00159454345703, -114.10314178466797, -110.2046890258789, -106.30624389648438, -102.40779113769531, -98.50933837890625, -94.61088562011719, -90.71243286132812, -86.81398010253906, -82.91552734375, -79.01707458496094, -75.11862182617188, -71.22017669677734, -67.32172393798828, -63.42327117919922, -59.524818420410156, -55.626380920410156, -51.727928161621094, -47.8294792175293, -43.931026458740234, -40.03257751464844, -36.134124755859375, -32.23567199707031, -28.337221145629883, -24.438770294189453, -20.540319442749023, -16.641868591308594, -12.743415832519531, -8.844964981079102, -4.946514129638672, -1.0480613708496094, 2.8503894805908203, 6.74884033203125, 10.64729118347168, 14.545742988586426, 18.444194793701172, 22.3426456451416, 26.24109649658203, 30.139549255371094, 34.038002014160156, 37.93645095825195, 41.834903717041016, 45.73335266113281, 49.631805419921875, 53.53025817871094, 57.428707122802734, 61.3271598815918, 65.2256088256836, 69.12406158447266]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 7.0, 5.0, 12.0, 12.0, 20.0, 26.0, 14.0, 20.0, 30.0, 31.0, 39.0, 46.0, 35.0, 43.0, 53.0, 38.0, 62.0, 48.0, 64.0, 46.0, 38.0, 45.0, 34.0, 27.0, 26.0, 37.0, 20.0, 20.0, 20.0, 10.0, 14.0, 17.0, 9.0, 6.0, 7.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.31622314453125, -57.11467742919922, -54.91313552856445, -52.71158981323242, -50.510047912597656, -48.308502197265625, -46.106956481933594, -43.90541458129883, -41.70387268066406, -39.50232696533203, -37.300785064697266, -35.099239349365234, -32.89769744873047, -30.696151733398438, -28.49460792541504, -26.29306411743164, -24.09151840209961, -21.88997459411621, -19.688430786132812, -17.48688507080078, -15.2853422164917, -13.0837984085083, -10.882253646850586, -8.680709838867188, -6.479166030883789, -4.277622222900391, -2.076077938079834, 0.12546634674072266, 2.327010154724121, 4.5285539627075195, 6.730098724365234, 8.931642532348633, 11.133186340332031, 13.33473014831543, 15.536273956298828, 17.73781967163086, 19.939361572265625, 22.140907287597656, 24.342451095581055, 26.543994903564453, 28.74553871154785, 30.94708251953125, 33.14862823486328, 35.35017013549805, 37.55171585083008, 39.753257751464844, 41.954803466796875, 44.156349182128906, 46.35789108276367, 48.5594367980957, 50.76097869873047, 52.9625244140625, 55.164066314697266, 57.3656120300293, 59.56715393066406, 61.768699645996094, 63.970245361328125, 66.17179107666016, 68.37333679199219, 70.57487487792969, 72.77642059326172, 74.97796630859375, 77.17951202392578, 79.38105773925781, 81.58259582519531]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 3.0, 3.0, 13.0, 14.0, 19.0, 10.0, 19.0, 32.0, 27.0, 34.0, 47.0, 81.0, 170.0, 437.0, 1514.0, 7168.0, 100322.0, 4063649.0, 16595.0, 2675.0, 786.0, 268.0, 120.0, 72.0, 41.0, 38.0, 19.0, 22.0, 21.0, 12.0, 9.0, 4.0, 4.0, 5.0, 5.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-22.21875, -21.5498046875, -20.880859375, -20.2119140625, -19.54296875, -18.8740234375, -18.205078125, -17.5361328125, -16.8671875, -16.1982421875, -15.529296875, -14.8603515625, -14.19140625, -13.5224609375, -12.853515625, -12.1845703125, -11.515625, -10.8466796875, -10.177734375, -9.5087890625, -8.83984375, -8.1708984375, -7.501953125, -6.8330078125, -6.1640625, -5.4951171875, -4.826171875, -4.1572265625, -3.48828125, -2.8193359375, -2.150390625, -1.4814453125, -0.8125, -0.1435546875, 0.525390625, 1.1943359375, 1.86328125, 2.5322265625, 3.201171875, 3.8701171875, 4.5390625, 5.2080078125, 5.876953125, 6.5458984375, 7.21484375, 7.8837890625, 8.552734375, 9.2216796875, 9.890625, 10.5595703125, 11.228515625, 11.8974609375, 12.56640625, 13.2353515625, 13.904296875, 14.5732421875, 15.2421875, 15.9111328125, 16.580078125, 17.2490234375, 17.91796875, 18.5869140625, 19.255859375, 19.9248046875, 20.59375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 3.0, 3.0, 9.0, 7.0, 11.0, 13.0, 11.0, 18.0, 15.0, 24.0, 28.0, 27.0, 38.0, 38.0, 34.0, 44.0, 61.0, 46.0, 47.0, 59.0, 54.0, 55.0, 53.0, 57.0, 54.0, 42.0, 31.0, 21.0, 19.0, 16.0, 14.0, 8.0, 8.0, 5.0, 9.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.244140625, -3.156280517578125, -3.06842041015625, -2.980560302734375, -2.8927001953125, -2.804840087890625, -2.71697998046875, -2.629119873046875, -2.541259765625, -2.453399658203125, -2.36553955078125, -2.277679443359375, -2.1898193359375, -2.101959228515625, -2.01409912109375, -1.926239013671875, -1.83837890625, -1.750518798828125, -1.66265869140625, -1.574798583984375, -1.4869384765625, -1.399078369140625, -1.31121826171875, -1.223358154296875, -1.135498046875, -1.047637939453125, -0.95977783203125, -0.871917724609375, -0.7840576171875, -0.696197509765625, -0.60833740234375, -0.520477294921875, -0.4326171875, -0.344757080078125, -0.25689697265625, -0.169036865234375, -0.0811767578125, 0.006683349609375, 0.09454345703125, 0.182403564453125, 0.270263671875, 0.358123779296875, 0.44598388671875, 0.533843994140625, 0.6217041015625, 0.709564208984375, 0.79742431640625, 0.885284423828125, 0.97314453125, 1.061004638671875, 1.14886474609375, 1.236724853515625, 1.3245849609375, 1.412445068359375, 1.50030517578125, 1.588165283203125, 1.676025390625, 1.763885498046875, 1.85174560546875, 1.939605712890625, 2.0274658203125, 2.115325927734375, 2.20318603515625, 2.291046142578125, 2.37890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 6.0, 4.0, 2.0, 3.0, 9.0, 9.0, 12.0, 22.0, 31.0, 46.0, 76.0, 135.0, 156.0, 255.0, 458.0, 783.0, 1391.0, 2842.0, 6411.0, 18577.0, 113227.0, 3969489.0, 57152.0, 13002.0, 4928.0, 2385.0, 1168.0, 656.0, 398.0, 209.0, 138.0, 107.0, 54.0, 47.0, 35.0, 19.0, 12.0, 13.0, 10.0, 7.0, 3.0, 3.0, 5.0, 0.0, 2.0], "bins": [-21.46875, -20.936767578125, -20.40478515625, -19.872802734375, -19.3408203125, -18.808837890625, -18.27685546875, -17.744873046875, -17.212890625, -16.680908203125, -16.14892578125, -15.616943359375, -15.0849609375, -14.552978515625, -14.02099609375, -13.489013671875, -12.95703125, -12.425048828125, -11.89306640625, -11.361083984375, -10.8291015625, -10.297119140625, -9.76513671875, -9.233154296875, -8.701171875, -8.169189453125, -7.63720703125, -7.105224609375, -6.5732421875, -6.041259765625, -5.50927734375, -4.977294921875, -4.4453125, -3.913330078125, -3.38134765625, -2.849365234375, -2.3173828125, -1.785400390625, -1.25341796875, -0.721435546875, -0.189453125, 0.342529296875, 0.87451171875, 1.406494140625, 1.9384765625, 2.470458984375, 3.00244140625, 3.534423828125, 4.06640625, 4.598388671875, 5.13037109375, 5.662353515625, 6.1943359375, 6.726318359375, 7.25830078125, 7.790283203125, 8.322265625, 8.854248046875, 9.38623046875, 9.918212890625, 10.4501953125, 10.982177734375, 11.51416015625, 12.046142578125, 12.578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 6.0, 4.0, 3.0, 7.0, 12.0, 15.0, 27.0, 40.0, 68.0, 235.0, 3337.0, 174.0, 58.0, 32.0, 12.0, 15.0, 6.0, 9.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.3359375, -5.200775146484375, -5.06561279296875, -4.930450439453125, -4.7952880859375, -4.660125732421875, -4.52496337890625, -4.389801025390625, -4.254638671875, -4.119476318359375, -3.98431396484375, -3.849151611328125, -3.7139892578125, -3.578826904296875, -3.44366455078125, -3.308502197265625, -3.17333984375, -3.038177490234375, -2.90301513671875, -2.767852783203125, -2.6326904296875, -2.497528076171875, -2.36236572265625, -2.227203369140625, -2.092041015625, -1.956878662109375, -1.82171630859375, -1.686553955078125, -1.5513916015625, -1.416229248046875, -1.28106689453125, -1.145904541015625, -1.0107421875, -0.875579833984375, -0.74041748046875, -0.605255126953125, -0.4700927734375, -0.334930419921875, -0.19976806640625, -0.064605712890625, 0.070556640625, 0.205718994140625, 0.34088134765625, 0.476043701171875, 0.6112060546875, 0.746368408203125, 0.88153076171875, 1.016693115234375, 1.15185546875, 1.287017822265625, 1.42218017578125, 1.557342529296875, 1.6925048828125, 1.827667236328125, 1.96282958984375, 2.097991943359375, 2.233154296875, 2.368316650390625, 2.50347900390625, 2.638641357421875, 2.7738037109375, 2.908966064453125, 3.04412841796875, 3.179290771484375, 3.314453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 8.0, 15.0, 17.0, 23.0, 44.0, 50.0, 65.0, 80.0, 85.0, 80.0, 116.0, 122.0, 87.0, 60.0, 33.0, 29.0, 23.0, 22.0, 11.0, 7.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.75586700439453, -18.306509017944336, -17.85715103149414, -17.407793045043945, -16.95843505859375, -16.509078979492188, -16.059720993041992, -15.610363006591797, -15.161005020141602, -14.711647033691406, -14.262289047241211, -13.812932014465332, -13.363574028015137, -12.914216041564941, -12.464859008789062, -12.015501022338867, -11.566143035888672, -11.116785049438477, -10.667427062988281, -10.218070030212402, -9.768712043762207, -9.319354057312012, -8.869997024536133, -8.420639038085938, -7.971281051635742, -7.521923065185547, -7.07256555557251, -6.623208045959473, -6.173850059509277, -5.724492073059082, -5.275134563446045, -4.825777053833008, -4.376418113708496, -3.92706036567688, -3.4777026176452637, -3.0283448696136475, -2.5789871215820312, -2.129629373550415, -1.6802716255187988, -1.2309138774871826, -0.7815561294555664, -0.3321983814239502, 0.11715936660766602, 0.5665171146392822, 1.0158748626708984, 1.4652326107025146, 1.9145903587341309, 2.363948106765747, 2.8133058547973633, 3.2626636028289795, 3.7120213508605957, 4.161378860473633, 4.610736846923828, 5.060094833374023, 5.5094523429870605, 5.958809852600098, 6.408167839050293, 6.857525825500488, 7.306883335113525, 7.7562408447265625, 8.205598831176758, 8.654956817626953, 9.104314804077148, 9.553671836853027, 10.003029823303223]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 12.0, 7.0, 5.0, 11.0, 8.0, 12.0, 25.0, 18.0, 25.0, 21.0, 27.0, 33.0, 37.0, 45.0, 36.0, 40.0, 40.0, 46.0, 38.0, 46.0, 42.0, 42.0, 46.0, 36.0, 47.0, 32.0, 26.0, 16.0, 20.0, 26.0, 19.0, 23.0, 21.0, 7.0, 10.0, 12.0, 10.0, 8.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-8.672354698181152, -8.419631958007812, -8.166910171508789, -7.914187908172607, -7.661465644836426, -7.408743381500244, -7.1560211181640625, -6.903298854827881, -6.650576591491699, -6.397854328155518, -6.145132064819336, -5.892409801483154, -5.639687538146973, -5.386965274810791, -5.134243011474609, -4.881520748138428, -4.628798484802246, -4.3760762214660645, -4.123353958129883, -3.870631694793701, -3.6179094314575195, -3.365187168121338, -3.1124649047851562, -2.8597426414489746, -2.607020378112793, -2.3542981147766113, -2.1015758514404297, -1.848853588104248, -1.5961313247680664, -1.3434090614318848, -1.0906867980957031, -0.8379645347595215, -0.5852417945861816, -0.33251953125, -0.07979726791381836, 0.17292499542236328, 0.4256472587585449, 0.6783695220947266, 0.9310917854309082, 1.1838140487670898, 1.4365363121032715, 1.6892585754394531, 1.9419808387756348, 2.1947031021118164, 2.447425365447998, 2.7001476287841797, 2.9528698921203613, 3.205592155456543, 3.4583144187927246, 3.7110366821289062, 3.963758945465088, 4.2164812088012695, 4.469203472137451, 4.721925735473633, 4.9746479988098145, 5.227370262145996, 5.480092525482178, 5.732814788818359, 5.985537052154541, 6.238259315490723, 6.490981578826904, 6.743703842163086, 6.996426105499268, 7.249148368835449, 7.501870632171631]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 12.0, 16.0, 23.0, 36.0, 53.0, 90.0, 133.0, 209.0, 322.0, 578.0, 853.0, 1444.0, 2531.0, 4757.0, 9328.0, 18924.0, 41513.0, 93297.0, 202232.0, 305884.0, 197178.0, 90337.0, 40305.0, 18641.0, 9046.0, 4652.0, 2546.0, 1385.0, 816.0, 503.0, 341.0, 191.0, 135.0, 81.0, 45.0, 41.0, 20.0, 16.0, 13.0, 7.0, 7.0, 8.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.744140625, -3.602752685546875, -3.46136474609375, -3.319976806640625, -3.1785888671875, -3.037200927734375, -2.89581298828125, -2.754425048828125, -2.613037109375, -2.471649169921875, -2.33026123046875, -2.188873291015625, -2.0474853515625, -1.906097412109375, -1.76470947265625, -1.623321533203125, -1.48193359375, -1.340545654296875, -1.19915771484375, -1.057769775390625, -0.9163818359375, -0.774993896484375, -0.63360595703125, -0.492218017578125, -0.350830078125, -0.209442138671875, -0.06805419921875, 0.073333740234375, 0.2147216796875, 0.356109619140625, 0.49749755859375, 0.638885498046875, 0.7802734375, 0.921661376953125, 1.06304931640625, 1.204437255859375, 1.3458251953125, 1.487213134765625, 1.62860107421875, 1.769989013671875, 1.911376953125, 2.052764892578125, 2.19415283203125, 2.335540771484375, 2.4769287109375, 2.618316650390625, 2.75970458984375, 2.901092529296875, 3.04248046875, 3.183868408203125, 3.32525634765625, 3.466644287109375, 3.6080322265625, 3.749420166015625, 3.89080810546875, 4.032196044921875, 4.173583984375, 4.314971923828125, 4.45635986328125, 4.597747802734375, 4.7391357421875, 4.880523681640625, 5.02191162109375, 5.163299560546875, 5.3046875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 5.0, 8.0, 7.0, 8.0, 12.0, 15.0, 23.0, 15.0, 17.0, 26.0, 32.0, 35.0, 44.0, 51.0, 48.0, 64.0, 51.0, 56.0, 57.0, 67.0, 61.0, 48.0, 59.0, 32.0, 34.0, 21.0, 29.0, 19.0, 11.0, 17.0, 5.0, 5.0, 3.0, 1.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.234375, -4.12921142578125, -4.0240478515625, -3.91888427734375, -3.813720703125, -3.70855712890625, -3.6033935546875, -3.49822998046875, -3.39306640625, -3.28790283203125, -3.1827392578125, -3.07757568359375, -2.972412109375, -2.86724853515625, -2.7620849609375, -2.65692138671875, -2.5517578125, -2.44659423828125, -2.3414306640625, -2.23626708984375, -2.131103515625, -2.02593994140625, -1.9207763671875, -1.81561279296875, -1.71044921875, -1.60528564453125, -1.5001220703125, -1.39495849609375, -1.289794921875, -1.18463134765625, -1.0794677734375, -0.97430419921875, -0.869140625, -0.76397705078125, -0.6588134765625, -0.55364990234375, -0.448486328125, -0.34332275390625, -0.2381591796875, -0.13299560546875, -0.02783203125, 0.07733154296875, 0.1824951171875, 0.28765869140625, 0.392822265625, 0.49798583984375, 0.6031494140625, 0.70831298828125, 0.8134765625, 0.91864013671875, 1.0238037109375, 1.12896728515625, 1.234130859375, 1.33929443359375, 1.4444580078125, 1.54962158203125, 1.65478515625, 1.75994873046875, 1.8651123046875, 1.97027587890625, 2.075439453125, 2.18060302734375, 2.2857666015625, 2.39093017578125, 2.49609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 6.0, 7.0, 12.0, 18.0, 29.0, 30.0, 36.0, 77.0, 115.0, 143.0, 232.0, 394.0, 718.0, 1439.0, 3919.0, 21673.0, 338987.0, 635995.0, 35562.0, 5485.0, 1667.0, 775.0, 401.0, 251.0, 170.0, 114.0, 80.0, 55.0, 30.0, 41.0, 28.0, 20.0, 7.0, 6.0, 7.0, 8.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.65625, -14.094970703125, -13.53369140625, -12.972412109375, -12.4111328125, -11.849853515625, -11.28857421875, -10.727294921875, -10.166015625, -9.604736328125, -9.04345703125, -8.482177734375, -7.9208984375, -7.359619140625, -6.79833984375, -6.237060546875, -5.67578125, -5.114501953125, -4.55322265625, -3.991943359375, -3.4306640625, -2.869384765625, -2.30810546875, -1.746826171875, -1.185546875, -0.624267578125, -0.06298828125, 0.498291015625, 1.0595703125, 1.620849609375, 2.18212890625, 2.743408203125, 3.3046875, 3.865966796875, 4.42724609375, 4.988525390625, 5.5498046875, 6.111083984375, 6.67236328125, 7.233642578125, 7.794921875, 8.356201171875, 8.91748046875, 9.478759765625, 10.0400390625, 10.601318359375, 11.16259765625, 11.723876953125, 12.28515625, 12.846435546875, 13.40771484375, 13.968994140625, 14.5302734375, 15.091552734375, 15.65283203125, 16.214111328125, 16.775390625, 17.336669921875, 17.89794921875, 18.459228515625, 19.0205078125, 19.581787109375, 20.14306640625, 20.704345703125, 21.265625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 4.0, 8.0, 9.0, 10.0, 8.0, 17.0, 9.0, 17.0, 9.0, 16.0, 18.0, 31.0, 28.0, 33.0, 43.0, 43.0, 36.0, 44.0, 29.0, 45.0, 48.0, 44.0, 35.0, 32.0, 41.0, 46.0, 34.0, 34.0, 38.0, 34.0, 18.0, 19.0, 22.0, 19.0, 11.0, 15.0, 12.0, 7.0, 6.0, 8.0, 4.0, 7.0, 0.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-13.125, -12.7030029296875, -12.281005859375, -11.8590087890625, -11.43701171875, -11.0150146484375, -10.593017578125, -10.1710205078125, -9.7490234375, -9.3270263671875, -8.905029296875, -8.4830322265625, -8.06103515625, -7.6390380859375, -7.217041015625, -6.7950439453125, -6.373046875, -5.9510498046875, -5.529052734375, -5.1070556640625, -4.68505859375, -4.2630615234375, -3.841064453125, -3.4190673828125, -2.9970703125, -2.5750732421875, -2.153076171875, -1.7310791015625, -1.30908203125, -0.8870849609375, -0.465087890625, -0.0430908203125, 0.37890625, 0.8009033203125, 1.222900390625, 1.6448974609375, 2.06689453125, 2.4888916015625, 2.910888671875, 3.3328857421875, 3.7548828125, 4.1768798828125, 4.598876953125, 5.0208740234375, 5.44287109375, 5.8648681640625, 6.286865234375, 6.7088623046875, 7.130859375, 7.5528564453125, 7.974853515625, 8.3968505859375, 8.81884765625, 9.2408447265625, 9.662841796875, 10.0848388671875, 10.5068359375, 10.9288330078125, 11.350830078125, 11.7728271484375, 12.19482421875, 12.6168212890625, 13.038818359375, 13.4608154296875, 13.8828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 7.0, 15.0, 22.0, 35.0, 100.0, 192.0, 399.0, 1235.0, 5496.0, 113855.0, 891982.0, 30818.0, 3022.0, 760.0, 284.0, 151.0, 81.0, 39.0, 24.0, 13.0, 8.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.2421875, -14.8338623046875, -14.425537109375, -14.0172119140625, -13.60888671875, -13.2005615234375, -12.792236328125, -12.3839111328125, -11.9755859375, -11.5672607421875, -11.158935546875, -10.7506103515625, -10.34228515625, -9.9339599609375, -9.525634765625, -9.1173095703125, -8.708984375, -8.3006591796875, -7.892333984375, -7.4840087890625, -7.07568359375, -6.6673583984375, -6.259033203125, -5.8507080078125, -5.4423828125, -5.0340576171875, -4.625732421875, -4.2174072265625, -3.80908203125, -3.4007568359375, -2.992431640625, -2.5841064453125, -2.17578125, -1.7674560546875, -1.359130859375, -0.9508056640625, -0.54248046875, -0.1341552734375, 0.274169921875, 0.6824951171875, 1.0908203125, 1.4991455078125, 1.907470703125, 2.3157958984375, 2.72412109375, 3.1324462890625, 3.540771484375, 3.9490966796875, 4.357421875, 4.7657470703125, 5.174072265625, 5.5823974609375, 5.99072265625, 6.3990478515625, 6.807373046875, 7.2156982421875, 7.6240234375, 8.0323486328125, 8.440673828125, 8.8489990234375, 9.25732421875, 9.6656494140625, 10.073974609375, 10.4822998046875, 10.890625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 8.0, 6.0, 12.0, 13.0, 16.0, 36.0, 25.0, 34.0, 48.0, 59.0, 77.0, 108.0, 99.0, 104.0, 85.0, 65.0, 52.0, 40.0, 24.0, 21.0, 10.0, 12.0, 11.0, 5.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011129379272460938, -0.0010774433612823486, -0.0010419487953186035, -0.0010064542293548584, -0.0009709596633911133, -0.0009354650974273682, -0.000899970531463623, -0.0008644759654998779, -0.0008289813995361328, -0.0007934868335723877, -0.0007579922676086426, -0.0007224977016448975, -0.0006870031356811523, -0.0006515085697174072, -0.0006160140037536621, -0.000580519437789917, -0.0005450248718261719, -0.0005095303058624268, -0.00047403573989868164, -0.0004385411739349365, -0.0004030466079711914, -0.0003675520420074463, -0.00033205747604370117, -0.00029656291007995605, -0.00026106834411621094, -0.00022557377815246582, -0.0001900792121887207, -0.00015458464622497559, -0.00011909008026123047, -8.359551429748535e-05, -4.8100948333740234e-05, -1.2606382369995117e-05, 2.288818359375e-05, 5.838274955749512e-05, 9.387731552124023e-05, 0.00012937188148498535, 0.00016486644744873047, 0.00020036101341247559, 0.0002358555793762207, 0.0002713501453399658, 0.00030684471130371094, 0.00034233927726745605, 0.00037783384323120117, 0.0004133284091949463, 0.0004488229751586914, 0.0004843175411224365, 0.0005198121070861816, 0.0005553066730499268, 0.0005908012390136719, 0.000626295804977417, 0.0006617903709411621, 0.0006972849369049072, 0.0007327795028686523, 0.0007682740688323975, 0.0008037686347961426, 0.0008392632007598877, 0.0008747577667236328, 0.0009102523326873779, 0.000945746898651123, 0.0009812414646148682, 0.0010167360305786133, 0.0010522305965423584, 0.0010877251625061035, 0.0011232197284698486, 0.0011587142944335938]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 7.0, 10.0, 12.0, 11.0, 26.0, 26.0, 39.0, 66.0, 110.0, 170.0, 332.0, 700.0, 1587.0, 5109.0, 31288.0, 556178.0, 421009.0, 24453.0, 4527.0, 1481.0, 606.0, 350.0, 174.0, 83.0, 62.0, 36.0, 28.0, 17.0, 8.0, 12.0, 7.0, 9.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.609375, -8.3311767578125, -8.052978515625, -7.7747802734375, -7.49658203125, -7.2183837890625, -6.940185546875, -6.6619873046875, -6.3837890625, -6.1055908203125, -5.827392578125, -5.5491943359375, -5.27099609375, -4.9927978515625, -4.714599609375, -4.4364013671875, -4.158203125, -3.8800048828125, -3.601806640625, -3.3236083984375, -3.04541015625, -2.7672119140625, -2.489013671875, -2.2108154296875, -1.9326171875, -1.6544189453125, -1.376220703125, -1.0980224609375, -0.81982421875, -0.5416259765625, -0.263427734375, 0.0147705078125, 0.29296875, 0.5711669921875, 0.849365234375, 1.1275634765625, 1.40576171875, 1.6839599609375, 1.962158203125, 2.2403564453125, 2.5185546875, 2.7967529296875, 3.074951171875, 3.3531494140625, 3.63134765625, 3.9095458984375, 4.187744140625, 4.4659423828125, 4.744140625, 5.0223388671875, 5.300537109375, 5.5787353515625, 5.85693359375, 6.1351318359375, 6.413330078125, 6.6915283203125, 6.9697265625, 7.2479248046875, 7.526123046875, 7.8043212890625, 8.08251953125, 8.3607177734375, 8.638916015625, 8.9171142578125, 9.1953125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 3.0, 7.0, 7.0, 12.0, 17.0, 27.0, 31.0, 64.0, 87.0, 99.0, 142.0, 120.0, 121.0, 92.0, 65.0, 47.0, 28.0, 15.0, 5.0, 5.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6640625, -7.418212890625, -7.17236328125, -6.926513671875, -6.6806640625, -6.434814453125, -6.18896484375, -5.943115234375, -5.697265625, -5.451416015625, -5.20556640625, -4.959716796875, -4.7138671875, -4.468017578125, -4.22216796875, -3.976318359375, -3.73046875, -3.484619140625, -3.23876953125, -2.992919921875, -2.7470703125, -2.501220703125, -2.25537109375, -2.009521484375, -1.763671875, -1.517822265625, -1.27197265625, -1.026123046875, -0.7802734375, -0.534423828125, -0.28857421875, -0.042724609375, 0.203125, 0.448974609375, 0.69482421875, 0.940673828125, 1.1865234375, 1.432373046875, 1.67822265625, 1.924072265625, 2.169921875, 2.415771484375, 2.66162109375, 2.907470703125, 3.1533203125, 3.399169921875, 3.64501953125, 3.890869140625, 4.13671875, 4.382568359375, 4.62841796875, 4.874267578125, 5.1201171875, 5.365966796875, 5.61181640625, 5.857666015625, 6.103515625, 6.349365234375, 6.59521484375, 6.841064453125, 7.0869140625, 7.332763671875, 7.57861328125, 7.824462890625, 8.0703125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 19.0, 66.0, 303.0, 423.0, 161.0, 27.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-482.3701171875, -472.9635314941406, -463.55694580078125, -454.15032958984375, -444.7437438964844, -435.337158203125, -425.9305725097656, -416.52398681640625, -407.11737060546875, -397.7107849121094, -388.30419921875, -378.8975830078125, -369.4909973144531, -360.08441162109375, -350.6778259277344, -341.271240234375, -331.8646545410156, -322.45806884765625, -313.0514831542969, -303.6448669433594, -294.23828125, -284.8316955566406, -275.42510986328125, -266.0185241699219, -256.6119384765625, -247.20535278320312, -237.7987518310547, -228.3921661376953, -218.98556518554688, -209.5789794921875, -200.17239379882812, -190.76580810546875, -181.35919189453125, -171.95260620117188, -162.54600524902344, -153.13941955566406, -143.73281860351562, -134.32623291015625, -124.91964721679688, -115.51305389404297, -106.10646057128906, -96.69986724853516, -87.29327392578125, -77.88668823242188, -68.48009490966797, -59.07350158691406, -49.66691207885742, -40.26032257080078, -30.853729248046875, -21.4471378326416, -12.040546417236328, -2.6339550018310547, 6.772636413574219, 16.179229736328125, 25.585819244384766, 34.992408752441406, 44.39900207519531, 53.80559539794922, 63.21218490600586, 72.6187744140625, 82.0253677368164, 91.43196105957031, 100.83854675292969, 110.2451400756836, 119.6517333984375]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 2.0, 2.0, 6.0, 8.0, 15.0, 14.0, 14.0, 19.0, 13.0, 20.0, 29.0, 32.0, 38.0, 42.0, 40.0, 49.0, 60.0, 53.0, 53.0, 46.0, 64.0, 40.0, 45.0, 48.0, 33.0, 37.0, 27.0, 21.0, 27.0, 18.0, 14.0, 14.0, 15.0, 10.0, 8.0, 11.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.693328857421875, -56.40166091918945, -54.109989166259766, -51.818321228027344, -49.526649475097656, -47.234981536865234, -44.94331359863281, -42.651641845703125, -40.3599739074707, -38.06830596923828, -35.776634216308594, -33.48496627807617, -31.193296432495117, -28.901626586914062, -26.60995864868164, -24.318288803100586, -22.02661895751953, -19.734949111938477, -17.443279266357422, -15.151611328125, -12.859941482543945, -10.56827163696289, -8.276602745056152, -5.984933853149414, -3.6932640075683594, -1.401594638824463, 0.8900747299194336, 3.18174409866333, 5.473413467407227, 7.765083312988281, 10.05675220489502, 12.348421096801758, 14.640090942382812, 16.931760787963867, 19.223430633544922, 21.515098571777344, 23.8067684173584, 26.098438262939453, 28.390106201171875, 30.68177604675293, 32.973445892333984, 35.265113830566406, 37.556785583496094, 39.848453521728516, 42.14012145996094, 44.431793212890625, 46.72346115112305, 49.01512908935547, 51.306800842285156, 53.59846878051758, 55.890140533447266, 58.18180847167969, 60.473480224609375, 62.7651481628418, 65.05681610107422, 67.3484878540039, 69.64015197753906, 71.93182373046875, 74.2234878540039, 76.5151596069336, 78.80683135986328, 81.09849548339844, 83.39016723632812, 85.68183898925781, 87.9735107421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 7.0, 7.0, 10.0, 10.0, 18.0, 21.0, 16.0, 30.0, 47.0, 77.0, 122.0, 169.0, 287.0, 501.0, 863.0, 1749.0, 3741.0, 10488.0, 50557.0, 4065435.0, 43128.0, 9617.0, 3533.0, 1662.0, 904.0, 468.0, 268.0, 163.0, 115.0, 75.0, 51.0, 33.0, 23.0, 20.0, 16.0, 5.0, 5.0, 10.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-11.5234375, -11.1572265625, -10.791015625, -10.4248046875, -10.05859375, -9.6923828125, -9.326171875, -8.9599609375, -8.59375, -8.2275390625, -7.861328125, -7.4951171875, -7.12890625, -6.7626953125, -6.396484375, -6.0302734375, -5.6640625, -5.2978515625, -4.931640625, -4.5654296875, -4.19921875, -3.8330078125, -3.466796875, -3.1005859375, -2.734375, -2.3681640625, -2.001953125, -1.6357421875, -1.26953125, -0.9033203125, -0.537109375, -0.1708984375, 0.1953125, 0.5615234375, 0.927734375, 1.2939453125, 1.66015625, 2.0263671875, 2.392578125, 2.7587890625, 3.125, 3.4912109375, 3.857421875, 4.2236328125, 4.58984375, 4.9560546875, 5.322265625, 5.6884765625, 6.0546875, 6.4208984375, 6.787109375, 7.1533203125, 7.51953125, 7.8857421875, 8.251953125, 8.6181640625, 8.984375, 9.3505859375, 9.716796875, 10.0830078125, 10.44921875, 10.8154296875, 11.181640625, 11.5478515625, 11.9140625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 13.0, 5.0, 18.0, 17.0, 23.0, 23.0, 31.0, 40.0, 35.0, 62.0, 53.0, 53.0, 54.0, 73.0, 79.0, 70.0, 71.0, 51.0, 43.0, 48.0, 26.0, 37.0, 18.0, 16.0, 7.0, 8.0, 10.0, 4.0, 1.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.340118408203125, -4.21148681640625, -4.082855224609375, -3.9542236328125, -3.825592041015625, -3.69696044921875, -3.568328857421875, -3.439697265625, -3.311065673828125, -3.18243408203125, -3.053802490234375, -2.9251708984375, -2.796539306640625, -2.66790771484375, -2.539276123046875, -2.41064453125, -2.282012939453125, -2.15338134765625, -2.024749755859375, -1.8961181640625, -1.767486572265625, -1.63885498046875, -1.510223388671875, -1.381591796875, -1.252960205078125, -1.12432861328125, -0.995697021484375, -0.8670654296875, -0.738433837890625, -0.60980224609375, -0.481170654296875, -0.3525390625, -0.223907470703125, -0.09527587890625, 0.033355712890625, 0.1619873046875, 0.290618896484375, 0.41925048828125, 0.547882080078125, 0.676513671875, 0.805145263671875, 0.93377685546875, 1.062408447265625, 1.1910400390625, 1.319671630859375, 1.44830322265625, 1.576934814453125, 1.70556640625, 1.834197998046875, 1.96282958984375, 2.091461181640625, 2.2200927734375, 2.348724365234375, 2.47735595703125, 2.605987548828125, 2.734619140625, 2.863250732421875, 2.99188232421875, 3.120513916015625, 3.2491455078125, 3.377777099609375, 3.50640869140625, 3.635040283203125, 3.763671875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 9.0, 6.0, 13.0, 19.0, 27.0, 58.0, 80.0, 100.0, 175.0, 290.0, 477.0, 753.0, 1334.0, 2601.0, 6448.0, 26391.0, 4056655.0, 79843.0, 10876.0, 3895.0, 1738.0, 953.0, 584.0, 332.0, 222.0, 119.0, 105.0, 72.0, 41.0, 20.0, 13.0, 16.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.265625, -22.6142578125, -21.962890625, -21.3115234375, -20.66015625, -20.0087890625, -19.357421875, -18.7060546875, -18.0546875, -17.4033203125, -16.751953125, -16.1005859375, -15.44921875, -14.7978515625, -14.146484375, -13.4951171875, -12.84375, -12.1923828125, -11.541015625, -10.8896484375, -10.23828125, -9.5869140625, -8.935546875, -8.2841796875, -7.6328125, -6.9814453125, -6.330078125, -5.6787109375, -5.02734375, -4.3759765625, -3.724609375, -3.0732421875, -2.421875, -1.7705078125, -1.119140625, -0.4677734375, 0.18359375, 0.8349609375, 1.486328125, 2.1376953125, 2.7890625, 3.4404296875, 4.091796875, 4.7431640625, 5.39453125, 6.0458984375, 6.697265625, 7.3486328125, 8.0, 8.6513671875, 9.302734375, 9.9541015625, 10.60546875, 11.2568359375, 11.908203125, 12.5595703125, 13.2109375, 13.8623046875, 14.513671875, 15.1650390625, 15.81640625, 16.4677734375, 17.119140625, 17.7705078125, 18.421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 10.0, 12.0, 23.0, 53.0, 137.0, 3571.0, 135.0, 43.0, 23.0, 19.0, 8.0, 5.0, 5.0, 7.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.33203125, -4.209869384765625, -4.08770751953125, -3.965545654296875, -3.8433837890625, -3.721221923828125, -3.59906005859375, -3.476898193359375, -3.354736328125, -3.232574462890625, -3.11041259765625, -2.988250732421875, -2.8660888671875, -2.743927001953125, -2.62176513671875, -2.499603271484375, -2.37744140625, -2.255279541015625, -2.13311767578125, -2.010955810546875, -1.8887939453125, -1.766632080078125, -1.64447021484375, -1.522308349609375, -1.400146484375, -1.277984619140625, -1.15582275390625, -1.033660888671875, -0.9114990234375, -0.789337158203125, -0.66717529296875, -0.545013427734375, -0.4228515625, -0.300689697265625, -0.17852783203125, -0.056365966796875, 0.0657958984375, 0.187957763671875, 0.31011962890625, 0.432281494140625, 0.554443359375, 0.676605224609375, 0.79876708984375, 0.920928955078125, 1.0430908203125, 1.165252685546875, 1.28741455078125, 1.409576416015625, 1.53173828125, 1.653900146484375, 1.77606201171875, 1.898223876953125, 2.0203857421875, 2.142547607421875, 2.26470947265625, 2.386871337890625, 2.509033203125, 2.631195068359375, 2.75335693359375, 2.875518798828125, 2.9976806640625, 3.119842529296875, 3.24200439453125, 3.364166259765625, 3.486328125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 12.0, 11.0, 25.0, 45.0, 65.0, 125.0, 130.0, 125.0, 131.0, 97.0, 75.0, 71.0, 38.0, 19.0, 9.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.13488006591797, -17.63213348388672, -17.129384994506836, -16.626636505126953, -16.123889923095703, -15.621142387390137, -15.11839485168457, -14.615647315979004, -14.112899780273438, -13.610152244567871, -13.107404708862305, -12.604657173156738, -12.101909637451172, -11.599162101745605, -11.096414566040039, -10.593667030334473, -10.090919494628906, -9.58817195892334, -9.085424423217773, -8.582676887512207, -8.07992935180664, -7.577181816101074, -7.074434280395508, -6.571686744689941, -6.068939208984375, -5.566191673278809, -5.063444137573242, -4.560696601867676, -4.057949066162109, -3.555201530456543, -3.0524539947509766, -2.54970645904541, -2.0469608306884766, -1.5442132949829102, -1.0414657592773438, -0.5387182235717773, -0.03597068786621094, 0.46677684783935547, 0.9695243835449219, 1.4722719192504883, 1.9750194549560547, 2.477766990661621, 2.9805145263671875, 3.483262062072754, 3.9860095977783203, 4.488757133483887, 4.991504669189453, 5.4942522048950195, 5.996999740600586, 6.499747276306152, 7.002494812011719, 7.505242347717285, 8.007989883422852, 8.510737419128418, 9.013484954833984, 9.51623249053955, 10.018980026245117, 10.521727561950684, 11.02447509765625, 11.527222633361816, 12.029970169067383, 12.53271770477295, 13.035465240478516, 13.538212776184082, 14.040960311889648]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 9.0, 7.0, 10.0, 4.0, 12.0, 6.0, 19.0, 15.0, 16.0, 20.0, 22.0, 31.0, 29.0, 39.0, 29.0, 38.0, 37.0, 35.0, 41.0, 33.0, 30.0, 45.0, 40.0, 35.0, 31.0, 37.0, 41.0, 33.0, 31.0, 35.0, 25.0, 30.0, 22.0, 20.0, 16.0, 13.0, 12.0, 9.0, 7.0, 13.0, 3.0, 5.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.926447868347168, -7.689085483551025, -7.451723575592041, -7.214361190795898, -6.976998805999756, -6.739636421203613, -6.502274513244629, -6.264912128448486, -6.027549743652344, -5.790187358856201, -5.552825450897217, -5.315463066101074, -5.078100681304932, -4.840738296508789, -4.603376388549805, -4.366014003753662, -4.1286516189575195, -3.891289472579956, -3.6539270877838135, -3.41656494140625, -3.1792025566101074, -2.941840410232544, -2.7044782638549805, -2.467115879058838, -2.2297539710998535, -1.9923917055130005, -1.7550294399261475, -1.517667293548584, -1.2803049087524414, -1.042942762374878, -0.8055804967880249, -0.5682182312011719, -0.3308558464050293, -0.09349359571933746, 0.14386865496635437, 0.381230890750885, 0.618593156337738, 0.8559553623199463, 1.0933176279067993, 1.3306798934936523, 1.5680421590805054, 1.8054044246673584, 2.042766571044922, 2.2801289558410645, 2.517491102218628, 2.7548532485961914, 2.992215633392334, 3.2295780181884766, 3.46694016456604, 3.7043023109436035, 3.941664695739746, 4.179027080535889, 4.416388988494873, 4.653751373291016, 4.891113758087158, 5.128476142883301, 5.365838050842285, 5.603200435638428, 5.840562343597412, 6.077924728393555, 6.315287113189697, 6.55264949798584, 6.790011405944824, 7.027373790740967, 7.264736175537109]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 11.0, 6.0, 12.0, 16.0, 24.0, 41.0, 48.0, 88.0, 143.0, 216.0, 334.0, 517.0, 957.0, 1544.0, 2698.0, 5110.0, 9589.0, 18453.0, 37517.0, 77298.0, 164124.0, 300738.0, 220791.0, 105769.0, 50259.0, 24776.0, 12492.0, 6520.0, 3505.0, 1968.0, 1148.0, 707.0, 395.0, 245.0, 180.0, 116.0, 69.0, 50.0, 25.0, 21.0, 8.0, 15.0, 8.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.09765625, -3.959716796875, -3.82177734375, -3.683837890625, -3.5458984375, -3.407958984375, -3.27001953125, -3.132080078125, -2.994140625, -2.856201171875, -2.71826171875, -2.580322265625, -2.4423828125, -2.304443359375, -2.16650390625, -2.028564453125, -1.890625, -1.752685546875, -1.61474609375, -1.476806640625, -1.3388671875, -1.200927734375, -1.06298828125, -0.925048828125, -0.787109375, -0.649169921875, -0.51123046875, -0.373291015625, -0.2353515625, -0.097412109375, 0.04052734375, 0.178466796875, 0.31640625, 0.454345703125, 0.59228515625, 0.730224609375, 0.8681640625, 1.006103515625, 1.14404296875, 1.281982421875, 1.419921875, 1.557861328125, 1.69580078125, 1.833740234375, 1.9716796875, 2.109619140625, 2.24755859375, 2.385498046875, 2.5234375, 2.661376953125, 2.79931640625, 2.937255859375, 3.0751953125, 3.213134765625, 3.35107421875, 3.489013671875, 3.626953125, 3.764892578125, 3.90283203125, 4.040771484375, 4.1787109375, 4.316650390625, 4.45458984375, 4.592529296875, 4.73046875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 18.0, 11.0, 15.0, 16.0, 20.0, 31.0, 37.0, 30.0, 50.0, 53.0, 58.0, 64.0, 66.0, 60.0, 61.0, 62.0, 53.0, 38.0, 37.0, 41.0, 36.0, 31.0, 21.0, 15.0, 11.0, 17.0, 8.0, 11.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.921875, -3.79681396484375, -3.6717529296875, -3.54669189453125, -3.421630859375, -3.29656982421875, -3.1715087890625, -3.04644775390625, -2.92138671875, -2.79632568359375, -2.6712646484375, -2.54620361328125, -2.421142578125, -2.29608154296875, -2.1710205078125, -2.04595947265625, -1.9208984375, -1.79583740234375, -1.6707763671875, -1.54571533203125, -1.420654296875, -1.29559326171875, -1.1705322265625, -1.04547119140625, -0.92041015625, -0.79534912109375, -0.6702880859375, -0.54522705078125, -0.420166015625, -0.29510498046875, -0.1700439453125, -0.04498291015625, 0.080078125, 0.20513916015625, 0.3302001953125, 0.45526123046875, 0.580322265625, 0.70538330078125, 0.8304443359375, 0.95550537109375, 1.08056640625, 1.20562744140625, 1.3306884765625, 1.45574951171875, 1.580810546875, 1.70587158203125, 1.8309326171875, 1.95599365234375, 2.0810546875, 2.20611572265625, 2.3311767578125, 2.45623779296875, 2.581298828125, 2.70635986328125, 2.8314208984375, 2.95648193359375, 3.08154296875, 3.20660400390625, 3.3316650390625, 3.45672607421875, 3.581787109375, 3.70684814453125, 3.8319091796875, 3.95697021484375, 4.08203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 5.0, 7.0, 15.0, 16.0, 22.0, 22.0, 56.0, 61.0, 84.0, 132.0, 175.0, 270.0, 477.0, 815.0, 1819.0, 6885.0, 75849.0, 838018.0, 110786.0, 8576.0, 2123.0, 880.0, 499.0, 293.0, 209.0, 131.0, 107.0, 57.0, 50.0, 35.0, 19.0, 17.0, 12.0, 6.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.40625, -16.854736328125, -16.30322265625, -15.751708984375, -15.2001953125, -14.648681640625, -14.09716796875, -13.545654296875, -12.994140625, -12.442626953125, -11.89111328125, -11.339599609375, -10.7880859375, -10.236572265625, -9.68505859375, -9.133544921875, -8.58203125, -8.030517578125, -7.47900390625, -6.927490234375, -6.3759765625, -5.824462890625, -5.27294921875, -4.721435546875, -4.169921875, -3.618408203125, -3.06689453125, -2.515380859375, -1.9638671875, -1.412353515625, -0.86083984375, -0.309326171875, 0.2421875, 0.793701171875, 1.34521484375, 1.896728515625, 2.4482421875, 2.999755859375, 3.55126953125, 4.102783203125, 4.654296875, 5.205810546875, 5.75732421875, 6.308837890625, 6.8603515625, 7.411865234375, 7.96337890625, 8.514892578125, 9.06640625, 9.617919921875, 10.16943359375, 10.720947265625, 11.2724609375, 11.823974609375, 12.37548828125, 12.927001953125, 13.478515625, 14.030029296875, 14.58154296875, 15.133056640625, 15.6845703125, 16.236083984375, 16.78759765625, 17.339111328125, 17.890625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 2.0, 8.0, 12.0, 6.0, 7.0, 7.0, 18.0, 27.0, 21.0, 22.0, 32.0, 28.0, 44.0, 34.0, 33.0, 40.0, 52.0, 49.0, 56.0, 54.0, 50.0, 58.0, 50.0, 44.0, 42.0, 35.0, 27.0, 24.0, 23.0, 18.0, 12.0, 7.0, 12.0, 13.0, 13.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.546875, -19.9837646484375, -19.420654296875, -18.8575439453125, -18.29443359375, -17.7313232421875, -17.168212890625, -16.6051025390625, -16.0419921875, -15.4788818359375, -14.915771484375, -14.3526611328125, -13.78955078125, -13.2264404296875, -12.663330078125, -12.1002197265625, -11.537109375, -10.9739990234375, -10.410888671875, -9.8477783203125, -9.28466796875, -8.7215576171875, -8.158447265625, -7.5953369140625, -7.0322265625, -6.4691162109375, -5.906005859375, -5.3428955078125, -4.77978515625, -4.2166748046875, -3.653564453125, -3.0904541015625, -2.52734375, -1.9642333984375, -1.401123046875, -0.8380126953125, -0.27490234375, 0.2882080078125, 0.851318359375, 1.4144287109375, 1.9775390625, 2.5406494140625, 3.103759765625, 3.6668701171875, 4.22998046875, 4.7930908203125, 5.356201171875, 5.9193115234375, 6.482421875, 7.0455322265625, 7.608642578125, 8.1717529296875, 8.73486328125, 9.2979736328125, 9.861083984375, 10.4241943359375, 10.9873046875, 11.5504150390625, 12.113525390625, 12.6766357421875, 13.23974609375, 13.8028564453125, 14.365966796875, 14.9290771484375, 15.4921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 12.0, 14.0, 31.0, 41.0, 65.0, 147.0, 353.0, 1001.0, 4182.0, 71227.0, 930436.0, 36548.0, 3065.0, 841.0, 307.0, 113.0, 68.0, 42.0, 24.0, 15.0, 6.0, 12.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.875, -18.407958984375, -17.94091796875, -17.473876953125, -17.0068359375, -16.539794921875, -16.07275390625, -15.605712890625, -15.138671875, -14.671630859375, -14.20458984375, -13.737548828125, -13.2705078125, -12.803466796875, -12.33642578125, -11.869384765625, -11.40234375, -10.935302734375, -10.46826171875, -10.001220703125, -9.5341796875, -9.067138671875, -8.60009765625, -8.133056640625, -7.666015625, -7.198974609375, -6.73193359375, -6.264892578125, -5.7978515625, -5.330810546875, -4.86376953125, -4.396728515625, -3.9296875, -3.462646484375, -2.99560546875, -2.528564453125, -2.0615234375, -1.594482421875, -1.12744140625, -0.660400390625, -0.193359375, 0.273681640625, 0.74072265625, 1.207763671875, 1.6748046875, 2.141845703125, 2.60888671875, 3.075927734375, 3.54296875, 4.010009765625, 4.47705078125, 4.944091796875, 5.4111328125, 5.878173828125, 6.34521484375, 6.812255859375, 7.279296875, 7.746337890625, 8.21337890625, 8.680419921875, 9.1474609375, 9.614501953125, 10.08154296875, 10.548583984375, 11.015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 12.0, 11.0, 19.0, 14.0, 28.0, 45.0, 38.0, 80.0, 103.0, 124.0, 131.0, 108.0, 93.0, 54.0, 25.0, 30.0, 22.0, 22.0, 13.0, 9.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011777877807617188, -0.0011342167854309082, -0.0010906457901000977, -0.0010470747947692871, -0.0010035037994384766, -0.000959932804107666, -0.0009163618087768555, -0.0008727908134460449, -0.0008292198181152344, -0.0007856488227844238, -0.0007420778274536133, -0.0006985068321228027, -0.0006549358367919922, -0.0006113648414611816, -0.0005677938461303711, -0.0005242228507995605, -0.00048065185546875, -0.00043708086013793945, -0.0003935098648071289, -0.00034993886947631836, -0.0003063678741455078, -0.00026279687881469727, -0.00021922588348388672, -0.00017565488815307617, -0.00013208389282226562, -8.851289749145508e-05, -4.494190216064453e-05, -1.3709068298339844e-06, 4.220008850097656e-05, 8.577108383178711e-05, 0.00012934207916259766, 0.0001729130744934082, 0.00021648406982421875, 0.0002600550651550293, 0.00030362606048583984, 0.0003471970558166504, 0.00039076805114746094, 0.0004343390464782715, 0.00047791004180908203, 0.0005214810371398926, 0.0005650520324707031, 0.0006086230278015137, 0.0006521940231323242, 0.0006957650184631348, 0.0007393360137939453, 0.0007829070091247559, 0.0008264780044555664, 0.000870048999786377, 0.0009136199951171875, 0.000957190990447998, 0.0010007619857788086, 0.0010443329811096191, 0.0010879039764404297, 0.0011314749717712402, 0.0011750459671020508, 0.0012186169624328613, 0.0012621879577636719, 0.0013057589530944824, 0.001349329948425293, 0.0013929009437561035, 0.001436471939086914, 0.0014800429344177246, 0.0015236139297485352, 0.0015671849250793457, 0.0016107559204101562]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 16.0, 11.0, 18.0, 36.0, 43.0, 77.0, 136.0, 305.0, 586.0, 1620.0, 5646.0, 43763.0, 722372.0, 252015.0, 16720.0, 3089.0, 1073.0, 441.0, 239.0, 128.0, 71.0, 46.0, 42.0, 20.0, 10.0, 5.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.3125, -9.998046875, -9.68359375, -9.369140625, -9.0546875, -8.740234375, -8.42578125, -8.111328125, -7.796875, -7.482421875, -7.16796875, -6.853515625, -6.5390625, -6.224609375, -5.91015625, -5.595703125, -5.28125, -4.966796875, -4.65234375, -4.337890625, -4.0234375, -3.708984375, -3.39453125, -3.080078125, -2.765625, -2.451171875, -2.13671875, -1.822265625, -1.5078125, -1.193359375, -0.87890625, -0.564453125, -0.25, 0.064453125, 0.37890625, 0.693359375, 1.0078125, 1.322265625, 1.63671875, 1.951171875, 2.265625, 2.580078125, 2.89453125, 3.208984375, 3.5234375, 3.837890625, 4.15234375, 4.466796875, 4.78125, 5.095703125, 5.41015625, 5.724609375, 6.0390625, 6.353515625, 6.66796875, 6.982421875, 7.296875, 7.611328125, 7.92578125, 8.240234375, 8.5546875, 8.869140625, 9.18359375, 9.498046875, 9.8125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 22.0, 20.0, 24.0, 35.0, 51.0, 71.0, 99.0, 115.0, 150.0, 114.0, 84.0, 69.0, 45.0, 33.0, 27.0, 17.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.6368408203125, -9.328369140625, -9.0198974609375, -8.71142578125, -8.4029541015625, -8.094482421875, -7.7860107421875, -7.4775390625, -7.1690673828125, -6.860595703125, -6.5521240234375, -6.24365234375, -5.9351806640625, -5.626708984375, -5.3182373046875, -5.009765625, -4.7012939453125, -4.392822265625, -4.0843505859375, -3.77587890625, -3.4674072265625, -3.158935546875, -2.8504638671875, -2.5419921875, -2.2335205078125, -1.925048828125, -1.6165771484375, -1.30810546875, -0.9996337890625, -0.691162109375, -0.3826904296875, -0.07421875, 0.2342529296875, 0.542724609375, 0.8511962890625, 1.15966796875, 1.4681396484375, 1.776611328125, 2.0850830078125, 2.3935546875, 2.7020263671875, 3.010498046875, 3.3189697265625, 3.62744140625, 3.9359130859375, 4.244384765625, 4.5528564453125, 4.861328125, 5.1697998046875, 5.478271484375, 5.7867431640625, 6.09521484375, 6.4036865234375, 6.712158203125, 7.0206298828125, 7.3291015625, 7.6375732421875, 7.946044921875, 8.2545166015625, 8.56298828125, 8.8714599609375, 9.179931640625, 9.4884033203125, 9.796875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 7.0, 12.0, 34.0, 63.0, 122.0, 155.0, 218.0, 157.0, 103.0, 71.0, 30.0, 10.0, 5.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.50845336914062, -120.68656921386719, -116.86468505859375, -113.04280090332031, -109.22091674804688, -105.39903259277344, -101.5771484375, -97.75526428222656, -93.93338012695312, -90.11149597167969, -86.28961181640625, -82.46772766113281, -78.64584350585938, -74.82395935058594, -71.0020751953125, -67.18019104003906, -63.358299255371094, -59.536415100097656, -55.71453094482422, -51.89264678955078, -48.070762634277344, -44.248878479003906, -40.4269905090332, -36.605106353759766, -32.78322219848633, -28.96133804321289, -25.139453887939453, -21.317567825317383, -17.495683670043945, -13.673799514770508, -9.851913452148438, -6.030029296875, -2.2081375122070312, 1.6137471199035645, 5.43563175201416, 9.257516860961914, 13.079401016235352, 16.90128517150879, 20.72317123413086, 24.545055389404297, 28.366939544677734, 32.18882369995117, 36.01070785522461, 39.83259582519531, 43.65447998046875, 47.47636413574219, 51.298248291015625, 55.12013244628906, 58.9420166015625, 62.76390075683594, 66.58578491210938, 70.40766906738281, 74.22955322265625, 78.05143737792969, 81.87332153320312, 85.69520568847656, 89.51708984375, 93.33897399902344, 97.16085815429688, 100.98274230957031, 104.80462646484375, 108.62651062011719, 112.44839477539062, 116.27027893066406, 120.09217071533203]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 10.0, 10.0, 6.0, 7.0, 26.0, 14.0, 22.0, 25.0, 35.0, 36.0, 55.0, 42.0, 49.0, 56.0, 67.0, 59.0, 62.0, 56.0, 45.0, 52.0, 44.0, 27.0, 36.0, 44.0, 27.0, 19.0, 16.0, 13.0, 9.0, 7.0, 2.0, 1.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.97936248779297, -74.18052673339844, -71.38169860839844, -68.5828628540039, -65.78402709960938, -62.98519515991211, -60.186363220214844, -57.38752746582031, -54.58869552612305, -51.78986358642578, -48.99102783203125, -46.192195892333984, -43.39336395263672, -40.59452819824219, -37.79569625854492, -34.996864318847656, -32.198028564453125, -29.399194717407227, -26.600360870361328, -23.801528930664062, -21.002695083618164, -18.203861236572266, -15.405029296875, -12.606195449829102, -9.807361602783203, -7.008528232574463, -4.209694862365723, -1.4108619689941406, 1.3879718780517578, 4.186805725097656, 6.985637664794922, 9.78447151184082, 12.583305358886719, 15.382139205932617, 18.180973052978516, 20.97980499267578, 23.77863883972168, 26.577472686767578, 29.376304626464844, 32.175140380859375, 34.97397232055664, 37.772804260253906, 40.57164001464844, 43.3704719543457, 46.16930389404297, 48.9681396484375, 51.766971588134766, 54.56580352783203, 57.36463928222656, 60.16347122192383, 62.96230697631836, 65.76113891601562, 68.55997467041016, 71.35881042480469, 74.15763854980469, 76.95647430419922, 79.75531005859375, 82.55414581298828, 85.35297393798828, 88.15180969238281, 90.95064544677734, 93.74948120117188, 96.54830932617188, 99.3471450805664, 102.1459732055664]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 12.0, 6.0, 17.0, 15.0, 24.0, 28.0, 40.0, 56.0, 91.0, 108.0, 153.0, 281.0, 467.0, 906.0, 1916.0, 4958.0, 17894.0, 230549.0, 3897869.0, 27185.0, 6574.0, 2488.0, 1121.0, 570.0, 324.0, 195.0, 149.0, 92.0, 63.0, 41.0, 24.0, 18.0, 11.0, 16.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.328125, -10.89453125, -10.4609375, -10.02734375, -9.59375, -9.16015625, -8.7265625, -8.29296875, -7.859375, -7.42578125, -6.9921875, -6.55859375, -6.125, -5.69140625, -5.2578125, -4.82421875, -4.390625, -3.95703125, -3.5234375, -3.08984375, -2.65625, -2.22265625, -1.7890625, -1.35546875, -0.921875, -0.48828125, -0.0546875, 0.37890625, 0.8125, 1.24609375, 1.6796875, 2.11328125, 2.546875, 2.98046875, 3.4140625, 3.84765625, 4.28125, 4.71484375, 5.1484375, 5.58203125, 6.015625, 6.44921875, 6.8828125, 7.31640625, 7.75, 8.18359375, 8.6171875, 9.05078125, 9.484375, 9.91796875, 10.3515625, 10.78515625, 11.21875, 11.65234375, 12.0859375, 12.51953125, 12.953125, 13.38671875, 13.8203125, 14.25390625, 14.6875, 15.12109375, 15.5546875, 15.98828125, 16.421875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 8.0, 11.0, 19.0, 12.0, 17.0, 24.0, 24.0, 31.0, 30.0, 44.0, 59.0, 55.0, 66.0, 68.0, 74.0, 64.0, 85.0, 67.0, 55.0, 43.0, 41.0, 23.0, 16.0, 12.0, 20.0, 6.0, 12.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.88671875, -3.7532958984375, -3.619873046875, -3.4864501953125, -3.35302734375, -3.2196044921875, -3.086181640625, -2.9527587890625, -2.8193359375, -2.6859130859375, -2.552490234375, -2.4190673828125, -2.28564453125, -2.1522216796875, -2.018798828125, -1.8853759765625, -1.751953125, -1.6185302734375, -1.485107421875, -1.3516845703125, -1.21826171875, -1.0848388671875, -0.951416015625, -0.8179931640625, -0.6845703125, -0.5511474609375, -0.417724609375, -0.2843017578125, -0.15087890625, -0.0174560546875, 0.115966796875, 0.2493896484375, 0.3828125, 0.5162353515625, 0.649658203125, 0.7830810546875, 0.91650390625, 1.0499267578125, 1.183349609375, 1.3167724609375, 1.4501953125, 1.5836181640625, 1.717041015625, 1.8504638671875, 1.98388671875, 2.1173095703125, 2.250732421875, 2.3841552734375, 2.517578125, 2.6510009765625, 2.784423828125, 2.9178466796875, 3.05126953125, 3.1846923828125, 3.318115234375, 3.4515380859375, 3.5849609375, 3.7183837890625, 3.851806640625, 3.9852294921875, 4.11865234375, 4.2520751953125, 4.385498046875, 4.5189208984375, 4.65234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 7.0, 6.0, 5.0, 11.0, 19.0, 22.0, 40.0, 57.0, 66.0, 95.0, 148.0, 241.0, 345.0, 581.0, 1152.0, 2658.0, 6602.0, 23414.0, 483471.0, 3633795.0, 28316.0, 7433.0, 2811.0, 1222.0, 668.0, 374.0, 225.0, 152.0, 108.0, 65.0, 45.0, 44.0, 19.0, 25.0, 7.0, 3.0, 13.0, 5.0, 4.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7734375, -14.2274169921875, -13.681396484375, -13.1353759765625, -12.58935546875, -12.0433349609375, -11.497314453125, -10.9512939453125, -10.4052734375, -9.8592529296875, -9.313232421875, -8.7672119140625, -8.22119140625, -7.6751708984375, -7.129150390625, -6.5831298828125, -6.037109375, -5.4910888671875, -4.945068359375, -4.3990478515625, -3.85302734375, -3.3070068359375, -2.760986328125, -2.2149658203125, -1.6689453125, -1.1229248046875, -0.576904296875, -0.0308837890625, 0.51513671875, 1.0611572265625, 1.607177734375, 2.1531982421875, 2.69921875, 3.2452392578125, 3.791259765625, 4.3372802734375, 4.88330078125, 5.4293212890625, 5.975341796875, 6.5213623046875, 7.0673828125, 7.6134033203125, 8.159423828125, 8.7054443359375, 9.25146484375, 9.7974853515625, 10.343505859375, 10.8895263671875, 11.435546875, 11.9815673828125, 12.527587890625, 13.0736083984375, 13.61962890625, 14.1656494140625, 14.711669921875, 15.2576904296875, 15.8037109375, 16.3497314453125, 16.895751953125, 17.4417724609375, 17.98779296875, 18.5338134765625, 19.079833984375, 19.6258544921875, 20.171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 11.0, 9.0, 12.0, 20.0, 34.0, 67.0, 161.0, 3215.0, 373.0, 72.0, 26.0, 19.0, 10.0, 8.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80859375, -6.57940673828125, -6.3502197265625, -6.12103271484375, -5.891845703125, -5.66265869140625, -5.4334716796875, -5.20428466796875, -4.97509765625, -4.74591064453125, -4.5167236328125, -4.28753662109375, -4.058349609375, -3.82916259765625, -3.5999755859375, -3.37078857421875, -3.1416015625, -2.91241455078125, -2.6832275390625, -2.45404052734375, -2.224853515625, -1.99566650390625, -1.7664794921875, -1.53729248046875, -1.30810546875, -1.07891845703125, -0.8497314453125, -0.62054443359375, -0.391357421875, -0.16217041015625, 0.0670166015625, 0.29620361328125, 0.525390625, 0.75457763671875, 0.9837646484375, 1.21295166015625, 1.442138671875, 1.67132568359375, 1.9005126953125, 2.12969970703125, 2.35888671875, 2.58807373046875, 2.8172607421875, 3.04644775390625, 3.275634765625, 3.50482177734375, 3.7340087890625, 3.96319580078125, 4.1923828125, 4.42156982421875, 4.6507568359375, 4.87994384765625, 5.109130859375, 5.33831787109375, 5.5675048828125, 5.79669189453125, 6.02587890625, 6.25506591796875, 6.4842529296875, 6.71343994140625, 6.942626953125, 7.17181396484375, 7.4010009765625, 7.63018798828125, 7.859375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 1.0, 3.0, 12.0, 17.0, 20.0, 29.0, 52.0, 75.0, 88.0, 113.0, 143.0, 125.0, 134.0, 70.0, 49.0, 23.0, 18.0, 8.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.415435791015625, -39.537105560302734, -38.65877914428711, -37.78044891357422, -36.90211868286133, -36.02378845214844, -35.14546203613281, -34.26713180541992, -33.38880157470703, -32.51047134399414, -31.632143020629883, -30.753814697265625, -29.875484466552734, -28.997156143188477, -28.11882781982422, -27.240497589111328, -26.36216926574707, -25.483840942382812, -24.605510711669922, -23.727182388305664, -22.848852157592773, -21.970523834228516, -21.092193603515625, -20.213865280151367, -19.33553695678711, -18.45720863342285, -17.57887840270996, -16.700550079345703, -15.822219848632812, -14.943891525268555, -14.06556224822998, -13.187232971191406, -12.308900833129883, -11.430571556091309, -10.552242279052734, -9.673913955688477, -8.795583724975586, -7.91725492477417, -7.038926124572754, -6.16059684753418, -5.2822675704956055, -4.403938293457031, -3.525609254837036, -2.647280216217041, -1.7689509391784668, -0.8906216621398926, -0.012292861938476562, 0.8660364151000977, 1.7443656921386719, 2.622694969177246, 3.501024007797241, 4.379353046417236, 5.2576823234558105, 6.136011600494385, 7.014340400695801, 7.892669677734375, 8.77099895477295, 9.649328231811523, 10.527657508850098, 11.405986785888672, 12.28431510925293, 13.16264533996582, 14.040973663330078, 14.919302940368652, 15.797632217407227]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 10.0, 6.0, 6.0, 10.0, 18.0, 12.0, 19.0, 15.0, 26.0, 29.0, 18.0, 35.0, 32.0, 43.0, 48.0, 52.0, 45.0, 38.0, 34.0, 38.0, 49.0, 52.0, 42.0, 45.0, 43.0, 29.0, 30.0, 20.0, 31.0, 20.0, 22.0, 16.0, 10.0, 19.0, 8.0, 1.0, 7.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.903388977050781, -14.439169883728027, -13.974949836730957, -13.510730743408203, -13.046510696411133, -12.582291603088379, -12.118072509765625, -11.653852462768555, -11.189632415771484, -10.72541332244873, -10.26119327545166, -9.796974182128906, -9.332754135131836, -8.868535041809082, -8.404315948486328, -7.940095901489258, -7.475876808166504, -7.011657238006592, -6.54743766784668, -6.083218574523926, -5.6189985275268555, -5.154779434204102, -4.6905598640441895, -4.226340293884277, -3.7621207237243652, -3.297901153564453, -2.833681583404541, -2.369462251663208, -1.905242681503296, -1.4410231113433838, -0.9768037796020508, -0.5125842094421387, -0.048363685607910156, 0.4158558249473572, 0.8800753355026245, 1.344294786453247, 1.8085143566131592, 2.2727339267730713, 2.7369532585144043, 3.2011728286743164, 3.6653923988342285, 4.129611968994141, 4.593831539154053, 5.058051109313965, 5.522270202636719, 5.986490249633789, 6.450709342956543, 6.914928913116455, 7.379148483276367, 7.843368053436279, 8.307587623596191, 8.771806716918945, 9.236026763916016, 9.70024585723877, 10.164464950561523, 10.628684997558594, 11.092905044555664, 11.557124137878418, 12.021344184875488, 12.485563278198242, 12.949783325195312, 13.414002418518066, 13.87822151184082, 14.34244155883789, 14.806660652160645]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 6.0, 8.0, 16.0, 15.0, 23.0, 36.0, 59.0, 95.0, 159.0, 280.0, 521.0, 1068.0, 2217.0, 5326.0, 13914.0, 38046.0, 109565.0, 361368.0, 349674.0, 105982.0, 36939.0, 13394.0, 5274.0, 2255.0, 1088.0, 553.0, 270.0, 152.0, 94.0, 53.0, 23.0, 18.0, 20.0, 9.0, 9.0, 7.0, 3.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.140625, -8.8548583984375, -8.569091796875, -8.2833251953125, -7.99755859375, -7.7117919921875, -7.426025390625, -7.1402587890625, -6.8544921875, -6.5687255859375, -6.282958984375, -5.9971923828125, -5.71142578125, -5.4256591796875, -5.139892578125, -4.8541259765625, -4.568359375, -4.2825927734375, -3.996826171875, -3.7110595703125, -3.42529296875, -3.1395263671875, -2.853759765625, -2.5679931640625, -2.2822265625, -1.9964599609375, -1.710693359375, -1.4249267578125, -1.13916015625, -0.8533935546875, -0.567626953125, -0.2818603515625, 0.00390625, 0.2896728515625, 0.575439453125, 0.8612060546875, 1.14697265625, 1.4327392578125, 1.718505859375, 2.0042724609375, 2.2900390625, 2.5758056640625, 2.861572265625, 3.1473388671875, 3.43310546875, 3.7188720703125, 4.004638671875, 4.2904052734375, 4.576171875, 4.8619384765625, 5.147705078125, 5.4334716796875, 5.71923828125, 6.0050048828125, 6.290771484375, 6.5765380859375, 6.8623046875, 7.1480712890625, 7.433837890625, 7.7196044921875, 8.00537109375, 8.2911376953125, 8.576904296875, 8.8626708984375, 9.1484375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 10.0, 12.0, 13.0, 17.0, 10.0, 25.0, 21.0, 25.0, 32.0, 47.0, 48.0, 51.0, 73.0, 56.0, 75.0, 47.0, 60.0, 76.0, 44.0, 58.0, 47.0, 40.0, 27.0, 20.0, 19.0, 15.0, 4.0, 8.0, 3.0, 12.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5, -3.36376953125, -3.2275390625, -3.09130859375, -2.955078125, -2.81884765625, -2.6826171875, -2.54638671875, -2.41015625, -2.27392578125, -2.1376953125, -2.00146484375, -1.865234375, -1.72900390625, -1.5927734375, -1.45654296875, -1.3203125, -1.18408203125, -1.0478515625, -0.91162109375, -0.775390625, -0.63916015625, -0.5029296875, -0.36669921875, -0.23046875, -0.09423828125, 0.0419921875, 0.17822265625, 0.314453125, 0.45068359375, 0.5869140625, 0.72314453125, 0.859375, 0.99560546875, 1.1318359375, 1.26806640625, 1.404296875, 1.54052734375, 1.6767578125, 1.81298828125, 1.94921875, 2.08544921875, 2.2216796875, 2.35791015625, 2.494140625, 2.63037109375, 2.7666015625, 2.90283203125, 3.0390625, 3.17529296875, 3.3115234375, 3.44775390625, 3.583984375, 3.72021484375, 3.8564453125, 3.99267578125, 4.12890625, 4.26513671875, 4.4013671875, 4.53759765625, 4.673828125, 4.81005859375, 4.9462890625, 5.08251953125, 5.21875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 4.0, 9.0, 22.0, 11.0, 27.0, 36.0, 60.0, 78.0, 116.0, 177.0, 252.0, 403.0, 693.0, 1249.0, 3205.0, 12634.0, 109207.0, 784481.0, 116101.0, 13283.0, 3271.0, 1278.0, 700.0, 405.0, 251.0, 163.0, 128.0, 73.0, 54.0, 47.0, 32.0, 26.0, 21.0, 12.0, 8.0, 5.0, 9.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8046875, -15.2503662109375, -14.696044921875, -14.1417236328125, -13.58740234375, -13.0330810546875, -12.478759765625, -11.9244384765625, -11.3701171875, -10.8157958984375, -10.261474609375, -9.7071533203125, -9.15283203125, -8.5985107421875, -8.044189453125, -7.4898681640625, -6.935546875, -6.3812255859375, -5.826904296875, -5.2725830078125, -4.71826171875, -4.1639404296875, -3.609619140625, -3.0552978515625, -2.5009765625, -1.9466552734375, -1.392333984375, -0.8380126953125, -0.28369140625, 0.2706298828125, 0.824951171875, 1.3792724609375, 1.93359375, 2.4879150390625, 3.042236328125, 3.5965576171875, 4.15087890625, 4.7052001953125, 5.259521484375, 5.8138427734375, 6.3681640625, 6.9224853515625, 7.476806640625, 8.0311279296875, 8.58544921875, 9.1397705078125, 9.694091796875, 10.2484130859375, 10.802734375, 11.3570556640625, 11.911376953125, 12.4656982421875, 13.02001953125, 13.5743408203125, 14.128662109375, 14.6829833984375, 15.2373046875, 15.7916259765625, 16.345947265625, 16.9002685546875, 17.45458984375, 18.0089111328125, 18.563232421875, 19.1175537109375, 19.671875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 5.0, 4.0, 8.0, 3.0, 11.0, 20.0, 11.0, 9.0, 18.0, 26.0, 21.0, 29.0, 35.0, 35.0, 31.0, 41.0, 31.0, 34.0, 45.0, 50.0, 44.0, 57.0, 38.0, 45.0, 41.0, 34.0, 35.0, 39.0, 24.0, 29.0, 27.0, 25.0, 19.0, 13.0, 11.0, 7.0, 10.0, 7.0, 7.0, 5.0, 6.0, 6.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-12.0546875, -11.6341552734375, -11.213623046875, -10.7930908203125, -10.37255859375, -9.9520263671875, -9.531494140625, -9.1109619140625, -8.6904296875, -8.2698974609375, -7.849365234375, -7.4288330078125, -7.00830078125, -6.5877685546875, -6.167236328125, -5.7467041015625, -5.326171875, -4.9056396484375, -4.485107421875, -4.0645751953125, -3.64404296875, -3.2235107421875, -2.802978515625, -2.3824462890625, -1.9619140625, -1.5413818359375, -1.120849609375, -0.7003173828125, -0.27978515625, 0.1407470703125, 0.561279296875, 0.9818115234375, 1.40234375, 1.8228759765625, 2.243408203125, 2.6639404296875, 3.08447265625, 3.5050048828125, 3.925537109375, 4.3460693359375, 4.7666015625, 5.1871337890625, 5.607666015625, 6.0281982421875, 6.44873046875, 6.8692626953125, 7.289794921875, 7.7103271484375, 8.130859375, 8.5513916015625, 8.971923828125, 9.3924560546875, 9.81298828125, 10.2335205078125, 10.654052734375, 11.0745849609375, 11.4951171875, 11.9156494140625, 12.336181640625, 12.7567138671875, 13.17724609375, 13.5977783203125, 14.018310546875, 14.4388427734375, 14.859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 5.0, 2.0, 4.0, 10.0, 11.0, 16.0, 20.0, 35.0, 35.0, 55.0, 68.0, 135.0, 215.0, 356.0, 669.0, 1286.0, 3000.0, 7889.0, 25570.0, 112830.0, 578233.0, 247729.0, 48607.0, 13109.0, 4586.0, 1945.0, 912.0, 468.0, 254.0, 152.0, 115.0, 68.0, 42.0, 33.0, 26.0, 24.0, 12.0, 5.0, 7.0, 7.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.796875, -4.6546630859375, -4.512451171875, -4.3702392578125, -4.22802734375, -4.0858154296875, -3.943603515625, -3.8013916015625, -3.6591796875, -3.5169677734375, -3.374755859375, -3.2325439453125, -3.09033203125, -2.9481201171875, -2.805908203125, -2.6636962890625, -2.521484375, -2.3792724609375, -2.237060546875, -2.0948486328125, -1.95263671875, -1.8104248046875, -1.668212890625, -1.5260009765625, -1.3837890625, -1.2415771484375, -1.099365234375, -0.9571533203125, -0.81494140625, -0.6727294921875, -0.530517578125, -0.3883056640625, -0.24609375, -0.1038818359375, 0.038330078125, 0.1805419921875, 0.32275390625, 0.4649658203125, 0.607177734375, 0.7493896484375, 0.8916015625, 1.0338134765625, 1.176025390625, 1.3182373046875, 1.46044921875, 1.6026611328125, 1.744873046875, 1.8870849609375, 2.029296875, 2.1715087890625, 2.313720703125, 2.4559326171875, 2.59814453125, 2.7403564453125, 2.882568359375, 3.0247802734375, 3.1669921875, 3.3092041015625, 3.451416015625, 3.5936279296875, 3.73583984375, 3.8780517578125, 4.020263671875, 4.1624755859375, 4.3046875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 0.0, 4.0, 4.0, 4.0, 6.0, 4.0, 11.0, 21.0, 13.0, 19.0, 33.0, 27.0, 40.0, 49.0, 60.0, 90.0, 113.0, 135.0, 72.0, 63.0, 48.0, 39.0, 34.0, 22.0, 22.0, 19.0, 8.0, 6.0, 11.0, 6.0, 9.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00135040283203125, -0.0013118237257003784, -0.0012732446193695068, -0.0012346655130386353, -0.0011960864067077637, -0.001157507300376892, -0.0011189281940460205, -0.001080349087715149, -0.0010417699813842773, -0.0010031908750534058, -0.0009646117687225342, -0.0009260326623916626, -0.000887453556060791, -0.0008488744497299194, -0.0008102953433990479, -0.0007717162370681763, -0.0007331371307373047, -0.0006945580244064331, -0.0006559789180755615, -0.0006173998117446899, -0.0005788207054138184, -0.0005402415990829468, -0.0005016624927520752, -0.0004630833864212036, -0.00042450428009033203, -0.00038592517375946045, -0.00034734606742858887, -0.0003087669610977173, -0.0002701878547668457, -0.00023160874843597412, -0.00019302964210510254, -0.00015445053577423096, -0.00011587142944335938, -7.729232311248779e-05, -3.871321678161621e-05, -1.341104507446289e-07, 3.844499588012695e-05, 7.702410221099854e-05, 0.00011560320854187012, 0.0001541823148727417, 0.00019276142120361328, 0.00023134052753448486, 0.00026991963386535645, 0.00030849874019622803, 0.0003470778465270996, 0.0003856569528579712, 0.0004242360591888428, 0.00046281516551971436, 0.0005013942718505859, 0.0005399733781814575, 0.0005785524845123291, 0.0006171315908432007, 0.0006557106971740723, 0.0006942898035049438, 0.0007328689098358154, 0.000771448016166687, 0.0008100271224975586, 0.0008486062288284302, 0.0008871853351593018, 0.0009257644414901733, 0.0009643435478210449, 0.0010029226541519165, 0.001041501760482788, 0.0010800808668136597, 0.0011186599731445312]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 8.0, 4.0, 6.0, 8.0, 14.0, 24.0, 47.0, 55.0, 97.0, 143.0, 278.0, 512.0, 1135.0, 3084.0, 12816.0, 100556.0, 737338.0, 167541.0, 18184.0, 3986.0, 1262.0, 650.0, 311.0, 192.0, 103.0, 63.0, 59.0, 22.0, 24.0, 12.0, 11.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73828125, -4.52862548828125, -4.3189697265625, -4.10931396484375, -3.899658203125, -3.69000244140625, -3.4803466796875, -3.27069091796875, -3.06103515625, -2.85137939453125, -2.6417236328125, -2.43206787109375, -2.222412109375, -2.01275634765625, -1.8031005859375, -1.59344482421875, -1.3837890625, -1.17413330078125, -0.9644775390625, -0.75482177734375, -0.545166015625, -0.33551025390625, -0.1258544921875, 0.08380126953125, 0.29345703125, 0.50311279296875, 0.7127685546875, 0.92242431640625, 1.132080078125, 1.34173583984375, 1.5513916015625, 1.76104736328125, 1.970703125, 2.18035888671875, 2.3900146484375, 2.59967041015625, 2.809326171875, 3.01898193359375, 3.2286376953125, 3.43829345703125, 3.64794921875, 3.85760498046875, 4.0672607421875, 4.27691650390625, 4.486572265625, 4.69622802734375, 4.9058837890625, 5.11553955078125, 5.3251953125, 5.53485107421875, 5.7445068359375, 5.95416259765625, 6.163818359375, 6.37347412109375, 6.5831298828125, 6.79278564453125, 7.00244140625, 7.21209716796875, 7.4217529296875, 7.63140869140625, 7.841064453125, 8.05072021484375, 8.2603759765625, 8.47003173828125, 8.6796875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 12.0, 5.0, 8.0, 14.0, 13.0, 14.0, 21.0, 31.0, 37.0, 32.0, 35.0, 52.0, 65.0, 72.0, 106.0, 76.0, 66.0, 77.0, 52.0, 39.0, 36.0, 32.0, 22.0, 19.0, 18.0, 16.0, 11.0, 7.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.701171875, -3.558258056640625, -3.41534423828125, -3.272430419921875, -3.1295166015625, -2.986602783203125, -2.84368896484375, -2.700775146484375, -2.557861328125, -2.414947509765625, -2.27203369140625, -2.129119873046875, -1.9862060546875, -1.843292236328125, -1.70037841796875, -1.557464599609375, -1.41455078125, -1.271636962890625, -1.12872314453125, -0.985809326171875, -0.8428955078125, -0.699981689453125, -0.55706787109375, -0.414154052734375, -0.271240234375, -0.128326416015625, 0.01458740234375, 0.157501220703125, 0.3004150390625, 0.443328857421875, 0.58624267578125, 0.729156494140625, 0.8720703125, 1.014984130859375, 1.15789794921875, 1.300811767578125, 1.4437255859375, 1.586639404296875, 1.72955322265625, 1.872467041015625, 2.015380859375, 2.158294677734375, 2.30120849609375, 2.444122314453125, 2.5870361328125, 2.729949951171875, 2.87286376953125, 3.015777587890625, 3.15869140625, 3.301605224609375, 3.44451904296875, 3.587432861328125, 3.7303466796875, 3.873260498046875, 4.01617431640625, 4.159088134765625, 4.302001953125, 4.444915771484375, 4.58782958984375, 4.730743408203125, 4.8736572265625, 5.016571044921875, 5.15948486328125, 5.302398681640625, 5.4453125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 14.0, 22.0, 36.0, 66.0, 102.0, 126.0, 132.0, 149.0, 115.0, 67.0, 71.0, 36.0, 14.0, 12.0, 13.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.14347839355469, -90.04429626464844, -86.94512176513672, -83.845947265625, -80.74676513671875, -77.6475830078125, -74.54840850830078, -71.44923400878906, -68.35005187988281, -65.25086975097656, -62.151695251464844, -59.05251693725586, -55.953338623046875, -52.85416030883789, -49.754981994628906, -46.65580368041992, -43.55662536621094, -40.45744705200195, -37.35826873779297, -34.259090423583984, -31.159912109375, -28.060733795166016, -24.96155548095703, -21.862377166748047, -18.763198852539062, -15.664020538330078, -12.564842224121094, -9.46566390991211, -6.366485595703125, -3.2673072814941406, -0.16812896728515625, 2.931049346923828, 6.0302276611328125, 9.129405975341797, 12.228584289550781, 15.327762603759766, 18.42694091796875, 21.526119232177734, 24.62529754638672, 27.724475860595703, 30.823654174804688, 33.92283248901367, 37.022010803222656, 40.12118911743164, 43.220367431640625, 46.31954574584961, 49.418724060058594, 52.51790237426758, 55.61708068847656, 58.71625900268555, 61.81543731689453, 64.91461181640625, 68.0137939453125, 71.11297607421875, 74.21215057373047, 77.31132507324219, 80.41050720214844, 83.50968933105469, 86.6088638305664, 89.70803833007812, 92.80722045898438, 95.90640258789062, 99.00557708740234, 102.10475158691406, 105.20393371582031]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 9.0, 7.0, 12.0, 13.0, 12.0, 21.0, 22.0, 19.0, 32.0, 21.0, 30.0, 39.0, 43.0, 39.0, 49.0, 37.0, 38.0, 52.0, 52.0, 45.0, 37.0, 37.0, 34.0, 34.0, 37.0, 29.0, 28.0, 26.0, 25.0, 16.0, 15.0, 16.0, 19.0, 9.0, 7.0, 9.0, 6.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0], "bins": [-59.2274169921875, -57.429813385009766, -55.632205963134766, -53.83460235595703, -52.0369987487793, -50.23939514160156, -48.44178771972656, -46.64418411254883, -44.846580505371094, -43.04897689819336, -41.25136947631836, -39.453765869140625, -37.65616226196289, -35.858558654785156, -34.060951232910156, -32.26334762573242, -30.465742111206055, -28.668136596679688, -26.870532989501953, -25.072927474975586, -23.27532386779785, -21.477718353271484, -19.68011474609375, -17.882509231567383, -16.084903717041016, -14.287299156188965, -12.489694595336914, -10.692089080810547, -8.894485473632812, -7.096879959106445, -5.2992753982543945, -3.5016708374023438, -1.7040672302246094, 0.09353744983673096, 1.8911421298980713, 3.688746929168701, 5.486351490020752, 7.283956527709961, 9.081561088562012, 10.879165649414062, 12.676770210266113, 14.474374771118164, 16.27198028564453, 18.069583892822266, 19.867189407348633, 21.664794921875, 23.462398529052734, 25.26000213623047, 27.057607650756836, 28.855213165283203, 30.652816772460938, 32.45042037963867, 34.24802780151367, 36.045631408691406, 37.84323501586914, 39.640838623046875, 41.438446044921875, 43.23604965209961, 45.03365707397461, 46.831260681152344, 48.62886428833008, 50.42646789550781, 52.22407531738281, 54.02167892456055, 55.81928253173828]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 9.0, 14.0, 17.0, 24.0, 33.0, 62.0, 74.0, 114.0, 186.0, 286.0, 435.0, 667.0, 1084.0, 1783.0, 3139.0, 5763.0, 11411.0, 25009.0, 65608.0, 273457.0, 2667924.0, 940070.0, 123460.0, 39238.0, 16162.0, 7777.0, 4116.0, 2377.0, 1420.0, 854.0, 571.0, 391.0, 238.0, 171.0, 93.0, 73.0, 56.0, 31.0, 31.0, 20.0, 12.0, 7.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.703125, -5.511474609375, -5.31982421875, -5.128173828125, -4.9365234375, -4.744873046875, -4.55322265625, -4.361572265625, -4.169921875, -3.978271484375, -3.78662109375, -3.594970703125, -3.4033203125, -3.211669921875, -3.02001953125, -2.828369140625, -2.63671875, -2.445068359375, -2.25341796875, -2.061767578125, -1.8701171875, -1.678466796875, -1.48681640625, -1.295166015625, -1.103515625, -0.911865234375, -0.72021484375, -0.528564453125, -0.3369140625, -0.145263671875, 0.04638671875, 0.238037109375, 0.4296875, 0.621337890625, 0.81298828125, 1.004638671875, 1.1962890625, 1.387939453125, 1.57958984375, 1.771240234375, 1.962890625, 2.154541015625, 2.34619140625, 2.537841796875, 2.7294921875, 2.921142578125, 3.11279296875, 3.304443359375, 3.49609375, 3.687744140625, 3.87939453125, 4.071044921875, 4.2626953125, 4.454345703125, 4.64599609375, 4.837646484375, 5.029296875, 5.220947265625, 5.41259765625, 5.604248046875, 5.7958984375, 5.987548828125, 6.17919921875, 6.370849609375, 6.5625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 9.0, 10.0, 18.0, 21.0, 28.0, 41.0, 46.0, 48.0, 69.0, 69.0, 85.0, 75.0, 79.0, 80.0, 69.0, 62.0, 44.0, 46.0, 30.0, 20.0, 14.0, 11.0, 7.0, 3.0, 12.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.513671875, -3.359588623046875, -3.20550537109375, -3.051422119140625, -2.8973388671875, -2.743255615234375, -2.58917236328125, -2.435089111328125, -2.281005859375, -2.126922607421875, -1.97283935546875, -1.818756103515625, -1.6646728515625, -1.510589599609375, -1.35650634765625, -1.202423095703125, -1.04833984375, -0.894256591796875, -0.74017333984375, -0.586090087890625, -0.4320068359375, -0.277923583984375, -0.12384033203125, 0.030242919921875, 0.184326171875, 0.338409423828125, 0.49249267578125, 0.646575927734375, 0.8006591796875, 0.954742431640625, 1.10882568359375, 1.262908935546875, 1.4169921875, 1.571075439453125, 1.72515869140625, 1.879241943359375, 2.0333251953125, 2.187408447265625, 2.34149169921875, 2.495574951171875, 2.649658203125, 2.803741455078125, 2.95782470703125, 3.111907958984375, 3.2659912109375, 3.420074462890625, 3.57415771484375, 3.728240966796875, 3.88232421875, 4.036407470703125, 4.19049072265625, 4.344573974609375, 4.4986572265625, 4.652740478515625, 4.80682373046875, 4.960906982421875, 5.114990234375, 5.269073486328125, 5.42315673828125, 5.577239990234375, 5.7313232421875, 5.885406494140625, 6.03948974609375, 6.193572998046875, 6.34765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 2.0, 4.0, 5.0, 8.0, 16.0, 11.0, 11.0, 18.0, 22.0, 32.0, 45.0, 71.0, 134.0, 242.0, 426.0, 953.0, 1971.0, 5009.0, 14270.0, 49730.0, 261152.0, 3259080.0, 497072.0, 72748.0, 19798.0, 6451.0, 2491.0, 1157.0, 540.0, 307.0, 161.0, 120.0, 70.0, 39.0, 28.0, 23.0, 13.0, 14.0, 8.0, 8.0, 9.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.5601806640625, -9.237548828125, -8.9149169921875, -8.59228515625, -8.2696533203125, -7.947021484375, -7.6243896484375, -7.3017578125, -6.9791259765625, -6.656494140625, -6.3338623046875, -6.01123046875, -5.6885986328125, -5.365966796875, -5.0433349609375, -4.720703125, -4.3980712890625, -4.075439453125, -3.7528076171875, -3.43017578125, -3.1075439453125, -2.784912109375, -2.4622802734375, -2.1396484375, -1.8170166015625, -1.494384765625, -1.1717529296875, -0.84912109375, -0.5264892578125, -0.203857421875, 0.1187744140625, 0.44140625, 0.7640380859375, 1.086669921875, 1.4093017578125, 1.73193359375, 2.0545654296875, 2.377197265625, 2.6998291015625, 3.0224609375, 3.3450927734375, 3.667724609375, 3.9903564453125, 4.31298828125, 4.6356201171875, 4.958251953125, 5.2808837890625, 5.603515625, 5.9261474609375, 6.248779296875, 6.5714111328125, 6.89404296875, 7.2166748046875, 7.539306640625, 7.8619384765625, 8.1845703125, 8.5072021484375, 8.829833984375, 9.1524658203125, 9.47509765625, 9.7977294921875, 10.120361328125, 10.4429931640625, 10.765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 10.0, 3.0, 5.0, 7.0, 8.0, 15.0, 23.0, 23.0, 34.0, 34.0, 51.0, 60.0, 99.0, 134.0, 184.0, 350.0, 588.0, 890.0, 582.0, 309.0, 158.0, 125.0, 84.0, 61.0, 54.0, 41.0, 28.0, 16.0, 22.0, 16.0, 13.0, 11.0, 6.0, 1.0, 7.0, 8.0, 2.0, 1.0, 4.0, 4.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.53125, -9.246337890625, -8.96142578125, -8.676513671875, -8.3916015625, -8.106689453125, -7.82177734375, -7.536865234375, -7.251953125, -6.967041015625, -6.68212890625, -6.397216796875, -6.1123046875, -5.827392578125, -5.54248046875, -5.257568359375, -4.97265625, -4.687744140625, -4.40283203125, -4.117919921875, -3.8330078125, -3.548095703125, -3.26318359375, -2.978271484375, -2.693359375, -2.408447265625, -2.12353515625, -1.838623046875, -1.5537109375, -1.268798828125, -0.98388671875, -0.698974609375, -0.4140625, -0.129150390625, 0.15576171875, 0.440673828125, 0.7255859375, 1.010498046875, 1.29541015625, 1.580322265625, 1.865234375, 2.150146484375, 2.43505859375, 2.719970703125, 3.0048828125, 3.289794921875, 3.57470703125, 3.859619140625, 4.14453125, 4.429443359375, 4.71435546875, 4.999267578125, 5.2841796875, 5.569091796875, 5.85400390625, 6.138916015625, 6.423828125, 6.708740234375, 6.99365234375, 7.278564453125, 7.5634765625, 7.848388671875, 8.13330078125, 8.418212890625, 8.703125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 9.0, 16.0, 46.0, 71.0, 121.0, 176.0, 193.0, 166.0, 92.0, 38.0, 22.0, 14.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-145.06201171875, -141.28384399414062, -137.5056915283203, -133.72752380371094, -129.94937133789062, -126.17121124267578, -122.39305114746094, -118.6148910522461, -114.83673095703125, -111.0585708618164, -107.28041076660156, -103.50225067138672, -99.72409057617188, -95.94593048095703, -92.16777038574219, -88.38961029052734, -84.6114501953125, -80.83329010009766, -77.05513000488281, -73.27696990966797, -69.49880981445312, -65.72064971923828, -61.94248962402344, -58.164329528808594, -54.38616180419922, -50.608001708984375, -46.82984161376953, -43.05168151855469, -39.273521423339844, -35.495361328125, -31.717199325561523, -27.93903923034668, -24.16088104248047, -20.382720947265625, -16.60456085205078, -12.826399803161621, -9.048239707946777, -5.270078659057617, -1.4919185638427734, 2.2862415313720703, 6.064401626586914, 9.842561721801758, 13.620721817016602, 17.398883819580078, 21.177043914794922, 24.955204010009766, 28.73336410522461, 32.51152420043945, 36.2896842956543, 40.06784439086914, 43.846004486083984, 47.62416458129883, 51.40232467651367, 55.18048858642578, 58.958648681640625, 62.73680877685547, 66.51496887207031, 70.29312896728516, 74.0712890625, 77.84944915771484, 81.62760925292969, 85.40576934814453, 89.18392944335938, 92.96208953857422, 96.74024963378906]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 8.0, 13.0, 7.0, 11.0, 15.0, 20.0, 34.0, 25.0, 31.0, 33.0, 35.0, 42.0, 48.0, 56.0, 51.0, 39.0, 50.0, 41.0, 62.0, 43.0, 41.0, 35.0, 43.0, 39.0, 27.0, 28.0, 18.0, 23.0, 15.0, 9.0, 8.0, 9.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.46091842651367, -54.84055709838867, -53.220191955566406, -51.599830627441406, -49.979469299316406, -48.359107971191406, -46.738746643066406, -45.11838150024414, -43.49802017211914, -41.87765884399414, -40.257293701171875, -38.636932373046875, -37.016571044921875, -35.396209716796875, -33.775848388671875, -32.15548324584961, -30.53512191772461, -28.91476058959961, -27.294397354125977, -25.674034118652344, -24.053672790527344, -22.433311462402344, -20.81294822692871, -19.192584991455078, -17.572223663330078, -15.951861381530762, -14.331499099731445, -12.711136817932129, -11.090774536132812, -9.470412254333496, -7.85004997253418, -6.229687690734863, -4.6093292236328125, -2.988966941833496, -1.3686046600341797, 0.2517576217651367, 1.8721199035644531, 3.4924821853637695, 5.112844467163086, 6.733206748962402, 8.353569030761719, 9.973931312561035, 11.594293594360352, 13.214655876159668, 14.835018157958984, 16.455379486083984, 18.075742721557617, 19.69610595703125, 21.31646728515625, 22.93682861328125, 24.557191848754883, 26.177555084228516, 27.797916412353516, 29.418277740478516, 31.03864097595215, 32.65900421142578, 34.27936553955078, 35.89972686767578, 37.52008819580078, 39.14045333862305, 40.76081466674805, 42.38117599487305, 44.00154113769531, 45.62190246582031, 47.24226379394531]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 6.0, 12.0, 17.0, 23.0, 49.0, 73.0, 107.0, 172.0, 276.0, 539.0, 837.0, 1433.0, 2627.0, 4996.0, 9425.0, 19808.0, 42737.0, 101133.0, 346007.0, 336783.0, 99196.0, 42508.0, 19545.0, 9412.0, 4796.0, 2588.0, 1451.0, 786.0, 501.0, 270.0, 154.0, 110.0, 66.0, 44.0, 28.0, 21.0, 10.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.74285888671875, -5.5130615234375, -5.28326416015625, -5.053466796875, -4.82366943359375, -4.5938720703125, -4.36407470703125, -4.13427734375, -3.90447998046875, -3.6746826171875, -3.44488525390625, -3.215087890625, -2.98529052734375, -2.7554931640625, -2.52569580078125, -2.2958984375, -2.06610107421875, -1.8363037109375, -1.60650634765625, -1.376708984375, -1.14691162109375, -0.9171142578125, -0.68731689453125, -0.45751953125, -0.22772216796875, 0.0020751953125, 0.23187255859375, 0.461669921875, 0.69146728515625, 0.9212646484375, 1.15106201171875, 1.380859375, 1.61065673828125, 1.8404541015625, 2.07025146484375, 2.300048828125, 2.52984619140625, 2.7596435546875, 2.98944091796875, 3.21923828125, 3.44903564453125, 3.6788330078125, 3.90863037109375, 4.138427734375, 4.36822509765625, 4.5980224609375, 4.82781982421875, 5.0576171875, 5.28741455078125, 5.5172119140625, 5.74700927734375, 5.976806640625, 6.20660400390625, 6.4364013671875, 6.66619873046875, 6.89599609375, 7.12579345703125, 7.3555908203125, 7.58538818359375, 7.815185546875, 8.04498291015625, 8.2747802734375, 8.50457763671875, 8.734375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 3.0, 7.0, 5.0, 9.0, 5.0, 8.0, 7.0, 15.0, 19.0, 23.0, 25.0, 33.0, 29.0, 47.0, 49.0, 43.0, 48.0, 45.0, 69.0, 59.0, 58.0, 53.0, 40.0, 48.0, 45.0, 34.0, 38.0, 32.0, 21.0, 16.0, 15.0, 15.0, 6.0, 10.0, 6.0, 2.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9609375, -2.847900390625, -2.73486328125, -2.621826171875, -2.5087890625, -2.395751953125, -2.28271484375, -2.169677734375, -2.056640625, -1.943603515625, -1.83056640625, -1.717529296875, -1.6044921875, -1.491455078125, -1.37841796875, -1.265380859375, -1.15234375, -1.039306640625, -0.92626953125, -0.813232421875, -0.7001953125, -0.587158203125, -0.47412109375, -0.361083984375, -0.248046875, -0.135009765625, -0.02197265625, 0.091064453125, 0.2041015625, 0.317138671875, 0.43017578125, 0.543212890625, 0.65625, 0.769287109375, 0.88232421875, 0.995361328125, 1.1083984375, 1.221435546875, 1.33447265625, 1.447509765625, 1.560546875, 1.673583984375, 1.78662109375, 1.899658203125, 2.0126953125, 2.125732421875, 2.23876953125, 2.351806640625, 2.46484375, 2.577880859375, 2.69091796875, 2.803955078125, 2.9169921875, 3.030029296875, 3.14306640625, 3.256103515625, 3.369140625, 3.482177734375, 3.59521484375, 3.708251953125, 3.8212890625, 3.934326171875, 4.04736328125, 4.160400390625, 4.2734375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 14.0, 11.0, 18.0, 19.0, 26.0, 37.0, 84.0, 91.0, 152.0, 252.0, 348.0, 615.0, 1210.0, 2868.0, 10420.0, 84460.0, 860041.0, 73014.0, 9293.0, 2741.0, 1100.0, 622.0, 394.0, 223.0, 145.0, 108.0, 75.0, 63.0, 28.0, 22.0, 15.0, 9.0, 10.0, 4.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.9375, -19.260986328125, -18.58447265625, -17.907958984375, -17.2314453125, -16.554931640625, -15.87841796875, -15.201904296875, -14.525390625, -13.848876953125, -13.17236328125, -12.495849609375, -11.8193359375, -11.142822265625, -10.46630859375, -9.789794921875, -9.11328125, -8.436767578125, -7.76025390625, -7.083740234375, -6.4072265625, -5.730712890625, -5.05419921875, -4.377685546875, -3.701171875, -3.024658203125, -2.34814453125, -1.671630859375, -0.9951171875, -0.318603515625, 0.35791015625, 1.034423828125, 1.7109375, 2.387451171875, 3.06396484375, 3.740478515625, 4.4169921875, 5.093505859375, 5.77001953125, 6.446533203125, 7.123046875, 7.799560546875, 8.47607421875, 9.152587890625, 9.8291015625, 10.505615234375, 11.18212890625, 11.858642578125, 12.53515625, 13.211669921875, 13.88818359375, 14.564697265625, 15.2412109375, 15.917724609375, 16.59423828125, 17.270751953125, 17.947265625, 18.623779296875, 19.30029296875, 19.976806640625, 20.6533203125, 21.329833984375, 22.00634765625, 22.682861328125, 23.359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 7.0, 9.0, 9.0, 2.0, 19.0, 17.0, 22.0, 26.0, 32.0, 36.0, 54.0, 34.0, 57.0, 62.0, 68.0, 56.0, 58.0, 57.0, 60.0, 59.0, 49.0, 34.0, 29.0, 25.0, 24.0, 14.0, 10.0, 14.0, 9.0, 8.0, 10.0, 6.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.4375, -15.852783203125, -15.26806640625, -14.683349609375, -14.0986328125, -13.513916015625, -12.92919921875, -12.344482421875, -11.759765625, -11.175048828125, -10.59033203125, -10.005615234375, -9.4208984375, -8.836181640625, -8.25146484375, -7.666748046875, -7.08203125, -6.497314453125, -5.91259765625, -5.327880859375, -4.7431640625, -4.158447265625, -3.57373046875, -2.989013671875, -2.404296875, -1.819580078125, -1.23486328125, -0.650146484375, -0.0654296875, 0.519287109375, 1.10400390625, 1.688720703125, 2.2734375, 2.858154296875, 3.44287109375, 4.027587890625, 4.6123046875, 5.197021484375, 5.78173828125, 6.366455078125, 6.951171875, 7.535888671875, 8.12060546875, 8.705322265625, 9.2900390625, 9.874755859375, 10.45947265625, 11.044189453125, 11.62890625, 12.213623046875, 12.79833984375, 13.383056640625, 13.9677734375, 14.552490234375, 15.13720703125, 15.721923828125, 16.306640625, 16.891357421875, 17.47607421875, 18.060791015625, 18.6455078125, 19.230224609375, 19.81494140625, 20.399658203125, 20.984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 4.0, 14.0, 22.0, 28.0, 40.0, 78.0, 117.0, 222.0, 473.0, 1043.0, 2807.0, 10702.0, 60391.0, 756531.0, 185818.0, 22284.0, 5019.0, 1658.0, 614.0, 298.0, 146.0, 88.0, 51.0, 37.0, 15.0, 15.0, 5.0, 6.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.46014404296875, -8.2093505859375, -7.95855712890625, -7.707763671875, -7.45697021484375, -7.2061767578125, -6.95538330078125, -6.70458984375, -6.45379638671875, -6.2030029296875, -5.95220947265625, -5.701416015625, -5.45062255859375, -5.1998291015625, -4.94903564453125, -4.6982421875, -4.44744873046875, -4.1966552734375, -3.94586181640625, -3.695068359375, -3.44427490234375, -3.1934814453125, -2.94268798828125, -2.69189453125, -2.44110107421875, -2.1903076171875, -1.93951416015625, -1.688720703125, -1.43792724609375, -1.1871337890625, -0.93634033203125, -0.685546875, -0.43475341796875, -0.1839599609375, 0.06683349609375, 0.317626953125, 0.56842041015625, 0.8192138671875, 1.07000732421875, 1.32080078125, 1.57159423828125, 1.8223876953125, 2.07318115234375, 2.323974609375, 2.57476806640625, 2.8255615234375, 3.07635498046875, 3.3271484375, 3.57794189453125, 3.8287353515625, 4.07952880859375, 4.330322265625, 4.58111572265625, 4.8319091796875, 5.08270263671875, 5.33349609375, 5.58428955078125, 5.8350830078125, 6.08587646484375, 6.336669921875, 6.58746337890625, 6.8382568359375, 7.08905029296875, 7.33984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 1.0, 7.0, 9.0, 7.0, 17.0, 14.0, 27.0, 42.0, 44.0, 86.0, 228.0, 202.0, 110.0, 49.0, 38.0, 21.0, 21.0, 15.0, 9.0, 10.0, 9.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00228118896484375, -0.002212047576904297, -0.0021429061889648438, -0.0020737648010253906, -0.0020046234130859375, -0.0019354820251464844, -0.0018663406372070312, -0.0017971992492675781, -0.001728057861328125, -0.0016589164733886719, -0.0015897750854492188, -0.0015206336975097656, -0.0014514923095703125, -0.0013823509216308594, -0.0013132095336914062, -0.0012440681457519531, -0.0011749267578125, -0.0011057853698730469, -0.0010366439819335938, -0.0009675025939941406, -0.0008983612060546875, -0.0008292198181152344, -0.0007600784301757812, -0.0006909370422363281, -0.000621795654296875, -0.0005526542663574219, -0.00048351287841796875, -0.0004143714904785156, -0.0003452301025390625, -0.0002760887145996094, -0.00020694732666015625, -0.00013780593872070312, -6.866455078125e-05, 4.76837158203125e-07, 6.961822509765625e-05, 0.00013875961303710938, 0.0002079010009765625, 0.0002770423889160156, 0.00034618377685546875, 0.0004153251647949219, 0.000484466552734375, 0.0005536079406738281, 0.0006227493286132812, 0.0006918907165527344, 0.0007610321044921875, 0.0008301734924316406, 0.0008993148803710938, 0.0009684562683105469, 0.00103759765625, 0.0011067390441894531, 0.0011758804321289062, 0.0012450218200683594, 0.0013141632080078125, 0.0013833045959472656, 0.0014524459838867188, 0.0015215873718261719, 0.001590728759765625, 0.0016598701477050781, 0.0017290115356445312, 0.0017981529235839844, 0.0018672943115234375, 0.0019364356994628906, 0.0020055770874023438, 0.002074718475341797, 0.00214385986328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 6.0, 12.0, 11.0, 15.0, 36.0, 27.0, 43.0, 68.0, 112.0, 134.0, 204.0, 325.0, 506.0, 867.0, 1645.0, 3775.0, 10785.0, 45229.0, 345185.0, 555729.0, 61567.0, 13322.0, 4485.0, 1878.0, 991.0, 535.0, 331.0, 212.0, 168.0, 98.0, 71.0, 40.0, 31.0, 31.0, 13.0, 14.0, 13.0, 6.0, 8.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-6.15234375, -5.97186279296875, -5.7913818359375, -5.61090087890625, -5.430419921875, -5.24993896484375, -5.0694580078125, -4.88897705078125, -4.70849609375, -4.52801513671875, -4.3475341796875, -4.16705322265625, -3.986572265625, -3.80609130859375, -3.6256103515625, -3.44512939453125, -3.2646484375, -3.08416748046875, -2.9036865234375, -2.72320556640625, -2.542724609375, -2.36224365234375, -2.1817626953125, -2.00128173828125, -1.82080078125, -1.64031982421875, -1.4598388671875, -1.27935791015625, -1.098876953125, -0.91839599609375, -0.7379150390625, -0.55743408203125, -0.376953125, -0.19647216796875, -0.0159912109375, 0.16448974609375, 0.344970703125, 0.52545166015625, 0.7059326171875, 0.88641357421875, 1.06689453125, 1.24737548828125, 1.4278564453125, 1.60833740234375, 1.788818359375, 1.96929931640625, 2.1497802734375, 2.33026123046875, 2.5107421875, 2.69122314453125, 2.8717041015625, 3.05218505859375, 3.232666015625, 3.41314697265625, 3.5936279296875, 3.77410888671875, 3.95458984375, 4.13507080078125, 4.3155517578125, 4.49603271484375, 4.676513671875, 4.85699462890625, 5.0374755859375, 5.21795654296875, 5.3984375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 10.0, 2.0, 6.0, 10.0, 9.0, 14.0, 16.0, 11.0, 29.0, 21.0, 21.0, 37.0, 33.0, 54.0, 56.0, 75.0, 64.0, 74.0, 64.0, 50.0, 62.0, 58.0, 38.0, 38.0, 24.0, 24.0, 18.0, 15.0, 11.0, 14.0, 9.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.310546875, -3.171417236328125, -3.03228759765625, -2.893157958984375, -2.7540283203125, -2.614898681640625, -2.47576904296875, -2.336639404296875, -2.197509765625, -2.058380126953125, -1.91925048828125, -1.780120849609375, -1.6409912109375, -1.501861572265625, -1.36273193359375, -1.223602294921875, -1.08447265625, -0.945343017578125, -0.80621337890625, -0.667083740234375, -0.5279541015625, -0.388824462890625, -0.24969482421875, -0.110565185546875, 0.028564453125, 0.167694091796875, 0.30682373046875, 0.445953369140625, 0.5850830078125, 0.724212646484375, 0.86334228515625, 1.002471923828125, 1.1416015625, 1.280731201171875, 1.41986083984375, 1.558990478515625, 1.6981201171875, 1.837249755859375, 1.97637939453125, 2.115509033203125, 2.254638671875, 2.393768310546875, 2.53289794921875, 2.672027587890625, 2.8111572265625, 2.950286865234375, 3.08941650390625, 3.228546142578125, 3.36767578125, 3.506805419921875, 3.64593505859375, 3.785064697265625, 3.9241943359375, 4.063323974609375, 4.20245361328125, 4.341583251953125, 4.480712890625, 4.619842529296875, 4.75897216796875, 4.898101806640625, 5.0372314453125, 5.176361083984375, 5.31549072265625, 5.454620361328125, 5.59375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 9.0, 19.0, 39.0, 127.0, 283.0, 302.0, 143.0, 49.0, 12.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-317.2892761230469, -310.4152526855469, -303.54119873046875, -296.66717529296875, -289.7931213378906, -282.9190979003906, -276.0450439453125, -269.1710205078125, -262.2969665527344, -255.4229278564453, -248.54888916015625, -241.6748504638672, -234.80081176757812, -227.92677307128906, -221.052734375, -214.1787109375, -207.30467224121094, -200.43063354492188, -193.5565948486328, -186.68255615234375, -179.8085174560547, -172.93447875976562, -166.06045532226562, -159.1864013671875, -152.3123779296875, -145.43833923339844, -138.56430053710938, -131.6902618408203, -124.81622314453125, -117.94218444824219, -111.06815338134766, -104.1941146850586, -97.32008361816406, -90.446044921875, -83.57200622558594, -76.69796752929688, -69.82392883300781, -62.949893951416016, -56.07585906982422, -49.201820373535156, -42.327781677246094, -35.45374298095703, -28.5797061920166, -21.705669403076172, -14.83163070678711, -7.957592010498047, -1.08355712890625, 5.7904815673828125, 12.664520263671875, 19.538558959960938, 26.412595748901367, 33.2866325378418, 40.16067123413086, 47.03470993041992, 53.90874481201172, 60.78278350830078, 67.65682220458984, 74.5308609008789, 81.40489959716797, 88.2789306640625, 95.15296936035156, 102.02700805664062, 108.90104675292969, 115.77508544921875, 122.64912414550781]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 11.0, 12.0, 16.0, 23.0, 27.0, 35.0, 46.0, 39.0, 49.0, 58.0, 73.0, 62.0, 84.0, 70.0, 61.0, 68.0, 40.0, 37.0, 39.0, 43.0, 24.0, 25.0, 20.0, 12.0, 9.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-110.33940887451172, -107.59660339355469, -104.85380554199219, -102.11100006103516, -99.36819458007812, -96.6253890991211, -93.88258361816406, -91.13978576660156, -88.39698028564453, -85.6541748046875, -82.911376953125, -80.16857147216797, -77.42576599121094, -74.6829605102539, -71.94015502929688, -69.19735717773438, -66.45455169677734, -63.71174621582031, -60.96894454956055, -58.22614288330078, -55.48333740234375, -52.74053192138672, -49.99773025512695, -47.25492858886719, -44.512123107910156, -41.769317626953125, -39.02651596069336, -36.283714294433594, -33.54090881347656, -30.798105239868164, -28.055301666259766, -25.312498092651367, -22.569686889648438, -19.82688331604004, -17.08407974243164, -14.341276168823242, -11.598472595214844, -8.855669021606445, -6.112865447998047, -3.3700618743896484, -0.62725830078125, 2.1155452728271484, 4.858348846435547, 7.601152420043945, 10.343955993652344, 13.086759567260742, 15.82956314086914, 18.57236671447754, 21.315170288085938, 24.057973861694336, 26.800777435302734, 29.543581008911133, 32.28638458251953, 35.02919006347656, 37.77199172973633, 40.514793395996094, 43.257598876953125, 46.000404357910156, 48.74320602416992, 51.48600769042969, 54.22881317138672, 56.97161865234375, 59.714420318603516, 62.45722198486328, 65.20002746582031]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 7.0, 10.0, 12.0, 12.0, 22.0, 33.0, 43.0, 52.0, 86.0, 151.0, 252.0, 639.0, 2199.0, 10602.0, 125597.0, 3914857.0, 125356.0, 10798.0, 2187.0, 654.0, 256.0, 142.0, 89.0, 56.0, 52.0, 22.0, 16.0, 17.0, 17.0, 6.0, 2.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.84375, -16.3409423828125, -15.838134765625, -15.3353271484375, -14.83251953125, -14.3297119140625, -13.826904296875, -13.3240966796875, -12.8212890625, -12.3184814453125, -11.815673828125, -11.3128662109375, -10.81005859375, -10.3072509765625, -9.804443359375, -9.3016357421875, -8.798828125, -8.2960205078125, -7.793212890625, -7.2904052734375, -6.78759765625, -6.2847900390625, -5.781982421875, -5.2791748046875, -4.7763671875, -4.2735595703125, -3.770751953125, -3.2679443359375, -2.76513671875, -2.2623291015625, -1.759521484375, -1.2567138671875, -0.75390625, -0.2510986328125, 0.251708984375, 0.7545166015625, 1.25732421875, 1.7601318359375, 2.262939453125, 2.7657470703125, 3.2685546875, 3.7713623046875, 4.274169921875, 4.7769775390625, 5.27978515625, 5.7825927734375, 6.285400390625, 6.7882080078125, 7.291015625, 7.7938232421875, 8.296630859375, 8.7994384765625, 9.30224609375, 9.8050537109375, 10.307861328125, 10.8106689453125, 11.3134765625, 11.8162841796875, 12.319091796875, 12.8218994140625, 13.32470703125, 13.8275146484375, 14.330322265625, 14.8331298828125, 15.3359375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 11.0, 29.0, 36.0, 64.0, 84.0, 93.0, 120.0, 127.0, 129.0, 97.0, 85.0, 40.0, 36.0, 23.0, 12.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.859375, -8.6015625, -8.34375, -8.0859375, -7.828125, -7.5703125, -7.3125, -7.0546875, -6.796875, -6.5390625, -6.28125, -6.0234375, -5.765625, -5.5078125, -5.25, -4.9921875, -4.734375, -4.4765625, -4.21875, -3.9609375, -3.703125, -3.4453125, -3.1875, -2.9296875, -2.671875, -2.4140625, -2.15625, -1.8984375, -1.640625, -1.3828125, -1.125, -0.8671875, -0.609375, -0.3515625, -0.09375, 0.1640625, 0.421875, 0.6796875, 0.9375, 1.1953125, 1.453125, 1.7109375, 1.96875, 2.2265625, 2.484375, 2.7421875, 3.0, 3.2578125, 3.515625, 3.7734375, 4.03125, 4.2890625, 4.546875, 4.8046875, 5.0625, 5.3203125, 5.578125, 5.8359375, 6.09375, 6.3515625, 6.609375, 6.8671875, 7.125, 7.3828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 5.0, 5.0, 9.0, 17.0, 32.0, 47.0, 69.0, 115.0, 198.0, 357.0, 668.0, 1431.0, 2881.0, 6715.0, 17341.0, 54838.0, 279785.0, 2952097.0, 735920.0, 96397.0, 27258.0, 10135.0, 4186.0, 1857.0, 904.0, 427.0, 245.0, 124.0, 90.0, 36.0, 38.0, 17.0, 9.0, 14.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.7247314453125, -8.449462890625, -8.1741943359375, -7.89892578125, -7.6236572265625, -7.348388671875, -7.0731201171875, -6.7978515625, -6.5225830078125, -6.247314453125, -5.9720458984375, -5.69677734375, -5.4215087890625, -5.146240234375, -4.8709716796875, -4.595703125, -4.3204345703125, -4.045166015625, -3.7698974609375, -3.49462890625, -3.2193603515625, -2.944091796875, -2.6688232421875, -2.3935546875, -2.1182861328125, -1.843017578125, -1.5677490234375, -1.29248046875, -1.0172119140625, -0.741943359375, -0.4666748046875, -0.19140625, 0.0838623046875, 0.359130859375, 0.6343994140625, 0.90966796875, 1.1849365234375, 1.460205078125, 1.7354736328125, 2.0107421875, 2.2860107421875, 2.561279296875, 2.8365478515625, 3.11181640625, 3.3870849609375, 3.662353515625, 3.9376220703125, 4.212890625, 4.4881591796875, 4.763427734375, 5.0386962890625, 5.31396484375, 5.5892333984375, 5.864501953125, 6.1397705078125, 6.4150390625, 6.6903076171875, 6.965576171875, 7.2408447265625, 7.51611328125, 7.7913818359375, 8.066650390625, 8.3419189453125, 8.6171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 2.0, 4.0, 6.0, 6.0, 19.0, 10.0, 21.0, 30.0, 32.0, 56.0, 76.0, 124.0, 189.0, 308.0, 515.0, 756.0, 694.0, 442.0, 238.0, 148.0, 111.0, 73.0, 42.0, 36.0, 27.0, 27.0, 11.0, 10.0, 5.0, 14.0, 5.0, 7.0, 2.0, 4.0, 3.0, 6.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.671875, -9.3858642578125, -9.099853515625, -8.8138427734375, -8.52783203125, -8.2418212890625, -7.955810546875, -7.6697998046875, -7.3837890625, -7.0977783203125, -6.811767578125, -6.5257568359375, -6.23974609375, -5.9537353515625, -5.667724609375, -5.3817138671875, -5.095703125, -4.8096923828125, -4.523681640625, -4.2376708984375, -3.95166015625, -3.6656494140625, -3.379638671875, -3.0936279296875, -2.8076171875, -2.5216064453125, -2.235595703125, -1.9495849609375, -1.66357421875, -1.3775634765625, -1.091552734375, -0.8055419921875, -0.51953125, -0.2335205078125, 0.052490234375, 0.3385009765625, 0.62451171875, 0.9105224609375, 1.196533203125, 1.4825439453125, 1.7685546875, 2.0545654296875, 2.340576171875, 2.6265869140625, 2.91259765625, 3.1986083984375, 3.484619140625, 3.7706298828125, 4.056640625, 4.3426513671875, 4.628662109375, 4.9146728515625, 5.20068359375, 5.4866943359375, 5.772705078125, 6.0587158203125, 6.3447265625, 6.6307373046875, 6.916748046875, 7.2027587890625, 7.48876953125, 7.7747802734375, 8.060791015625, 8.3468017578125, 8.6328125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 0.0, 2.0, 4.0, 4.0, 13.0, 29.0, 39.0, 99.0, 176.0, 193.0, 176.0, 122.0, 61.0, 38.0, 20.0, 7.0, 9.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.94498443603516, -75.87718963623047, -72.80940246582031, -69.74160766601562, -66.67381286621094, -63.60601806640625, -60.53822708129883, -57.470436096191406, -54.40264129638672, -51.33484649658203, -48.26705551147461, -45.19926452636719, -42.1314697265625, -39.06367492675781, -35.99588394165039, -32.92809295654297, -29.86029815673828, -26.792505264282227, -23.724712371826172, -20.656919479370117, -17.589126586914062, -14.521333694458008, -11.453540802001953, -8.385747909545898, -5.317955017089844, -2.250162124633789, 0.8176307678222656, 3.8854236602783203, 6.953216552734375, 10.02100944519043, 13.088802337646484, 16.15659523010254, 19.224395751953125, 22.29218864440918, 25.359981536865234, 28.42777442932129, 31.495567321777344, 34.56336212158203, 37.63115310668945, 40.698944091796875, 43.76673889160156, 46.83453369140625, 49.90232467651367, 52.970115661621094, 56.03791046142578, 59.10570526123047, 62.17349624633789, 65.24128723144531, 68.30908203125, 71.37687683105469, 74.44467163085938, 77.51245880126953, 80.58025360107422, 83.6480484008789, 86.71583557128906, 89.78363037109375, 92.85142517089844, 95.91921997070312, 98.98701477050781, 102.05480194091797, 105.12259674072266, 108.19039154052734, 111.2581787109375, 114.32597351074219, 117.39376831054688]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 4.0, 12.0, 11.0, 8.0, 12.0, 17.0, 15.0, 21.0, 20.0, 40.0, 33.0, 39.0, 50.0, 50.0, 56.0, 53.0, 46.0, 47.0, 57.0, 60.0, 45.0, 44.0, 41.0, 40.0, 34.0, 25.0, 25.0, 23.0, 20.0, 15.0, 12.0, 8.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.248558044433594, -44.79008102416992, -43.331607818603516, -41.873130798339844, -40.41465759277344, -38.956180572509766, -37.497703552246094, -36.03923034667969, -34.580753326416016, -33.122276306152344, -31.663803100585938, -30.205326080322266, -28.746850967407227, -27.288375854492188, -25.829898834228516, -24.371423721313477, -22.912948608398438, -21.4544734954834, -19.99599838256836, -18.537521362304688, -17.07904624938965, -15.62057113647461, -14.162095069885254, -12.703619003295898, -11.24514389038086, -9.78666877746582, -8.328192710876465, -6.869717121124268, -5.41124153137207, -3.952765941619873, -2.494290351867676, -1.0358142852783203, 0.42266082763671875, 1.881136417388916, 3.3396120071411133, 4.7980875968933105, 6.256563186645508, 7.715038776397705, 9.173514366149902, 10.631990432739258, 12.090465545654297, 13.548940658569336, 15.007416725158691, 16.465892791748047, 17.924367904663086, 19.382843017578125, 20.841320037841797, 22.299795150756836, 23.758270263671875, 25.216745376586914, 26.675220489501953, 28.133697509765625, 29.592172622680664, 31.050647735595703, 32.509124755859375, 33.96759796142578, 35.42607498168945, 36.884552001953125, 38.34302520751953, 39.8015022277832, 41.259979248046875, 42.71845245361328, 44.17692947387695, 45.635406494140625, 47.09387969970703]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 7.0, 8.0, 23.0, 38.0, 58.0, 81.0, 129.0, 216.0, 279.0, 570.0, 938.0, 1873.0, 3601.0, 7225.0, 15380.0, 35003.0, 97088.0, 395865.0, 343692.0, 86096.0, 32339.0, 14056.0, 6716.0, 3333.0, 1605.0, 962.0, 531.0, 308.0, 194.0, 122.0, 68.0, 56.0, 25.0, 22.0, 11.0, 10.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.28125, -8.0299072265625, -7.778564453125, -7.5272216796875, -7.27587890625, -7.0245361328125, -6.773193359375, -6.5218505859375, -6.2705078125, -6.0191650390625, -5.767822265625, -5.5164794921875, -5.26513671875, -5.0137939453125, -4.762451171875, -4.5111083984375, -4.259765625, -4.0084228515625, -3.757080078125, -3.5057373046875, -3.25439453125, -3.0030517578125, -2.751708984375, -2.5003662109375, -2.2490234375, -1.9976806640625, -1.746337890625, -1.4949951171875, -1.24365234375, -0.9923095703125, -0.740966796875, -0.4896240234375, -0.23828125, 0.0130615234375, 0.264404296875, 0.5157470703125, 0.76708984375, 1.0184326171875, 1.269775390625, 1.5211181640625, 1.7724609375, 2.0238037109375, 2.275146484375, 2.5264892578125, 2.77783203125, 3.0291748046875, 3.280517578125, 3.5318603515625, 3.783203125, 4.0345458984375, 4.285888671875, 4.5372314453125, 4.78857421875, 5.0399169921875, 5.291259765625, 5.5426025390625, 5.7939453125, 6.0452880859375, 6.296630859375, 6.5479736328125, 6.79931640625, 7.0506591796875, 7.302001953125, 7.5533447265625, 7.8046875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 5.0, 19.0, 20.0, 27.0, 26.0, 44.0, 45.0, 47.0, 59.0, 71.0, 87.0, 50.0, 70.0, 69.0, 64.0, 59.0, 47.0, 50.0, 33.0, 27.0, 27.0, 16.0, 7.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.2109375, -5.05609130859375, -4.9012451171875, -4.74639892578125, -4.591552734375, -4.43670654296875, -4.2818603515625, -4.12701416015625, -3.97216796875, -3.81732177734375, -3.6624755859375, -3.50762939453125, -3.352783203125, -3.19793701171875, -3.0430908203125, -2.88824462890625, -2.7333984375, -2.57855224609375, -2.4237060546875, -2.26885986328125, -2.114013671875, -1.95916748046875, -1.8043212890625, -1.64947509765625, -1.49462890625, -1.33978271484375, -1.1849365234375, -1.03009033203125, -0.875244140625, -0.72039794921875, -0.5655517578125, -0.41070556640625, -0.255859375, -0.10101318359375, 0.0538330078125, 0.20867919921875, 0.363525390625, 0.51837158203125, 0.6732177734375, 0.82806396484375, 0.98291015625, 1.13775634765625, 1.2926025390625, 1.44744873046875, 1.602294921875, 1.75714111328125, 1.9119873046875, 2.06683349609375, 2.2216796875, 2.37652587890625, 2.5313720703125, 2.68621826171875, 2.841064453125, 2.99591064453125, 3.1507568359375, 3.30560302734375, 3.46044921875, 3.61529541015625, 3.7701416015625, 3.92498779296875, 4.079833984375, 4.23468017578125, 4.3895263671875, 4.54437255859375, 4.69921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 8.0, 9.0, 13.0, 13.0, 29.0, 42.0, 40.0, 70.0, 97.0, 168.0, 253.0, 441.0, 750.0, 1405.0, 3188.0, 9616.0, 37913.0, 353534.0, 576305.0, 46647.0, 10808.0, 3648.0, 1542.0, 752.0, 470.0, 233.0, 194.0, 120.0, 65.0, 43.0, 39.0, 28.0, 19.0, 15.0, 9.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.3026123046875, -15.823974609375, -15.3453369140625, -14.86669921875, -14.3880615234375, -13.909423828125, -13.4307861328125, -12.9521484375, -12.4735107421875, -11.994873046875, -11.5162353515625, -11.03759765625, -10.5589599609375, -10.080322265625, -9.6016845703125, -9.123046875, -8.6444091796875, -8.165771484375, -7.6871337890625, -7.20849609375, -6.7298583984375, -6.251220703125, -5.7725830078125, -5.2939453125, -4.8153076171875, -4.336669921875, -3.8580322265625, -3.37939453125, -2.9007568359375, -2.422119140625, -1.9434814453125, -1.46484375, -0.9862060546875, -0.507568359375, -0.0289306640625, 0.44970703125, 0.9283447265625, 1.406982421875, 1.8856201171875, 2.3642578125, 2.8428955078125, 3.321533203125, 3.8001708984375, 4.27880859375, 4.7574462890625, 5.236083984375, 5.7147216796875, 6.193359375, 6.6719970703125, 7.150634765625, 7.6292724609375, 8.10791015625, 8.5865478515625, 9.065185546875, 9.5438232421875, 10.0224609375, 10.5010986328125, 10.979736328125, 11.4583740234375, 11.93701171875, 12.4156494140625, 12.894287109375, 13.3729248046875, 13.8515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 12.0, 16.0, 12.0, 23.0, 21.0, 26.0, 23.0, 30.0, 29.0, 44.0, 40.0, 46.0, 50.0, 53.0, 37.0, 63.0, 42.0, 50.0, 57.0, 49.0, 28.0, 33.0, 23.0, 27.0, 26.0, 25.0, 18.0, 14.0, 16.0, 7.0, 12.0, 4.0, 3.0, 1.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.796875, -16.3310546875, -15.865234375, -15.3994140625, -14.93359375, -14.4677734375, -14.001953125, -13.5361328125, -13.0703125, -12.6044921875, -12.138671875, -11.6728515625, -11.20703125, -10.7412109375, -10.275390625, -9.8095703125, -9.34375, -8.8779296875, -8.412109375, -7.9462890625, -7.48046875, -7.0146484375, -6.548828125, -6.0830078125, -5.6171875, -5.1513671875, -4.685546875, -4.2197265625, -3.75390625, -3.2880859375, -2.822265625, -2.3564453125, -1.890625, -1.4248046875, -0.958984375, -0.4931640625, -0.02734375, 0.4384765625, 0.904296875, 1.3701171875, 1.8359375, 2.3017578125, 2.767578125, 3.2333984375, 3.69921875, 4.1650390625, 4.630859375, 5.0966796875, 5.5625, 6.0283203125, 6.494140625, 6.9599609375, 7.42578125, 7.8916015625, 8.357421875, 8.8232421875, 9.2890625, 9.7548828125, 10.220703125, 10.6865234375, 11.15234375, 11.6181640625, 12.083984375, 12.5498046875, 13.015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 7.0, 12.0, 24.0, 32.0, 41.0, 96.0, 212.0, 540.0, 1724.0, 8444.0, 80409.0, 842615.0, 101702.0, 9695.0, 1933.0, 529.0, 247.0, 104.0, 61.0, 38.0, 24.0, 7.0, 18.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3515625, -10.033447265625, -9.71533203125, -9.397216796875, -9.0791015625, -8.760986328125, -8.44287109375, -8.124755859375, -7.806640625, -7.488525390625, -7.17041015625, -6.852294921875, -6.5341796875, -6.216064453125, -5.89794921875, -5.579833984375, -5.26171875, -4.943603515625, -4.62548828125, -4.307373046875, -3.9892578125, -3.671142578125, -3.35302734375, -3.034912109375, -2.716796875, -2.398681640625, -2.08056640625, -1.762451171875, -1.4443359375, -1.126220703125, -0.80810546875, -0.489990234375, -0.171875, 0.146240234375, 0.46435546875, 0.782470703125, 1.1005859375, 1.418701171875, 1.73681640625, 2.054931640625, 2.373046875, 2.691162109375, 3.00927734375, 3.327392578125, 3.6455078125, 3.963623046875, 4.28173828125, 4.599853515625, 4.91796875, 5.236083984375, 5.55419921875, 5.872314453125, 6.1904296875, 6.508544921875, 6.82666015625, 7.144775390625, 7.462890625, 7.781005859375, 8.09912109375, 8.417236328125, 8.7353515625, 9.053466796875, 9.37158203125, 9.689697265625, 10.0078125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 1.0, 2.0, 9.0, 11.0, 12.0, 13.0, 13.0, 20.0, 27.0, 42.0, 61.0, 75.0, 124.0, 135.0, 124.0, 94.0, 65.0, 50.0, 37.0, 17.0, 12.0, 19.0, 8.0, 5.0, 3.0, 0.0, 5.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.001766204833984375, -0.0017193853855133057, -0.0016725659370422363, -0.001625746488571167, -0.0015789270401000977, -0.0015321075916290283, -0.001485288143157959, -0.0014384686946868896, -0.0013916492462158203, -0.001344829797744751, -0.0012980103492736816, -0.0012511909008026123, -0.001204371452331543, -0.0011575520038604736, -0.0011107325553894043, -0.001063913106918335, -0.0010170936584472656, -0.0009702742099761963, -0.000923454761505127, -0.0008766353130340576, -0.0008298158645629883, -0.0007829964160919189, -0.0007361769676208496, -0.0006893575191497803, -0.0006425380706787109, -0.0005957186222076416, -0.0005488991737365723, -0.0005020797252655029, -0.0004552602767944336, -0.00040844082832336426, -0.0003616213798522949, -0.0003148019313812256, -0.00026798248291015625, -0.00022116303443908691, -0.00017434358596801758, -0.00012752413749694824, -8.07046890258789e-05, -3.388524055480957e-05, 1.2934207916259766e-05, 5.97536563873291e-05, 0.00010657310485839844, 0.00015339255332946777, 0.0002002120018005371, 0.00024703145027160645, 0.0002938508987426758, 0.0003406703472137451, 0.00038748979568481445, 0.0004343092441558838, 0.0004811286926269531, 0.0005279481410980225, 0.0005747675895690918, 0.0006215870380401611, 0.0006684064865112305, 0.0007152259349822998, 0.0007620453834533691, 0.0008088648319244385, 0.0008556842803955078, 0.0009025037288665771, 0.0009493231773376465, 0.0009961426258087158, 0.0010429620742797852, 0.0010897815227508545, 0.0011366009712219238, 0.0011834204196929932, 0.0012302398681640625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 6.0, 10.0, 15.0, 13.0, 42.0, 38.0, 70.0, 118.0, 191.0, 335.0, 732.0, 1648.0, 4815.0, 18643.0, 135974.0, 738874.0, 122090.0, 17346.0, 4431.0, 1604.0, 735.0, 346.0, 194.0, 102.0, 70.0, 40.0, 19.0, 19.0, 8.0, 9.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-8.2734375, -8.05841064453125, -7.8433837890625, -7.62835693359375, -7.413330078125, -7.19830322265625, -6.9832763671875, -6.76824951171875, -6.55322265625, -6.33819580078125, -6.1231689453125, -5.90814208984375, -5.693115234375, -5.47808837890625, -5.2630615234375, -5.04803466796875, -4.8330078125, -4.61798095703125, -4.4029541015625, -4.18792724609375, -3.972900390625, -3.75787353515625, -3.5428466796875, -3.32781982421875, -3.11279296875, -2.89776611328125, -2.6827392578125, -2.46771240234375, -2.252685546875, -2.03765869140625, -1.8226318359375, -1.60760498046875, -1.392578125, -1.17755126953125, -0.9625244140625, -0.74749755859375, -0.532470703125, -0.31744384765625, -0.1024169921875, 0.11260986328125, 0.32763671875, 0.54266357421875, 0.7576904296875, 0.97271728515625, 1.187744140625, 1.40277099609375, 1.6177978515625, 1.83282470703125, 2.0478515625, 2.26287841796875, 2.4779052734375, 2.69293212890625, 2.907958984375, 3.12298583984375, 3.3380126953125, 3.55303955078125, 3.76806640625, 3.98309326171875, 4.1981201171875, 4.41314697265625, 4.628173828125, 4.84320068359375, 5.0582275390625, 5.27325439453125, 5.48828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 4.0, 4.0, 9.0, 14.0, 14.0, 18.0, 26.0, 27.0, 31.0, 32.0, 56.0, 69.0, 58.0, 56.0, 64.0, 73.0, 74.0, 67.0, 56.0, 52.0, 42.0, 33.0, 18.0, 17.0, 15.0, 14.0, 13.0, 8.0, 5.0, 6.0, 3.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.73046875, -3.6016845703125, -3.472900390625, -3.3441162109375, -3.21533203125, -3.0865478515625, -2.957763671875, -2.8289794921875, -2.7001953125, -2.5714111328125, -2.442626953125, -2.3138427734375, -2.18505859375, -2.0562744140625, -1.927490234375, -1.7987060546875, -1.669921875, -1.5411376953125, -1.412353515625, -1.2835693359375, -1.15478515625, -1.0260009765625, -0.897216796875, -0.7684326171875, -0.6396484375, -0.5108642578125, -0.382080078125, -0.2532958984375, -0.12451171875, 0.0042724609375, 0.133056640625, 0.2618408203125, 0.390625, 0.5194091796875, 0.648193359375, 0.7769775390625, 0.90576171875, 1.0345458984375, 1.163330078125, 1.2921142578125, 1.4208984375, 1.5496826171875, 1.678466796875, 1.8072509765625, 1.93603515625, 2.0648193359375, 2.193603515625, 2.3223876953125, 2.451171875, 2.5799560546875, 2.708740234375, 2.8375244140625, 2.96630859375, 3.0950927734375, 3.223876953125, 3.3526611328125, 3.4814453125, 3.6102294921875, 3.739013671875, 3.8677978515625, 3.99658203125, 4.1253662109375, 4.254150390625, 4.3829345703125, 4.51171875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 6.0, 4.0, 6.0, 16.0, 59.0, 166.0, 399.0, 247.0, 76.0, 14.0, 5.0, 5.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.3475036621094, -262.9935607910156, -255.63961791992188, -248.28567504882812, -240.93173217773438, -233.57778930664062, -226.2238311767578, -218.86988830566406, -211.5159454345703, -204.16200256347656, -196.8080596923828, -189.45411682128906, -182.10015869140625, -174.7462158203125, -167.39227294921875, -160.038330078125, -152.68438720703125, -145.3304443359375, -137.97650146484375, -130.62255859375, -123.26860809326172, -115.91466522216797, -108.56071472167969, -101.20677185058594, -93.85282897949219, -86.49888610839844, -79.14494323730469, -71.7909927368164, -64.43704986572266, -57.083106994628906, -49.72916030883789, -42.375213623046875, -35.02128601074219, -27.667341232299805, -20.313396453857422, -12.959451675415039, -5.605506896972656, 1.7484359741210938, 9.10238265991211, 16.456329345703125, 23.810272216796875, 31.164216995239258, 38.51816177368164, 45.872108459472656, 53.226051330566406, 60.579994201660156, 67.93394470214844, 75.28788757324219, 82.64183044433594, 89.99577331542969, 97.34971618652344, 104.70366668701172, 112.05760955810547, 119.41155242919922, 126.7655029296875, 134.11944580078125, 141.473388671875, 148.82733154296875, 156.1812744140625, 163.53521728515625, 170.88916015625, 178.24310302734375, 185.59706115722656, 192.9510040283203, 200.30494689941406]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 19.0, 14.0, 25.0, 19.0, 22.0, 25.0, 37.0, 39.0, 42.0, 31.0, 46.0, 59.0, 63.0, 83.0, 62.0, 58.0, 40.0, 45.0, 40.0, 40.0, 21.0, 29.0, 18.0, 20.0, 18.0, 12.0, 18.0, 9.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.0403823852539, -63.86643600463867, -61.69248580932617, -59.51853942871094, -57.34458923339844, -55.1706428527832, -52.99669647216797, -50.82274627685547, -48.648799896240234, -46.474853515625, -44.3009033203125, -42.126956939697266, -39.95301055908203, -37.77906036376953, -35.6051139831543, -33.43116760253906, -31.257217407226562, -29.083269119262695, -26.909320831298828, -24.735374450683594, -22.561426162719727, -20.38747787475586, -18.213531494140625, -16.039583206176758, -13.86563491821289, -11.691686630249023, -9.517739295959473, -7.343791484832764, -5.169843673706055, -2.9958953857421875, -0.8219480514526367, 1.351999282836914, 3.52593994140625, 5.699887752532959, 7.873835563659668, 10.047782897949219, 12.221731185913086, 14.395679473876953, 16.569625854492188, 18.743574142456055, 20.917522430419922, 23.09147071838379, 25.265419006347656, 27.43936538696289, 29.613313674926758, 31.787261962890625, 33.96120834350586, 36.135154724121094, 38.309104919433594, 40.48305130004883, 42.65700149536133, 44.83094787597656, 47.00489807128906, 49.1788444519043, 51.35279083251953, 53.52674102783203, 55.700687408447266, 57.8746337890625, 60.048583984375, 62.222530364990234, 64.39647674560547, 66.57042694091797, 68.74437713623047, 70.91831970214844, 73.09226989746094]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 8.0, 9.0, 11.0, 17.0, 29.0, 44.0, 89.0, 131.0, 198.0, 317.0, 511.0, 1000.0, 1679.0, 3077.0, 5602.0, 11014.0, 22171.0, 49661.0, 126981.0, 452175.0, 1699446.0, 1323191.0, 317136.0, 98732.0, 40770.0, 19164.0, 9514.0, 5062.0, 2716.0, 1608.0, 878.0, 508.0, 311.0, 177.0, 127.0, 81.0, 42.0, 29.0, 25.0, 13.0, 8.0, 8.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.900390625, -3.769866943359375, -3.63934326171875, -3.508819580078125, -3.3782958984375, -3.247772216796875, -3.11724853515625, -2.986724853515625, -2.856201171875, -2.725677490234375, -2.59515380859375, -2.464630126953125, -2.3341064453125, -2.203582763671875, -2.07305908203125, -1.942535400390625, -1.81201171875, -1.681488037109375, -1.55096435546875, -1.420440673828125, -1.2899169921875, -1.159393310546875, -1.02886962890625, -0.898345947265625, -0.767822265625, -0.637298583984375, -0.50677490234375, -0.376251220703125, -0.2457275390625, -0.115203857421875, 0.01531982421875, 0.145843505859375, 0.2763671875, 0.406890869140625, 0.53741455078125, 0.667938232421875, 0.7984619140625, 0.928985595703125, 1.05950927734375, 1.190032958984375, 1.320556640625, 1.451080322265625, 1.58160400390625, 1.712127685546875, 1.8426513671875, 1.973175048828125, 2.10369873046875, 2.234222412109375, 2.36474609375, 2.495269775390625, 2.62579345703125, 2.756317138671875, 2.8868408203125, 3.017364501953125, 3.14788818359375, 3.278411865234375, 3.408935546875, 3.539459228515625, 3.66998291015625, 3.800506591796875, 3.9310302734375, 4.061553955078125, 4.19207763671875, 4.322601318359375, 4.453125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 10.0, 4.0, 18.0, 12.0, 23.0, 25.0, 27.0, 23.0, 29.0, 43.0, 39.0, 56.0, 41.0, 44.0, 48.0, 49.0, 45.0, 49.0, 56.0, 47.0, 44.0, 46.0, 33.0, 27.0, 31.0, 30.0, 18.0, 21.0, 13.0, 15.0, 13.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.533203125, -3.4248046875, -3.31640625, -3.2080078125, -3.099609375, -2.9912109375, -2.8828125, -2.7744140625, -2.666015625, -2.5576171875, -2.44921875, -2.3408203125, -2.232421875, -2.1240234375, -2.015625, -1.9072265625, -1.798828125, -1.6904296875, -1.58203125, -1.4736328125, -1.365234375, -1.2568359375, -1.1484375, -1.0400390625, -0.931640625, -0.8232421875, -0.71484375, -0.6064453125, -0.498046875, -0.3896484375, -0.28125, -0.1728515625, -0.064453125, 0.0439453125, 0.15234375, 0.2607421875, 0.369140625, 0.4775390625, 0.5859375, 0.6943359375, 0.802734375, 0.9111328125, 1.01953125, 1.1279296875, 1.236328125, 1.3447265625, 1.453125, 1.5615234375, 1.669921875, 1.7783203125, 1.88671875, 1.9951171875, 2.103515625, 2.2119140625, 2.3203125, 2.4287109375, 2.537109375, 2.6455078125, 2.75390625, 2.8623046875, 2.970703125, 3.0791015625, 3.1875, 3.2958984375, 3.404296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 4.0, 5.0, 8.0, 8.0, 16.0, 20.0, 20.0, 34.0, 54.0, 57.0, 109.0, 171.0, 328.0, 566.0, 990.0, 2054.0, 4204.0, 10778.0, 31911.0, 119241.0, 733102.0, 2761132.0, 402685.0, 83919.0, 25213.0, 9141.0, 3941.0, 1900.0, 1024.0, 583.0, 346.0, 228.0, 133.0, 94.0, 71.0, 53.0, 38.0, 30.0, 15.0, 12.0, 12.0, 7.0, 6.0, 3.0, 6.0, 0.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.875, -7.6068115234375, -7.338623046875, -7.0704345703125, -6.80224609375, -6.5340576171875, -6.265869140625, -5.9976806640625, -5.7294921875, -5.4613037109375, -5.193115234375, -4.9249267578125, -4.65673828125, -4.3885498046875, -4.120361328125, -3.8521728515625, -3.583984375, -3.3157958984375, -3.047607421875, -2.7794189453125, -2.51123046875, -2.2430419921875, -1.974853515625, -1.7066650390625, -1.4384765625, -1.1702880859375, -0.902099609375, -0.6339111328125, -0.36572265625, -0.0975341796875, 0.170654296875, 0.4388427734375, 0.70703125, 0.9752197265625, 1.243408203125, 1.5115966796875, 1.77978515625, 2.0479736328125, 2.316162109375, 2.5843505859375, 2.8525390625, 3.1207275390625, 3.388916015625, 3.6571044921875, 3.92529296875, 4.1934814453125, 4.461669921875, 4.7298583984375, 4.998046875, 5.2662353515625, 5.534423828125, 5.8026123046875, 6.07080078125, 6.3389892578125, 6.607177734375, 6.8753662109375, 7.1435546875, 7.4117431640625, 7.679931640625, 7.9481201171875, 8.21630859375, 8.4844970703125, 8.752685546875, 9.0208740234375, 9.2890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 15.0, 24.0, 22.0, 37.0, 53.0, 82.0, 112.0, 161.0, 234.0, 457.0, 605.0, 750.0, 509.0, 324.0, 216.0, 117.0, 86.0, 58.0, 48.0, 41.0, 25.0, 21.0, 16.0, 13.0, 9.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3828125, -10.001953125, -9.62109375, -9.240234375, -8.859375, -8.478515625, -8.09765625, -7.716796875, -7.3359375, -6.955078125, -6.57421875, -6.193359375, -5.8125, -5.431640625, -5.05078125, -4.669921875, -4.2890625, -3.908203125, -3.52734375, -3.146484375, -2.765625, -2.384765625, -2.00390625, -1.623046875, -1.2421875, -0.861328125, -0.48046875, -0.099609375, 0.28125, 0.662109375, 1.04296875, 1.423828125, 1.8046875, 2.185546875, 2.56640625, 2.947265625, 3.328125, 3.708984375, 4.08984375, 4.470703125, 4.8515625, 5.232421875, 5.61328125, 5.994140625, 6.375, 6.755859375, 7.13671875, 7.517578125, 7.8984375, 8.279296875, 8.66015625, 9.041015625, 9.421875, 9.802734375, 10.18359375, 10.564453125, 10.9453125, 11.326171875, 11.70703125, 12.087890625, 12.46875, 12.849609375, 13.23046875, 13.611328125, 13.9921875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 6.0, 6.0, 21.0, 52.0, 95.0, 228.0, 260.0, 158.0, 101.0, 34.0, 19.0, 7.0, 1.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-210.12994384765625, -204.63720703125, -199.14447021484375, -193.65174865722656, -188.1590118408203, -182.66627502441406, -177.1735382080078, -171.68081665039062, -166.18807983398438, -160.69534301757812, -155.20260620117188, -149.7098846435547, -144.21714782714844, -138.7244110107422, -133.23167419433594, -127.73894500732422, -122.24620819091797, -116.75347137451172, -111.2607421875, -105.76800537109375, -100.27527618408203, -94.78253936767578, -89.28981018066406, -83.79707336425781, -78.30433654785156, -72.81159973144531, -67.3188705444336, -61.826133728027344, -56.333404541015625, -50.840667724609375, -45.34793472290039, -39.855201721191406, -34.36247253417969, -28.869739532470703, -23.37700653076172, -17.8842716217041, -12.391538619995117, -6.898805618286133, -1.4060707092285156, 4.086662292480469, 9.579395294189453, 15.072128295898438, 20.564861297607422, 26.05759620666504, 31.550329208374023, 37.043060302734375, 42.535797119140625, 48.02853012084961, 53.521263122558594, 59.01399612426758, 64.50672912597656, 69.99946594238281, 75.49219512939453, 80.98493194580078, 86.4776611328125, 91.97039794921875, 97.463134765625, 102.95587158203125, 108.44860076904297, 113.94133758544922, 119.43406677246094, 124.92680358886719, 130.41954040527344, 135.91226196289062, 141.40499877929688]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 9.0, 12.0, 15.0, 17.0, 17.0, 19.0, 26.0, 35.0, 33.0, 27.0, 34.0, 32.0, 38.0, 37.0, 42.0, 34.0, 36.0, 32.0, 42.0, 48.0, 45.0, 35.0, 34.0, 37.0, 34.0, 32.0, 27.0, 23.0, 21.0, 14.0, 18.0, 12.0, 13.0, 11.0, 14.0, 7.0, 8.0, 4.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-53.924217224121094, -52.243858337402344, -50.563499450683594, -48.883140563964844, -47.20278549194336, -45.52242660522461, -43.84206771850586, -42.16170883178711, -40.48134994506836, -38.80099105834961, -37.12063217163086, -35.440277099609375, -33.759918212890625, -32.079559326171875, -30.399200439453125, -28.718841552734375, -27.038484573364258, -25.358125686645508, -23.67776870727539, -21.99740982055664, -20.31705093383789, -18.63669204711914, -16.956335067749023, -15.275976181030273, -13.59561824798584, -11.915260314941406, -10.234901428222656, -8.554543495178223, -6.874185085296631, -5.193826675415039, -3.5134687423706055, -1.8331098556518555, -0.15275192260742188, 1.5276063680648804, 3.2079646587371826, 4.888322830200195, 6.568681240081787, 8.249039649963379, 9.929397583007812, 11.609756469726562, 13.290114402770996, 14.97047233581543, 16.65083122253418, 18.331188201904297, 20.011547088623047, 21.691905975341797, 23.372264862060547, 25.052623748779297, 26.732980728149414, 28.413339614868164, 30.09369659423828, 31.77405548095703, 33.45441436767578, 35.13477325439453, 36.81513214111328, 38.49549102783203, 40.175846099853516, 41.856204986572266, 43.536563873291016, 45.2169189453125, 46.89727783203125, 48.57763671875, 50.25799560546875, 51.9383544921875, 53.61871337890625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 3.0, 8.0, 12.0, 13.0, 26.0, 30.0, 33.0, 62.0, 91.0, 173.0, 288.0, 436.0, 754.0, 1503.0, 2815.0, 5869.0, 12295.0, 26149.0, 57443.0, 138190.0, 403097.0, 240805.0, 85496.0, 37965.0, 17923.0, 8356.0, 3910.0, 2105.0, 1097.0, 601.0, 377.0, 223.0, 129.0, 96.0, 50.0, 41.0, 29.0, 16.0, 13.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.421875, -8.1646728515625, -7.907470703125, -7.6502685546875, -7.39306640625, -7.1358642578125, -6.878662109375, -6.6214599609375, -6.3642578125, -6.1070556640625, -5.849853515625, -5.5926513671875, -5.33544921875, -5.0782470703125, -4.821044921875, -4.5638427734375, -4.306640625, -4.0494384765625, -3.792236328125, -3.5350341796875, -3.27783203125, -3.0206298828125, -2.763427734375, -2.5062255859375, -2.2490234375, -1.9918212890625, -1.734619140625, -1.4774169921875, -1.22021484375, -0.9630126953125, -0.705810546875, -0.4486083984375, -0.19140625, 0.0657958984375, 0.322998046875, 0.5802001953125, 0.83740234375, 1.0946044921875, 1.351806640625, 1.6090087890625, 1.8662109375, 2.1234130859375, 2.380615234375, 2.6378173828125, 2.89501953125, 3.1522216796875, 3.409423828125, 3.6666259765625, 3.923828125, 4.1810302734375, 4.438232421875, 4.6954345703125, 4.95263671875, 5.2098388671875, 5.467041015625, 5.7242431640625, 5.9814453125, 6.2386474609375, 6.495849609375, 6.7530517578125, 7.01025390625, 7.2674560546875, 7.524658203125, 7.7818603515625, 8.0390625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 5.0, 6.0, 4.0, 13.0, 13.0, 9.0, 20.0, 15.0, 17.0, 16.0, 31.0, 26.0, 39.0, 29.0, 45.0, 37.0, 30.0, 38.0, 43.0, 52.0, 52.0, 38.0, 48.0, 49.0, 27.0, 40.0, 35.0, 32.0, 30.0, 29.0, 17.0, 23.0, 11.0, 16.0, 12.0, 4.0, 10.0, 5.0, 5.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.29296875, -3.192291259765625, -3.09161376953125, -2.990936279296875, -2.8902587890625, -2.789581298828125, -2.68890380859375, -2.588226318359375, -2.487548828125, -2.386871337890625, -2.28619384765625, -2.185516357421875, -2.0848388671875, -1.984161376953125, -1.88348388671875, -1.782806396484375, -1.68212890625, -1.581451416015625, -1.48077392578125, -1.380096435546875, -1.2794189453125, -1.178741455078125, -1.07806396484375, -0.977386474609375, -0.876708984375, -0.776031494140625, -0.67535400390625, -0.574676513671875, -0.4739990234375, -0.373321533203125, -0.27264404296875, -0.171966552734375, -0.0712890625, 0.029388427734375, 0.13006591796875, 0.230743408203125, 0.3314208984375, 0.432098388671875, 0.53277587890625, 0.633453369140625, 0.734130859375, 0.834808349609375, 0.93548583984375, 1.036163330078125, 1.1368408203125, 1.237518310546875, 1.33819580078125, 1.438873291015625, 1.53955078125, 1.640228271484375, 1.74090576171875, 1.841583251953125, 1.9422607421875, 2.042938232421875, 2.14361572265625, 2.244293212890625, 2.344970703125, 2.445648193359375, 2.54632568359375, 2.647003173828125, 2.7476806640625, 2.848358154296875, 2.94903564453125, 3.049713134765625, 3.150390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 5.0, 7.0, 6.0, 9.0, 8.0, 20.0, 25.0, 53.0, 74.0, 102.0, 147.0, 240.0, 367.0, 630.0, 1091.0, 2038.0, 4473.0, 14276.0, 86667.0, 807146.0, 104734.0, 16432.0, 4961.0, 2173.0, 1126.0, 623.0, 402.0, 217.0, 162.0, 99.0, 71.0, 64.0, 29.0, 20.0, 16.0, 13.0, 9.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.453125, -23.76513671875, -23.0771484375, -22.38916015625, -21.701171875, -21.01318359375, -20.3251953125, -19.63720703125, -18.94921875, -18.26123046875, -17.5732421875, -16.88525390625, -16.197265625, -15.50927734375, -14.8212890625, -14.13330078125, -13.4453125, -12.75732421875, -12.0693359375, -11.38134765625, -10.693359375, -10.00537109375, -9.3173828125, -8.62939453125, -7.94140625, -7.25341796875, -6.5654296875, -5.87744140625, -5.189453125, -4.50146484375, -3.8134765625, -3.12548828125, -2.4375, -1.74951171875, -1.0615234375, -0.37353515625, 0.314453125, 1.00244140625, 1.6904296875, 2.37841796875, 3.06640625, 3.75439453125, 4.4423828125, 5.13037109375, 5.818359375, 6.50634765625, 7.1943359375, 7.88232421875, 8.5703125, 9.25830078125, 9.9462890625, 10.63427734375, 11.322265625, 12.01025390625, 12.6982421875, 13.38623046875, 14.07421875, 14.76220703125, 15.4501953125, 16.13818359375, 16.826171875, 17.51416015625, 18.2021484375, 18.89013671875, 19.578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 7.0, 5.0, 7.0, 9.0, 15.0, 12.0, 20.0, 18.0, 20.0, 18.0, 22.0, 28.0, 33.0, 38.0, 27.0, 32.0, 47.0, 54.0, 55.0, 43.0, 48.0, 40.0, 45.0, 51.0, 41.0, 40.0, 31.0, 24.0, 24.0, 21.0, 19.0, 25.0, 9.0, 8.0, 9.0, 7.0, 15.0, 7.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-17.1875, -16.68896484375, -16.1904296875, -15.69189453125, -15.193359375, -14.69482421875, -14.1962890625, -13.69775390625, -13.19921875, -12.70068359375, -12.2021484375, -11.70361328125, -11.205078125, -10.70654296875, -10.2080078125, -9.70947265625, -9.2109375, -8.71240234375, -8.2138671875, -7.71533203125, -7.216796875, -6.71826171875, -6.2197265625, -5.72119140625, -5.22265625, -4.72412109375, -4.2255859375, -3.72705078125, -3.228515625, -2.72998046875, -2.2314453125, -1.73291015625, -1.234375, -0.73583984375, -0.2373046875, 0.26123046875, 0.759765625, 1.25830078125, 1.7568359375, 2.25537109375, 2.75390625, 3.25244140625, 3.7509765625, 4.24951171875, 4.748046875, 5.24658203125, 5.7451171875, 6.24365234375, 6.7421875, 7.24072265625, 7.7392578125, 8.23779296875, 8.736328125, 9.23486328125, 9.7333984375, 10.23193359375, 10.73046875, 11.22900390625, 11.7275390625, 12.22607421875, 12.724609375, 13.22314453125, 13.7216796875, 14.22021484375, 14.71875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 12.0, 14.0, 27.0, 32.0, 38.0, 58.0, 118.0, 212.0, 431.0, 979.0, 2216.0, 6448.0, 23085.0, 107034.0, 687495.0, 171610.0, 34717.0, 8781.0, 2933.0, 1101.0, 542.0, 289.0, 139.0, 73.0, 58.0, 30.0, 25.0, 12.0, 6.0, 7.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.60882568359375, -5.4129638671875, -5.21710205078125, -5.021240234375, -4.82537841796875, -4.6295166015625, -4.43365478515625, -4.23779296875, -4.04193115234375, -3.8460693359375, -3.65020751953125, -3.454345703125, -3.25848388671875, -3.0626220703125, -2.86676025390625, -2.6708984375, -2.47503662109375, -2.2791748046875, -2.08331298828125, -1.887451171875, -1.69158935546875, -1.4957275390625, -1.29986572265625, -1.10400390625, -0.90814208984375, -0.7122802734375, -0.51641845703125, -0.320556640625, -0.12469482421875, 0.0711669921875, 0.26702880859375, 0.462890625, 0.65875244140625, 0.8546142578125, 1.05047607421875, 1.246337890625, 1.44219970703125, 1.6380615234375, 1.83392333984375, 2.02978515625, 2.22564697265625, 2.4215087890625, 2.61737060546875, 2.813232421875, 3.00909423828125, 3.2049560546875, 3.40081787109375, 3.5966796875, 3.79254150390625, 3.9884033203125, 4.18426513671875, 4.380126953125, 4.57598876953125, 4.7718505859375, 4.96771240234375, 5.16357421875, 5.35943603515625, 5.5552978515625, 5.75115966796875, 5.947021484375, 6.14288330078125, 6.3387451171875, 6.53460693359375, 6.73046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 5.0, 6.0, 9.0, 21.0, 22.0, 15.0, 29.0, 28.0, 40.0, 56.0, 69.0, 141.0, 182.0, 87.0, 52.0, 45.0, 33.0, 32.0, 25.0, 25.0, 16.0, 9.0, 12.0, 6.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001941680908203125, -0.0018830150365829468, -0.0018243491649627686, -0.0017656832933425903, -0.0017070174217224121, -0.0016483515501022339, -0.0015896856784820557, -0.0015310198068618774, -0.0014723539352416992, -0.001413688063621521, -0.0013550221920013428, -0.0012963563203811646, -0.0012376904487609863, -0.001179024577140808, -0.0011203587055206299, -0.0010616928339004517, -0.0010030269622802734, -0.0009443610906600952, -0.000885695219039917, -0.0008270293474197388, -0.0007683634757995605, -0.0007096976041793823, -0.0006510317325592041, -0.0005923658609390259, -0.0005336999893188477, -0.00047503411769866943, -0.0004163682460784912, -0.000357702374458313, -0.00029903650283813477, -0.00024037063121795654, -0.00018170475959777832, -0.0001230388879776001, -6.437301635742188e-05, -5.707144737243652e-06, 5.295872688293457e-05, 0.00011162459850311279, 0.00017029047012329102, 0.00022895634174346924, 0.00028762221336364746, 0.0003462880849838257, 0.0004049539566040039, 0.00046361982822418213, 0.0005222856998443604, 0.0005809515714645386, 0.0006396174430847168, 0.000698283314704895, 0.0007569491863250732, 0.0008156150579452515, 0.0008742809295654297, 0.0009329468011856079, 0.0009916126728057861, 0.0010502785444259644, 0.0011089444160461426, 0.0011676102876663208, 0.001226276159286499, 0.0012849420309066772, 0.0013436079025268555, 0.0014022737741470337, 0.001460939645767212, 0.0015196055173873901, 0.0015782713890075684, 0.0016369372606277466, 0.0016956031322479248, 0.001754269003868103, 0.0018129348754882812]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 11.0, 1.0, 7.0, 4.0, 16.0, 8.0, 22.0, 29.0, 38.0, 59.0, 77.0, 113.0, 156.0, 201.0, 344.0, 583.0, 965.0, 1747.0, 3323.0, 7853.0, 25601.0, 115872.0, 653149.0, 181897.0, 37125.0, 10409.0, 4060.0, 1989.0, 1115.0, 617.0, 370.0, 231.0, 164.0, 112.0, 80.0, 70.0, 44.0, 21.0, 11.0, 10.0, 7.0, 15.0, 10.0, 7.0, 2.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.046875, -4.8873291015625, -4.727783203125, -4.5682373046875, -4.40869140625, -4.2491455078125, -4.089599609375, -3.9300537109375, -3.7705078125, -3.6109619140625, -3.451416015625, -3.2918701171875, -3.13232421875, -2.9727783203125, -2.813232421875, -2.6536865234375, -2.494140625, -2.3345947265625, -2.175048828125, -2.0155029296875, -1.85595703125, -1.6964111328125, -1.536865234375, -1.3773193359375, -1.2177734375, -1.0582275390625, -0.898681640625, -0.7391357421875, -0.57958984375, -0.4200439453125, -0.260498046875, -0.1009521484375, 0.05859375, 0.2181396484375, 0.377685546875, 0.5372314453125, 0.69677734375, 0.8563232421875, 1.015869140625, 1.1754150390625, 1.3349609375, 1.4945068359375, 1.654052734375, 1.8135986328125, 1.97314453125, 2.1326904296875, 2.292236328125, 2.4517822265625, 2.611328125, 2.7708740234375, 2.930419921875, 3.0899658203125, 3.24951171875, 3.4090576171875, 3.568603515625, 3.7281494140625, 3.8876953125, 4.0472412109375, 4.206787109375, 4.3663330078125, 4.52587890625, 4.6854248046875, 4.844970703125, 5.0045166015625, 5.1640625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 3.0, 6.0, 6.0, 6.0, 4.0, 7.0, 10.0, 10.0, 16.0, 19.0, 17.0, 17.0, 18.0, 21.0, 26.0, 33.0, 34.0, 45.0, 47.0, 55.0, 67.0, 75.0, 72.0, 50.0, 52.0, 39.0, 24.0, 31.0, 35.0, 18.0, 9.0, 19.0, 12.0, 12.0, 14.0, 14.0, 10.0, 8.0, 6.0, 6.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.41015625, -3.29425048828125, -3.1783447265625, -3.06243896484375, -2.946533203125, -2.83062744140625, -2.7147216796875, -2.59881591796875, -2.48291015625, -2.36700439453125, -2.2510986328125, -2.13519287109375, -2.019287109375, -1.90338134765625, -1.7874755859375, -1.67156982421875, -1.5556640625, -1.43975830078125, -1.3238525390625, -1.20794677734375, -1.092041015625, -0.97613525390625, -0.8602294921875, -0.74432373046875, -0.62841796875, -0.51251220703125, -0.3966064453125, -0.28070068359375, -0.164794921875, -0.04888916015625, 0.0670166015625, 0.18292236328125, 0.298828125, 0.41473388671875, 0.5306396484375, 0.64654541015625, 0.762451171875, 0.87835693359375, 0.9942626953125, 1.11016845703125, 1.22607421875, 1.34197998046875, 1.4578857421875, 1.57379150390625, 1.689697265625, 1.80560302734375, 1.9215087890625, 2.03741455078125, 2.1533203125, 2.26922607421875, 2.3851318359375, 2.50103759765625, 2.616943359375, 2.73284912109375, 2.8487548828125, 2.96466064453125, 3.08056640625, 3.19647216796875, 3.3123779296875, 3.42828369140625, 3.544189453125, 3.66009521484375, 3.7760009765625, 3.89190673828125, 4.0078125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 7.0, 8.0, 13.0, 31.0, 52.0, 89.0, 137.0, 214.0, 186.0, 98.0, 64.0, 43.0, 21.0, 8.0, 8.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.78268432617188, -113.70319366455078, -109.62371063232422, -105.54421997070312, -101.46473693847656, -97.38524627685547, -93.30575561523438, -89.22627258300781, -85.14678192138672, -81.06729125976562, -76.98780822753906, -72.90831756591797, -68.82882690429688, -64.74934387207031, -60.66985321044922, -56.59036636352539, -52.51087951660156, -48.431392669677734, -44.351905822753906, -40.27241516113281, -36.192928314208984, -32.113441467285156, -28.033952713012695, -23.954463958740234, -19.874977111816406, -15.795489311218262, -11.716001510620117, -7.636513710021973, -3.557025909423828, 0.5224609375, 4.601949691772461, 8.681438446044922, 12.760940551757812, 16.84042739868164, 20.9199161529541, 24.999404907226562, 29.07889175415039, 33.15837860107422, 37.23786926269531, 41.31735610961914, 45.39684295654297, 49.4763298034668, 53.555816650390625, 57.63530731201172, 61.71479415893555, 65.79428100585938, 69.87377166748047, 73.95326232910156, 78.03274536132812, 82.11223602294922, 86.19171905517578, 90.27120971679688, 94.35069274902344, 98.43018341064453, 102.50967407226562, 106.58915710449219, 110.66864776611328, 114.74813842773438, 118.82762145996094, 122.90711212158203, 126.98660278320312, 131.0660858154297, 135.14556884765625, 139.22506713867188, 143.30455017089844]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 19.0, 24.0, 15.0, 19.0, 23.0, 27.0, 24.0, 35.0, 32.0, 36.0, 46.0, 51.0, 62.0, 77.0, 71.0, 65.0, 54.0, 46.0, 43.0, 24.0, 28.0, 22.0, 27.0, 15.0, 20.0, 12.0, 10.0, 15.0, 8.0, 7.0, 7.0, 5.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-86.53713989257812, -84.25668334960938, -81.97622680664062, -79.69577026367188, -77.41531372070312, -75.13485717773438, -72.85440063476562, -70.57394409179688, -68.29348754882812, -66.01303100585938, -63.732574462890625, -61.452117919921875, -59.171661376953125, -56.891204833984375, -54.610748291015625, -52.330291748046875, -50.04983901977539, -47.76938247680664, -45.48892593383789, -43.20846939086914, -40.92801284790039, -38.64755630493164, -36.367103576660156, -34.086647033691406, -31.806188583374023, -29.525732040405273, -27.245275497436523, -24.964820861816406, -22.684364318847656, -20.403907775878906, -18.123451232910156, -15.842994689941406, -13.562538146972656, -11.282081604003906, -9.001625061035156, -6.721169471740723, -4.440712928771973, -2.1602563858032227, 0.12019920349121094, 2.400655746459961, 4.681112289428711, 6.961568832397461, 9.242025375366211, 11.522480964660645, 13.802937507629395, 16.083393096923828, 18.363849639892578, 20.644306182861328, 22.924762725830078, 25.205219268798828, 27.485675811767578, 29.766132354736328, 32.04658889770508, 34.32704544067383, 36.60749816894531, 38.88795471191406, 41.16841125488281, 43.44886779785156, 45.72932434082031, 48.00978088378906, 50.29023742675781, 52.57069396972656, 54.85115051269531, 57.13160705566406, 59.41206359863281]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 11.0, 6.0, 11.0, 25.0, 37.0, 39.0, 77.0, 128.0, 179.0, 249.0, 443.0, 648.0, 1080.0, 1750.0, 2954.0, 5189.0, 9297.0, 18057.0, 37311.0, 91614.0, 304519.0, 1241664.0, 1742123.0, 504970.0, 132708.0, 49349.0, 22917.0, 11569.0, 6332.0, 3521.0, 2106.0, 1268.0, 772.0, 475.0, 303.0, 181.0, 144.0, 97.0, 48.0, 51.0, 21.0, 14.0, 9.0, 9.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-4.72265625, -4.59210205078125, -4.4615478515625, -4.33099365234375, -4.200439453125, -4.06988525390625, -3.9393310546875, -3.80877685546875, -3.67822265625, -3.54766845703125, -3.4171142578125, -3.28656005859375, -3.156005859375, -3.02545166015625, -2.8948974609375, -2.76434326171875, -2.6337890625, -2.50323486328125, -2.3726806640625, -2.24212646484375, -2.111572265625, -1.98101806640625, -1.8504638671875, -1.71990966796875, -1.58935546875, -1.45880126953125, -1.3282470703125, -1.19769287109375, -1.067138671875, -0.93658447265625, -0.8060302734375, -0.67547607421875, -0.544921875, -0.41436767578125, -0.2838134765625, -0.15325927734375, -0.022705078125, 0.10784912109375, 0.2384033203125, 0.36895751953125, 0.49951171875, 0.63006591796875, 0.7606201171875, 0.89117431640625, 1.021728515625, 1.15228271484375, 1.2828369140625, 1.41339111328125, 1.5439453125, 1.67449951171875, 1.8050537109375, 1.93560791015625, 2.066162109375, 2.19671630859375, 2.3272705078125, 2.45782470703125, 2.58837890625, 2.71893310546875, 2.8494873046875, 2.98004150390625, 3.110595703125, 3.24114990234375, 3.3717041015625, 3.50225830078125, 3.6328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 9.0, 9.0, 11.0, 15.0, 12.0, 12.0, 16.0, 30.0, 25.0, 28.0, 32.0, 34.0, 40.0, 40.0, 38.0, 45.0, 36.0, 42.0, 45.0, 47.0, 37.0, 40.0, 41.0, 54.0, 50.0, 28.0, 24.0, 23.0, 31.0, 14.0, 16.0, 18.0, 14.0, 12.0, 8.0, 9.0, 6.0, 4.0, 0.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.505859375, -3.40106201171875, -3.2962646484375, -3.19146728515625, -3.086669921875, -2.98187255859375, -2.8770751953125, -2.77227783203125, -2.66748046875, -2.56268310546875, -2.4578857421875, -2.35308837890625, -2.248291015625, -2.14349365234375, -2.0386962890625, -1.93389892578125, -1.8291015625, -1.72430419921875, -1.6195068359375, -1.51470947265625, -1.409912109375, -1.30511474609375, -1.2003173828125, -1.09552001953125, -0.99072265625, -0.88592529296875, -0.7811279296875, -0.67633056640625, -0.571533203125, -0.46673583984375, -0.3619384765625, -0.25714111328125, -0.15234375, -0.04754638671875, 0.0572509765625, 0.16204833984375, 0.266845703125, 0.37164306640625, 0.4764404296875, 0.58123779296875, 0.68603515625, 0.79083251953125, 0.8956298828125, 1.00042724609375, 1.105224609375, 1.21002197265625, 1.3148193359375, 1.41961669921875, 1.5244140625, 1.62921142578125, 1.7340087890625, 1.83880615234375, 1.943603515625, 2.04840087890625, 2.1531982421875, 2.25799560546875, 2.36279296875, 2.46759033203125, 2.5723876953125, 2.67718505859375, 2.781982421875, 2.88677978515625, 2.9915771484375, 3.09637451171875, 3.201171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 7.0, 13.0, 25.0, 18.0, 28.0, 32.0, 61.0, 82.0, 130.0, 201.0, 333.0, 512.0, 927.0, 1772.0, 3819.0, 9557.0, 27633.0, 110929.0, 979650.0, 2714274.0, 261437.0, 53876.0, 16527.0, 6186.0, 2799.0, 1352.0, 775.0, 428.0, 292.0, 165.0, 135.0, 78.0, 60.0, 55.0, 29.0, 17.0, 20.0, 8.0, 12.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.703125, -9.37109375, -9.0390625, -8.70703125, -8.375, -8.04296875, -7.7109375, -7.37890625, -7.046875, -6.71484375, -6.3828125, -6.05078125, -5.71875, -5.38671875, -5.0546875, -4.72265625, -4.390625, -4.05859375, -3.7265625, -3.39453125, -3.0625, -2.73046875, -2.3984375, -2.06640625, -1.734375, -1.40234375, -1.0703125, -0.73828125, -0.40625, -0.07421875, 0.2578125, 0.58984375, 0.921875, 1.25390625, 1.5859375, 1.91796875, 2.25, 2.58203125, 2.9140625, 3.24609375, 3.578125, 3.91015625, 4.2421875, 4.57421875, 4.90625, 5.23828125, 5.5703125, 5.90234375, 6.234375, 6.56640625, 6.8984375, 7.23046875, 7.5625, 7.89453125, 8.2265625, 8.55859375, 8.890625, 9.22265625, 9.5546875, 9.88671875, 10.21875, 10.55078125, 10.8828125, 11.21484375, 11.546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 6.0, 12.0, 11.0, 11.0, 27.0, 27.0, 46.0, 83.0, 85.0, 165.0, 277.0, 514.0, 722.0, 684.0, 488.0, 297.0, 187.0, 100.0, 88.0, 68.0, 40.0, 32.0, 20.0, 13.0, 14.0, 14.0, 7.0, 2.0, 5.0, 2.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.984375, -12.5516357421875, -12.118896484375, -11.6861572265625, -11.25341796875, -10.8206787109375, -10.387939453125, -9.9552001953125, -9.5224609375, -9.0897216796875, -8.656982421875, -8.2242431640625, -7.79150390625, -7.3587646484375, -6.926025390625, -6.4932861328125, -6.060546875, -5.6278076171875, -5.195068359375, -4.7623291015625, -4.32958984375, -3.8968505859375, -3.464111328125, -3.0313720703125, -2.5986328125, -2.1658935546875, -1.733154296875, -1.3004150390625, -0.86767578125, -0.4349365234375, -0.002197265625, 0.4305419921875, 0.86328125, 1.2960205078125, 1.728759765625, 2.1614990234375, 2.59423828125, 3.0269775390625, 3.459716796875, 3.8924560546875, 4.3251953125, 4.7579345703125, 5.190673828125, 5.6234130859375, 6.05615234375, 6.4888916015625, 6.921630859375, 7.3543701171875, 7.787109375, 8.2198486328125, 8.652587890625, 9.0853271484375, 9.51806640625, 9.9508056640625, 10.383544921875, 10.8162841796875, 11.2490234375, 11.6817626953125, 12.114501953125, 12.5472412109375, 12.97998046875, 13.4127197265625, 13.845458984375, 14.2781982421875, 14.7109375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 12.0, 14.0, 32.0, 83.0, 153.0, 200.0, 206.0, 137.0, 58.0, 43.0, 21.0, 12.0, 8.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.30025482177734, -104.95867156982422, -99.61709594726562, -94.2755126953125, -88.93392944335938, -83.59234619140625, -78.25077056884766, -72.90918731689453, -67.56761169433594, -62.22603225708008, -56.88444900512695, -51.542869567871094, -46.20128631591797, -40.85970687866211, -35.51812744140625, -30.176544189453125, -24.8349609375, -19.493379592895508, -14.151799201965332, -8.810218811035156, -3.468637466430664, 1.8729438781738281, 7.2145233154296875, 12.556106567382812, 17.897686004638672, 23.239267349243164, 28.580848693847656, 33.922428131103516, 39.264007568359375, 44.6055908203125, 49.94717025756836, 55.288753509521484, 60.63032531738281, 65.97190856933594, 71.31348419189453, 76.65506744384766, 81.99665069580078, 87.33822631835938, 92.6798095703125, 98.02139282226562, 103.36297607421875, 108.70455932617188, 114.04613494873047, 119.3877182006836, 124.72930145263672, 130.0708770751953, 135.41246032714844, 140.75404357910156, 146.09561157226562, 151.43719482421875, 156.77877807617188, 162.120361328125, 167.46192932128906, 172.8035125732422, 178.1450958251953, 183.48667907714844, 188.82826232910156, 194.1698455810547, 199.5114288330078, 204.85299682617188, 210.194580078125, 215.53616333007812, 220.87774658203125, 226.21932983398438, 231.5609130859375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 18.0, 14.0, 11.0, 18.0, 18.0, 26.0, 20.0, 35.0, 39.0, 37.0, 41.0, 46.0, 43.0, 48.0, 53.0, 43.0, 51.0, 32.0, 34.0, 41.0, 39.0, 39.0, 29.0, 23.0, 29.0, 25.0, 24.0, 12.0, 10.0, 16.0, 15.0, 8.0, 10.0, 2.0, 5.0, 7.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-64.92037963867188, -62.97454833984375, -61.028717041015625, -59.0828857421875, -57.13705062866211, -55.191219329833984, -53.24538803100586, -51.299556732177734, -49.353721618652344, -47.40789031982422, -45.462059020996094, -43.51622772216797, -41.57039260864258, -39.62456130981445, -37.67873001098633, -35.7328987121582, -33.78706741333008, -31.841236114501953, -29.895402908325195, -27.94957160949707, -26.003738403320312, -24.057907104492188, -22.112075805664062, -20.166244506835938, -18.22041130065918, -16.274580001831055, -14.328746795654297, -12.382915496826172, -10.43708324432373, -8.491250991821289, -6.545419692993164, -4.599587440490723, -2.6537551879882812, -0.707923173904419, 1.2379088401794434, 3.1837406158447266, 5.129572868347168, 7.075405120849609, 9.021236419677734, 10.967068672180176, 12.912900924682617, 14.858733177185059, 16.8045654296875, 18.750396728515625, 20.69622802734375, 22.642061233520508, 24.587892532348633, 26.53372573852539, 28.479557037353516, 30.42538833618164, 32.371219635009766, 34.317054748535156, 36.26288604736328, 38.208717346191406, 40.15454864501953, 42.100379943847656, 44.04621124267578, 45.992042541503906, 47.93787384033203, 49.883705139160156, 51.82954025268555, 53.77537155151367, 55.7212028503418, 57.66703414916992, 59.61286926269531]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 5.0, 13.0, 17.0, 20.0, 23.0, 36.0, 47.0, 71.0, 130.0, 164.0, 227.0, 376.0, 585.0, 861.0, 1310.0, 2249.0, 3697.0, 6358.0, 11419.0, 22061.0, 47245.0, 124847.0, 380552.0, 280653.0, 88173.0, 36404.0, 17559.0, 9511.0, 5466.0, 3100.0, 1999.0, 1171.0, 702.0, 494.0, 305.0, 216.0, 136.0, 102.0, 69.0, 39.0, 45.0, 23.0, 25.0, 11.0, 8.0, 10.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.94140625, -6.70880126953125, -6.4761962890625, -6.24359130859375, -6.010986328125, -5.77838134765625, -5.5457763671875, -5.31317138671875, -5.08056640625, -4.84796142578125, -4.6153564453125, -4.38275146484375, -4.150146484375, -3.91754150390625, -3.6849365234375, -3.45233154296875, -3.2197265625, -2.98712158203125, -2.7545166015625, -2.52191162109375, -2.289306640625, -2.05670166015625, -1.8240966796875, -1.59149169921875, -1.35888671875, -1.12628173828125, -0.8936767578125, -0.66107177734375, -0.428466796875, -0.19586181640625, 0.0367431640625, 0.26934814453125, 0.501953125, 0.73455810546875, 0.9671630859375, 1.19976806640625, 1.432373046875, 1.66497802734375, 1.8975830078125, 2.13018798828125, 2.36279296875, 2.59539794921875, 2.8280029296875, 3.06060791015625, 3.293212890625, 3.52581787109375, 3.7584228515625, 3.99102783203125, 4.2236328125, 4.45623779296875, 4.6888427734375, 4.92144775390625, 5.154052734375, 5.38665771484375, 5.6192626953125, 5.85186767578125, 6.08447265625, 6.31707763671875, 6.5496826171875, 6.78228759765625, 7.014892578125, 7.24749755859375, 7.4801025390625, 7.71270751953125, 7.9453125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 5.0, 3.0, 12.0, 11.0, 16.0, 22.0, 21.0, 18.0, 33.0, 35.0, 27.0, 24.0, 42.0, 52.0, 43.0, 53.0, 37.0, 58.0, 48.0, 46.0, 49.0, 54.0, 31.0, 38.0, 27.0, 26.0, 32.0, 19.0, 16.0, 14.0, 14.0, 14.0, 5.0, 7.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.21484375, -4.091278076171875, -3.96771240234375, -3.844146728515625, -3.7205810546875, -3.597015380859375, -3.47344970703125, -3.349884033203125, -3.226318359375, -3.102752685546875, -2.97918701171875, -2.855621337890625, -2.7320556640625, -2.608489990234375, -2.48492431640625, -2.361358642578125, -2.23779296875, -2.114227294921875, -1.99066162109375, -1.867095947265625, -1.7435302734375, -1.619964599609375, -1.49639892578125, -1.372833251953125, -1.249267578125, -1.125701904296875, -1.00213623046875, -0.878570556640625, -0.7550048828125, -0.631439208984375, -0.50787353515625, -0.384307861328125, -0.2607421875, -0.137176513671875, -0.01361083984375, 0.109954833984375, 0.2335205078125, 0.357086181640625, 0.48065185546875, 0.604217529296875, 0.727783203125, 0.851348876953125, 0.97491455078125, 1.098480224609375, 1.2220458984375, 1.345611572265625, 1.46917724609375, 1.592742919921875, 1.71630859375, 1.839874267578125, 1.96343994140625, 2.087005615234375, 2.2105712890625, 2.334136962890625, 2.45770263671875, 2.581268310546875, 2.704833984375, 2.828399658203125, 2.95196533203125, 3.075531005859375, 3.1990966796875, 3.322662353515625, 3.44622802734375, 3.569793701171875, 3.693359375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 12.0, 9.0, 11.0, 24.0, 42.0, 41.0, 58.0, 89.0, 116.0, 169.0, 264.0, 479.0, 719.0, 1426.0, 2930.0, 7896.0, 29067.0, 224223.0, 708098.0, 52123.0, 12234.0, 4099.0, 1778.0, 994.0, 545.0, 344.0, 222.0, 170.0, 125.0, 65.0, 57.0, 42.0, 21.0, 15.0, 20.0, 12.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.96875, -19.384521484375, -18.80029296875, -18.216064453125, -17.6318359375, -17.047607421875, -16.46337890625, -15.879150390625, -15.294921875, -14.710693359375, -14.12646484375, -13.542236328125, -12.9580078125, -12.373779296875, -11.78955078125, -11.205322265625, -10.62109375, -10.036865234375, -9.45263671875, -8.868408203125, -8.2841796875, -7.699951171875, -7.11572265625, -6.531494140625, -5.947265625, -5.363037109375, -4.77880859375, -4.194580078125, -3.6103515625, -3.026123046875, -2.44189453125, -1.857666015625, -1.2734375, -0.689208984375, -0.10498046875, 0.479248046875, 1.0634765625, 1.647705078125, 2.23193359375, 2.816162109375, 3.400390625, 3.984619140625, 4.56884765625, 5.153076171875, 5.7373046875, 6.321533203125, 6.90576171875, 7.489990234375, 8.07421875, 8.658447265625, 9.24267578125, 9.826904296875, 10.4111328125, 10.995361328125, 11.57958984375, 12.163818359375, 12.748046875, 13.332275390625, 13.91650390625, 14.500732421875, 15.0849609375, 15.669189453125, 16.25341796875, 16.837646484375, 17.421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 4.0, 3.0, 5.0, 11.0, 10.0, 11.0, 8.0, 16.0, 18.0, 20.0, 34.0, 31.0, 36.0, 48.0, 47.0, 44.0, 56.0, 74.0, 65.0, 45.0, 42.0, 52.0, 44.0, 43.0, 41.0, 36.0, 29.0, 22.0, 19.0, 20.0, 13.0, 14.0, 18.0, 5.0, 0.0, 2.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.09375, -16.5078125, -15.921875, -15.3359375, -14.75, -14.1640625, -13.578125, -12.9921875, -12.40625, -11.8203125, -11.234375, -10.6484375, -10.0625, -9.4765625, -8.890625, -8.3046875, -7.71875, -7.1328125, -6.546875, -5.9609375, -5.375, -4.7890625, -4.203125, -3.6171875, -3.03125, -2.4453125, -1.859375, -1.2734375, -0.6875, -0.1015625, 0.484375, 1.0703125, 1.65625, 2.2421875, 2.828125, 3.4140625, 4.0, 4.5859375, 5.171875, 5.7578125, 6.34375, 6.9296875, 7.515625, 8.1015625, 8.6875, 9.2734375, 9.859375, 10.4453125, 11.03125, 11.6171875, 12.203125, 12.7890625, 13.375, 13.9609375, 14.546875, 15.1328125, 15.71875, 16.3046875, 16.890625, 17.4765625, 18.0625, 18.6484375, 19.234375, 19.8203125, 20.40625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 10.0, 8.0, 20.0, 23.0, 38.0, 61.0, 109.0, 199.0, 394.0, 703.0, 1483.0, 3309.0, 9058.0, 29116.0, 114161.0, 644471.0, 182397.0, 42532.0, 12434.0, 4444.0, 1807.0, 810.0, 399.0, 218.0, 131.0, 72.0, 46.0, 23.0, 19.0, 15.0, 10.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.6953125, -5.50946044921875, -5.3236083984375, -5.13775634765625, -4.951904296875, -4.76605224609375, -4.5802001953125, -4.39434814453125, -4.20849609375, -4.02264404296875, -3.8367919921875, -3.65093994140625, -3.465087890625, -3.27923583984375, -3.0933837890625, -2.90753173828125, -2.7216796875, -2.53582763671875, -2.3499755859375, -2.16412353515625, -1.978271484375, -1.79241943359375, -1.6065673828125, -1.42071533203125, -1.23486328125, -1.04901123046875, -0.8631591796875, -0.67730712890625, -0.491455078125, -0.30560302734375, -0.1197509765625, 0.06610107421875, 0.251953125, 0.43780517578125, 0.6236572265625, 0.80950927734375, 0.995361328125, 1.18121337890625, 1.3670654296875, 1.55291748046875, 1.73876953125, 1.92462158203125, 2.1104736328125, 2.29632568359375, 2.482177734375, 2.66802978515625, 2.8538818359375, 3.03973388671875, 3.2255859375, 3.41143798828125, 3.5972900390625, 3.78314208984375, 3.968994140625, 4.15484619140625, 4.3406982421875, 4.52655029296875, 4.71240234375, 4.89825439453125, 5.0841064453125, 5.26995849609375, 5.455810546875, 5.64166259765625, 5.8275146484375, 6.01336669921875, 6.19921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 10.0, 12.0, 11.0, 16.0, 15.0, 22.0, 22.0, 38.0, 59.0, 85.0, 122.0, 151.0, 130.0, 76.0, 59.0, 33.0, 29.0, 21.0, 17.0, 14.0, 10.0, 14.0, 6.0, 4.0, 3.0, 1.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00223541259765625, -0.0021725594997406006, -0.002109706401824951, -0.0020468533039093018, -0.0019840002059936523, -0.001921147108078003, -0.0018582940101623535, -0.001795440912246704, -0.0017325878143310547, -0.0016697347164154053, -0.0016068816184997559, -0.0015440285205841064, -0.001481175422668457, -0.0014183223247528076, -0.0013554692268371582, -0.0012926161289215088, -0.0012297630310058594, -0.00116690993309021, -0.0011040568351745605, -0.0010412037372589111, -0.0009783506393432617, -0.0009154975414276123, -0.0008526444435119629, -0.0007897913455963135, -0.0007269382476806641, -0.0006640851497650146, -0.0006012320518493652, -0.0005383789539337158, -0.0004755258560180664, -0.000412672758102417, -0.0003498196601867676, -0.00028696656227111816, -0.00022411346435546875, -0.00016126036643981934, -9.840726852416992e-05, -3.555417060852051e-05, 2.7298927307128906e-05, 9.015202522277832e-05, 0.00015300512313842773, 0.00021585822105407715, 0.00027871131896972656, 0.000341564416885376, 0.0004044175148010254, 0.0004672706127166748, 0.0005301237106323242, 0.0005929768085479736, 0.000655829906463623, 0.0007186830043792725, 0.0007815361022949219, 0.0008443892002105713, 0.0009072422981262207, 0.0009700953960418701, 0.0010329484939575195, 0.001095801591873169, 0.0011586546897888184, 0.0012215077877044678, 0.0012843608856201172, 0.0013472139835357666, 0.001410067081451416, 0.0014729201793670654, 0.0015357732772827148, 0.0015986263751983643, 0.0016614794731140137, 0.001724332571029663, 0.0017871856689453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 7.0, 4.0, 24.0, 17.0, 47.0, 62.0, 120.0, 217.0, 374.0, 755.0, 1502.0, 3569.0, 11151.0, 50442.0, 483764.0, 428412.0, 50258.0, 11091.0, 3597.0, 1568.0, 748.0, 338.0, 168.0, 103.0, 80.0, 49.0, 28.0, 17.0, 11.0, 10.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1171875, -6.9014892578125, -6.685791015625, -6.4700927734375, -6.25439453125, -6.0386962890625, -5.822998046875, -5.6072998046875, -5.3916015625, -5.1759033203125, -4.960205078125, -4.7445068359375, -4.52880859375, -4.3131103515625, -4.097412109375, -3.8817138671875, -3.666015625, -3.4503173828125, -3.234619140625, -3.0189208984375, -2.80322265625, -2.5875244140625, -2.371826171875, -2.1561279296875, -1.9404296875, -1.7247314453125, -1.509033203125, -1.2933349609375, -1.07763671875, -0.8619384765625, -0.646240234375, -0.4305419921875, -0.21484375, 0.0008544921875, 0.216552734375, 0.4322509765625, 0.64794921875, 0.8636474609375, 1.079345703125, 1.2950439453125, 1.5107421875, 1.7264404296875, 1.942138671875, 2.1578369140625, 2.37353515625, 2.5892333984375, 2.804931640625, 3.0206298828125, 3.236328125, 3.4520263671875, 3.667724609375, 3.8834228515625, 4.09912109375, 4.3148193359375, 4.530517578125, 4.7462158203125, 4.9619140625, 5.1776123046875, 5.393310546875, 5.6090087890625, 5.82470703125, 6.0404052734375, 6.256103515625, 6.4718017578125, 6.6875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 2.0, 9.0, 8.0, 7.0, 11.0, 18.0, 10.0, 15.0, 20.0, 34.0, 21.0, 48.0, 60.0, 79.0, 81.0, 97.0, 94.0, 73.0, 66.0, 47.0, 33.0, 30.0, 24.0, 20.0, 21.0, 10.0, 9.0, 9.0, 8.0, 7.0, 11.0, 1.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.26385498046875, -4.1097412109375, -3.95562744140625, -3.801513671875, -3.64739990234375, -3.4932861328125, -3.33917236328125, -3.18505859375, -3.03094482421875, -2.8768310546875, -2.72271728515625, -2.568603515625, -2.41448974609375, -2.2603759765625, -2.10626220703125, -1.9521484375, -1.79803466796875, -1.6439208984375, -1.48980712890625, -1.335693359375, -1.18157958984375, -1.0274658203125, -0.87335205078125, -0.71923828125, -0.56512451171875, -0.4110107421875, -0.25689697265625, -0.102783203125, 0.05133056640625, 0.2054443359375, 0.35955810546875, 0.513671875, 0.66778564453125, 0.8218994140625, 0.97601318359375, 1.130126953125, 1.28424072265625, 1.4383544921875, 1.59246826171875, 1.74658203125, 1.90069580078125, 2.0548095703125, 2.20892333984375, 2.363037109375, 2.51715087890625, 2.6712646484375, 2.82537841796875, 2.9794921875, 3.13360595703125, 3.2877197265625, 3.44183349609375, 3.595947265625, 3.75006103515625, 3.9041748046875, 4.05828857421875, 4.21240234375, 4.36651611328125, 4.5206298828125, 4.67474365234375, 4.828857421875, 4.98297119140625, 5.1370849609375, 5.29119873046875, 5.4453125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 19.0, 24.0, 59.0, 78.0, 143.0, 256.0, 129.0, 112.0, 61.0, 43.0, 23.0, 12.0, 8.0, 2.0, 8.0, 2.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-125.44071960449219, -121.80831146240234, -118.1759033203125, -114.54348754882812, -110.91107940673828, -107.27867126464844, -103.6462631225586, -100.01385498046875, -96.38143920898438, -92.74903106689453, -89.11662292480469, -85.48420715332031, -81.85179901123047, -78.21939086914062, -74.58698272705078, -70.95457458496094, -67.32215881347656, -63.68975067138672, -60.05733871459961, -56.424930572509766, -52.792518615722656, -49.16011047363281, -45.52770233154297, -41.89529037475586, -38.26288604736328, -34.63047790527344, -30.998065948486328, -27.365657806396484, -23.733245849609375, -20.10083770751953, -16.468427658081055, -12.836017608642578, -9.203605651855469, -5.571195602416992, -1.9387860298156738, 1.6936235427856445, 5.326033592224121, 8.958442687988281, 12.590852737426758, 16.223262786865234, 19.85567283630371, 23.488082885742188, 27.120492935180664, 30.75290298461914, 34.385311126708984, 38.017723083496094, 41.65013122558594, 45.28253936767578, 48.91495132446289, 52.547359466552734, 56.179771423339844, 59.81217956542969, 63.4445915222168, 67.07699584960938, 70.70941162109375, 74.3418197631836, 77.97422790527344, 81.60663604736328, 85.23904418945312, 88.8714599609375, 92.50386810302734, 96.13627624511719, 99.76868438720703, 103.40109252929688, 107.03350830078125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 3.0, 5.0, 4.0, 10.0, 14.0, 11.0, 14.0, 15.0, 20.0, 20.0, 26.0, 39.0, 37.0, 39.0, 46.0, 35.0, 48.0, 58.0, 76.0, 73.0, 60.0, 37.0, 50.0, 40.0, 23.0, 27.0, 24.0, 22.0, 18.0, 26.0, 11.0, 18.0, 12.0, 6.0, 11.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.79644012451172, -73.5357437133789, -71.27505493164062, -69.01435852050781, -66.753662109375, -64.49296569824219, -62.232276916503906, -59.971580505371094, -57.71088790893555, -55.4501953125, -53.18949890136719, -50.92880630493164, -48.668113708496094, -46.40741729736328, -44.146724700927734, -41.88603210449219, -39.625335693359375, -37.36464309692383, -35.103946685791016, -32.84325408935547, -30.58255958557129, -28.32186508178711, -26.061172485351562, -23.800477981567383, -21.539783477783203, -19.279088973999023, -17.018394470214844, -14.757701873779297, -12.497007369995117, -10.236312866210938, -7.975619316101074, -5.714925765991211, -3.4542388916015625, -1.193544864654541, 1.0671491622924805, 3.327843189239502, 5.588537216186523, 7.849231719970703, 10.109925270080566, 12.37061882019043, 14.63131332397461, 16.89200782775879, 19.15270233154297, 21.413394927978516, 23.674089431762695, 25.934783935546875, 28.195476531982422, 30.4561710357666, 32.71686553955078, 34.97755813598633, 37.23825454711914, 39.49894714355469, 41.7596435546875, 44.02033615112305, 46.281028747558594, 48.541725158691406, 50.80241775512695, 53.0631103515625, 55.32380676269531, 57.58449935913086, 59.845191955566406, 62.10588836669922, 64.36658477783203, 66.62727355957031, 68.88796997070312]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 12.0, 13.0, 41.0, 53.0, 90.0, 132.0, 260.0, 534.0, 945.0, 2000.0, 4383.0, 10554.0, 29841.0, 111032.0, 785593.0, 2587079.0, 537416.0, 84029.0, 23683.0, 8888.0, 3805.0, 1817.0, 912.0, 490.0, 270.0, 137.0, 81.0, 62.0, 39.0, 29.0, 12.0, 10.0, 10.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.3082275390625, -6.100830078125, -5.8934326171875, -5.68603515625, -5.4786376953125, -5.271240234375, -5.0638427734375, -4.8564453125, -4.6490478515625, -4.441650390625, -4.2342529296875, -4.02685546875, -3.8194580078125, -3.612060546875, -3.4046630859375, -3.197265625, -2.9898681640625, -2.782470703125, -2.5750732421875, -2.36767578125, -2.1602783203125, -1.952880859375, -1.7454833984375, -1.5380859375, -1.3306884765625, -1.123291015625, -0.9158935546875, -0.70849609375, -0.5010986328125, -0.293701171875, -0.0863037109375, 0.12109375, 0.3284912109375, 0.535888671875, 0.7432861328125, 0.95068359375, 1.1580810546875, 1.365478515625, 1.5728759765625, 1.7802734375, 1.9876708984375, 2.195068359375, 2.4024658203125, 2.60986328125, 2.8172607421875, 3.024658203125, 3.2320556640625, 3.439453125, 3.6468505859375, 3.854248046875, 4.0616455078125, 4.26904296875, 4.4764404296875, 4.683837890625, 4.8912353515625, 5.0986328125, 5.3060302734375, 5.513427734375, 5.7208251953125, 5.92822265625, 6.1356201171875, 6.343017578125, 6.5504150390625, 6.7578125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 7.0, 8.0, 4.0, 9.0, 10.0, 12.0, 17.0, 12.0, 21.0, 18.0, 19.0, 30.0, 32.0, 30.0, 32.0, 33.0, 33.0, 34.0, 28.0, 39.0, 46.0, 36.0, 38.0, 34.0, 39.0, 44.0, 33.0, 34.0, 35.0, 26.0, 25.0, 31.0, 15.0, 19.0, 11.0, 18.0, 23.0, 11.0, 7.0, 8.0, 10.0, 5.0, 1.0, 3.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.2578125, -3.156463623046875, -3.05511474609375, -2.953765869140625, -2.8524169921875, -2.751068115234375, -2.64971923828125, -2.548370361328125, -2.447021484375, -2.345672607421875, -2.24432373046875, -2.142974853515625, -2.0416259765625, -1.940277099609375, -1.83892822265625, -1.737579345703125, -1.63623046875, -1.534881591796875, -1.43353271484375, -1.332183837890625, -1.2308349609375, -1.129486083984375, -1.02813720703125, -0.926788330078125, -0.825439453125, -0.724090576171875, -0.62274169921875, -0.521392822265625, -0.4200439453125, -0.318695068359375, -0.21734619140625, -0.115997314453125, -0.0146484375, 0.086700439453125, 0.18804931640625, 0.289398193359375, 0.3907470703125, 0.492095947265625, 0.59344482421875, 0.694793701171875, 0.796142578125, 0.897491455078125, 0.99884033203125, 1.100189208984375, 1.2015380859375, 1.302886962890625, 1.40423583984375, 1.505584716796875, 1.60693359375, 1.708282470703125, 1.80963134765625, 1.910980224609375, 2.0123291015625, 2.113677978515625, 2.21502685546875, 2.316375732421875, 2.417724609375, 2.519073486328125, 2.62042236328125, 2.721771240234375, 2.8231201171875, 2.924468994140625, 3.02581787109375, 3.127166748046875, 3.228515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 8.0, 20.0, 30.0, 46.0, 91.0, 153.0, 267.0, 647.0, 2071.0, 9737.0, 115701.0, 3874237.0, 175996.0, 11564.0, 2120.0, 747.0, 331.0, 166.0, 118.0, 61.0, 59.0, 38.0, 16.0, 13.0, 9.0, 8.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.51806640625, -20.7080078125, -19.89794921875, -19.087890625, -18.27783203125, -17.4677734375, -16.65771484375, -15.84765625, -15.03759765625, -14.2275390625, -13.41748046875, -12.607421875, -11.79736328125, -10.9873046875, -10.17724609375, -9.3671875, -8.55712890625, -7.7470703125, -6.93701171875, -6.126953125, -5.31689453125, -4.5068359375, -3.69677734375, -2.88671875, -2.07666015625, -1.2666015625, -0.45654296875, 0.353515625, 1.16357421875, 1.9736328125, 2.78369140625, 3.59375, 4.40380859375, 5.2138671875, 6.02392578125, 6.833984375, 7.64404296875, 8.4541015625, 9.26416015625, 10.07421875, 10.88427734375, 11.6943359375, 12.50439453125, 13.314453125, 14.12451171875, 14.9345703125, 15.74462890625, 16.5546875, 17.36474609375, 18.1748046875, 18.98486328125, 19.794921875, 20.60498046875, 21.4150390625, 22.22509765625, 23.03515625, 23.84521484375, 24.6552734375, 25.46533203125, 26.275390625, 27.08544921875, 27.8955078125, 28.70556640625, 29.515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 1.0, 1.0, 13.0, 12.0, 29.0, 21.0, 40.0, 71.0, 145.0, 283.0, 644.0, 1262.0, 852.0, 350.0, 162.0, 73.0, 41.0, 29.0, 13.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.16552734375, -18.4716796875, -17.77783203125, -17.083984375, -16.39013671875, -15.6962890625, -15.00244140625, -14.30859375, -13.61474609375, -12.9208984375, -12.22705078125, -11.533203125, -10.83935546875, -10.1455078125, -9.45166015625, -8.7578125, -8.06396484375, -7.3701171875, -6.67626953125, -5.982421875, -5.28857421875, -4.5947265625, -3.90087890625, -3.20703125, -2.51318359375, -1.8193359375, -1.12548828125, -0.431640625, 0.26220703125, 0.9560546875, 1.64990234375, 2.34375, 3.03759765625, 3.7314453125, 4.42529296875, 5.119140625, 5.81298828125, 6.5068359375, 7.20068359375, 7.89453125, 8.58837890625, 9.2822265625, 9.97607421875, 10.669921875, 11.36376953125, 12.0576171875, 12.75146484375, 13.4453125, 14.13916015625, 14.8330078125, 15.52685546875, 16.220703125, 16.91455078125, 17.6083984375, 18.30224609375, 18.99609375, 19.68994140625, 20.3837890625, 21.07763671875, 21.771484375, 22.46533203125, 23.1591796875, 23.85302734375, 24.546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 11.0, 18.0, 55.0, 214.0, 376.0, 238.0, 56.0, 13.0, 5.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-343.9481506347656, -334.5206298828125, -325.0931091308594, -315.66558837890625, -306.2380676269531, -296.810546875, -287.3830261230469, -277.95550537109375, -268.5279541015625, -259.1004333496094, -249.67291259765625, -240.24539184570312, -230.81787109375, -221.39035034179688, -211.9628143310547, -202.53529357910156, -193.1077880859375, -183.68026733398438, -174.25274658203125, -164.82522583007812, -155.397705078125, -145.97018432617188, -136.5426483154297, -127.11512756347656, -117.68760681152344, -108.26008605957031, -98.83256530761719, -89.40503692626953, -79.9775161743164, -70.54999542236328, -61.12247085571289, -51.6949462890625, -42.267425537109375, -32.83990478515625, -23.41238021850586, -13.984857559204102, -4.557334899902344, 4.870185852050781, 14.297710418701172, 23.725234985351562, 33.15275573730469, 42.58027648925781, 52.0078010559082, 61.435325622558594, 70.86284637451172, 80.29036712646484, 89.7178955078125, 99.14541625976562, 108.57293701171875, 118.00045776367188, 127.427978515625, 136.85549926757812, 146.28302001953125, 155.71054077148438, 165.13807678222656, 174.5655975341797, 183.9931182861328, 193.42063903808594, 202.84815979003906, 212.2756805419922, 221.70321655273438, 231.1307373046875, 240.55825805664062, 249.98577880859375, 259.4132995605469]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 10.0, 8.0, 10.0, 15.0, 16.0, 21.0, 16.0, 19.0, 21.0, 34.0, 34.0, 35.0, 32.0, 38.0, 37.0, 46.0, 55.0, 40.0, 49.0, 44.0, 42.0, 50.0, 45.0, 45.0, 32.0, 23.0, 33.0, 22.0, 21.0, 23.0, 19.0, 14.0, 9.0, 9.0, 7.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-68.45194244384766, -66.40643310546875, -64.36093139648438, -62.315425872802734, -60.269920349121094, -58.22441101074219, -56.17890548706055, -54.133399963378906, -52.087894439697266, -50.042388916015625, -47.996883392333984, -45.951377868652344, -43.90586853027344, -41.86036682128906, -39.814857482910156, -37.769351959228516, -35.723846435546875, -33.678340911865234, -31.632835388183594, -29.58732795715332, -27.54182243347168, -25.49631690979004, -23.450809478759766, -21.405303955078125, -19.359798431396484, -17.314292907714844, -15.268786430358887, -13.22327995300293, -11.177774429321289, -9.132268905639648, -7.086762428283691, -5.041255950927734, -2.995746612548828, -0.9502406120300293, 1.0952653884887695, 3.1407713890075684, 5.186277389526367, 7.231782913208008, 9.277289390563965, 11.322795867919922, 13.368301391601562, 15.413806915283203, 17.459312438964844, 19.504819869995117, 21.550325393676758, 23.5958309173584, 25.641338348388672, 27.686843872070312, 29.732349395751953, 31.777854919433594, 33.823360443115234, 35.868865966796875, 37.91437530517578, 39.959877014160156, 42.00538635253906, 44.0508918762207, 46.096397399902344, 48.141902923583984, 50.187408447265625, 52.232913970947266, 54.278419494628906, 56.32392883300781, 58.36943435668945, 60.414939880371094, 62.460445404052734]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 10.0, 5.0, 14.0, 13.0, 24.0, 29.0, 43.0, 68.0, 86.0, 152.0, 203.0, 336.0, 503.0, 841.0, 1398.0, 2286.0, 4147.0, 8403.0, 18840.0, 52679.0, 166773.0, 405314.0, 254989.0, 80495.0, 27106.0, 11159.0, 5359.0, 2857.0, 1657.0, 995.0, 595.0, 360.0, 250.0, 156.0, 117.0, 82.0, 61.0, 47.0, 23.0, 13.0, 16.0, 8.0, 7.0, 7.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.38671875, -6.1851806640625, -5.983642578125, -5.7821044921875, -5.58056640625, -5.3790283203125, -5.177490234375, -4.9759521484375, -4.7744140625, -4.5728759765625, -4.371337890625, -4.1697998046875, -3.96826171875, -3.7667236328125, -3.565185546875, -3.3636474609375, -3.162109375, -2.9605712890625, -2.759033203125, -2.5574951171875, -2.35595703125, -2.1544189453125, -1.952880859375, -1.7513427734375, -1.5498046875, -1.3482666015625, -1.146728515625, -0.9451904296875, -0.74365234375, -0.5421142578125, -0.340576171875, -0.1390380859375, 0.0625, 0.2640380859375, 0.465576171875, 0.6671142578125, 0.86865234375, 1.0701904296875, 1.271728515625, 1.4732666015625, 1.6748046875, 1.8763427734375, 2.077880859375, 2.2794189453125, 2.48095703125, 2.6824951171875, 2.884033203125, 3.0855712890625, 3.287109375, 3.4886474609375, 3.690185546875, 3.8917236328125, 4.09326171875, 4.2947998046875, 4.496337890625, 4.6978759765625, 4.8994140625, 5.1009521484375, 5.302490234375, 5.5040283203125, 5.70556640625, 5.9071044921875, 6.108642578125, 6.3101806640625, 6.51171875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 1.0, 10.0, 9.0, 11.0, 10.0, 9.0, 10.0, 23.0, 30.0, 26.0, 34.0, 19.0, 40.0, 41.0, 41.0, 25.0, 46.0, 51.0, 41.0, 62.0, 40.0, 54.0, 37.0, 34.0, 34.0, 31.0, 36.0, 27.0, 30.0, 27.0, 15.0, 14.0, 12.0, 10.0, 15.0, 11.0, 5.0, 4.0, 3.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.87890625, -4.73516845703125, -4.5914306640625, -4.44769287109375, -4.303955078125, -4.16021728515625, -4.0164794921875, -3.87274169921875, -3.72900390625, -3.58526611328125, -3.4415283203125, -3.29779052734375, -3.154052734375, -3.01031494140625, -2.8665771484375, -2.72283935546875, -2.5791015625, -2.43536376953125, -2.2916259765625, -2.14788818359375, -2.004150390625, -1.86041259765625, -1.7166748046875, -1.57293701171875, -1.42919921875, -1.28546142578125, -1.1417236328125, -0.99798583984375, -0.854248046875, -0.71051025390625, -0.5667724609375, -0.42303466796875, -0.279296875, -0.13555908203125, 0.0081787109375, 0.15191650390625, 0.295654296875, 0.43939208984375, 0.5831298828125, 0.72686767578125, 0.87060546875, 1.01434326171875, 1.1580810546875, 1.30181884765625, 1.445556640625, 1.58929443359375, 1.7330322265625, 1.87677001953125, 2.0205078125, 2.16424560546875, 2.3079833984375, 2.45172119140625, 2.595458984375, 2.73919677734375, 2.8829345703125, 3.02667236328125, 3.17041015625, 3.31414794921875, 3.4578857421875, 3.60162353515625, 3.745361328125, 3.88909912109375, 4.0328369140625, 4.17657470703125, 4.3203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 2.0, 4.0, 9.0, 11.0, 12.0, 30.0, 30.0, 56.0, 68.0, 137.0, 242.0, 436.0, 924.0, 2151.0, 6900.0, 35874.0, 610699.0, 352139.0, 28975.0, 6105.0, 2004.0, 833.0, 381.0, 209.0, 108.0, 74.0, 54.0, 21.0, 18.0, 11.0, 7.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.5, -16.9844970703125, -16.468994140625, -15.9534912109375, -15.43798828125, -14.9224853515625, -14.406982421875, -13.8914794921875, -13.3759765625, -12.8604736328125, -12.344970703125, -11.8294677734375, -11.31396484375, -10.7984619140625, -10.282958984375, -9.7674560546875, -9.251953125, -8.7364501953125, -8.220947265625, -7.7054443359375, -7.18994140625, -6.6744384765625, -6.158935546875, -5.6434326171875, -5.1279296875, -4.6124267578125, -4.096923828125, -3.5814208984375, -3.06591796875, -2.5504150390625, -2.034912109375, -1.5194091796875, -1.00390625, -0.4884033203125, 0.027099609375, 0.5426025390625, 1.05810546875, 1.5736083984375, 2.089111328125, 2.6046142578125, 3.1201171875, 3.6356201171875, 4.151123046875, 4.6666259765625, 5.18212890625, 5.6976318359375, 6.213134765625, 6.7286376953125, 7.244140625, 7.7596435546875, 8.275146484375, 8.7906494140625, 9.30615234375, 9.8216552734375, 10.337158203125, 10.8526611328125, 11.3681640625, 11.8836669921875, 12.399169921875, 12.9146728515625, 13.43017578125, 13.9456787109375, 14.461181640625, 14.9766845703125, 15.4921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 2.0, 6.0, 18.0, 9.0, 19.0, 17.0, 15.0, 23.0, 23.0, 29.0, 34.0, 32.0, 46.0, 50.0, 47.0, 48.0, 47.0, 44.0, 51.0, 51.0, 46.0, 50.0, 46.0, 37.0, 28.0, 33.0, 20.0, 15.0, 16.0, 12.0, 12.0, 12.0, 15.0, 7.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.609375, -16.97802734375, -16.3466796875, -15.71533203125, -15.083984375, -14.45263671875, -13.8212890625, -13.18994140625, -12.55859375, -11.92724609375, -11.2958984375, -10.66455078125, -10.033203125, -9.40185546875, -8.7705078125, -8.13916015625, -7.5078125, -6.87646484375, -6.2451171875, -5.61376953125, -4.982421875, -4.35107421875, -3.7197265625, -3.08837890625, -2.45703125, -1.82568359375, -1.1943359375, -0.56298828125, 0.068359375, 0.69970703125, 1.3310546875, 1.96240234375, 2.59375, 3.22509765625, 3.8564453125, 4.48779296875, 5.119140625, 5.75048828125, 6.3818359375, 7.01318359375, 7.64453125, 8.27587890625, 8.9072265625, 9.53857421875, 10.169921875, 10.80126953125, 11.4326171875, 12.06396484375, 12.6953125, 13.32666015625, 13.9580078125, 14.58935546875, 15.220703125, 15.85205078125, 16.4833984375, 17.11474609375, 17.74609375, 18.37744140625, 19.0087890625, 19.64013671875, 20.271484375, 20.90283203125, 21.5341796875, 22.16552734375, 22.796875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 8.0, 11.0, 21.0, 27.0, 46.0, 43.0, 70.0, 119.0, 220.0, 423.0, 715.0, 1224.0, 2248.0, 4738.0, 11426.0, 35798.0, 166659.0, 651370.0, 125749.0, 28706.0, 9934.0, 4190.0, 2115.0, 1098.0, 670.0, 385.0, 192.0, 125.0, 87.0, 47.0, 28.0, 30.0, 7.0, 8.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4296875, -4.27911376953125, -4.1285400390625, -3.97796630859375, -3.827392578125, -3.67681884765625, -3.5262451171875, -3.37567138671875, -3.22509765625, -3.07452392578125, -2.9239501953125, -2.77337646484375, -2.622802734375, -2.47222900390625, -2.3216552734375, -2.17108154296875, -2.0205078125, -1.86993408203125, -1.7193603515625, -1.56878662109375, -1.418212890625, -1.26763916015625, -1.1170654296875, -0.96649169921875, -0.81591796875, -0.66534423828125, -0.5147705078125, -0.36419677734375, -0.213623046875, -0.06304931640625, 0.0875244140625, 0.23809814453125, 0.388671875, 0.53924560546875, 0.6898193359375, 0.84039306640625, 0.990966796875, 1.14154052734375, 1.2921142578125, 1.44268798828125, 1.59326171875, 1.74383544921875, 1.8944091796875, 2.04498291015625, 2.195556640625, 2.34613037109375, 2.4967041015625, 2.64727783203125, 2.7978515625, 2.94842529296875, 3.0989990234375, 3.24957275390625, 3.400146484375, 3.55072021484375, 3.7012939453125, 3.85186767578125, 4.00244140625, 4.15301513671875, 4.3035888671875, 4.45416259765625, 4.604736328125, 4.75531005859375, 4.9058837890625, 5.05645751953125, 5.20703125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 12.0, 3.0, 5.0, 7.0, 20.0, 26.0, 43.0, 84.0, 128.0, 156.0, 193.0, 111.0, 78.0, 42.0, 31.0, 15.0, 13.0, 8.0, 7.0, 6.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0022735595703125, -0.002204328775405884, -0.0021350979804992676, -0.0020658671855926514, -0.001996636390686035, -0.001927405595779419, -0.0018581748008728027, -0.0017889440059661865, -0.0017197132110595703, -0.001650482416152954, -0.0015812516212463379, -0.0015120208263397217, -0.0014427900314331055, -0.0013735592365264893, -0.001304328441619873, -0.0012350976467132568, -0.0011658668518066406, -0.0010966360569000244, -0.0010274052619934082, -0.000958174467086792, -0.0008889436721801758, -0.0008197128772735596, -0.0007504820823669434, -0.0006812512874603271, -0.0006120204925537109, -0.0005427896976470947, -0.0004735589027404785, -0.0004043281078338623, -0.0003350973129272461, -0.0002658665180206299, -0.00019663572311401367, -0.00012740492820739746, -5.817413330078125e-05, 1.1056661605834961e-05, 8.028745651245117e-05, 0.00014951825141906738, 0.0002187490463256836, 0.0002879798412322998, 0.000357210636138916, 0.0004264414310455322, 0.0004956722259521484, 0.0005649030208587646, 0.0006341338157653809, 0.0007033646106719971, 0.0007725954055786133, 0.0008418262004852295, 0.0009110569953918457, 0.000980287790298462, 0.0010495185852050781, 0.0011187493801116943, 0.0011879801750183105, 0.0012572109699249268, 0.001326441764831543, 0.0013956725597381592, 0.0014649033546447754, 0.0015341341495513916, 0.0016033649444580078, 0.001672595739364624, 0.0017418265342712402, 0.0018110573291778564, 0.0018802881240844727, 0.0019495189189910889, 0.002018749713897705, 0.0020879805088043213, 0.0021572113037109375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 16.0, 18.0, 28.0, 38.0, 78.0, 92.0, 176.0, 302.0, 564.0, 925.0, 2081.0, 4786.0, 12234.0, 37985.0, 158573.0, 619968.0, 153059.0, 36828.0, 11758.0, 4645.0, 2076.0, 983.0, 571.0, 259.0, 172.0, 109.0, 78.0, 39.0, 27.0, 10.0, 13.0, 8.0, 10.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.18511962890625, -4.0382080078125, -3.89129638671875, -3.744384765625, -3.59747314453125, -3.4505615234375, -3.30364990234375, -3.15673828125, -3.00982666015625, -2.8629150390625, -2.71600341796875, -2.569091796875, -2.42218017578125, -2.2752685546875, -2.12835693359375, -1.9814453125, -1.83453369140625, -1.6876220703125, -1.54071044921875, -1.393798828125, -1.24688720703125, -1.0999755859375, -0.95306396484375, -0.80615234375, -0.65924072265625, -0.5123291015625, -0.36541748046875, -0.218505859375, -0.07159423828125, 0.0753173828125, 0.22222900390625, 0.369140625, 0.51605224609375, 0.6629638671875, 0.80987548828125, 0.956787109375, 1.10369873046875, 1.2506103515625, 1.39752197265625, 1.54443359375, 1.69134521484375, 1.8382568359375, 1.98516845703125, 2.132080078125, 2.27899169921875, 2.4259033203125, 2.57281494140625, 2.7197265625, 2.86663818359375, 3.0135498046875, 3.16046142578125, 3.307373046875, 3.45428466796875, 3.6011962890625, 3.74810791015625, 3.89501953125, 4.04193115234375, 4.1888427734375, 4.33575439453125, 4.482666015625, 4.62957763671875, 4.7764892578125, 4.92340087890625, 5.0703125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 9.0, 7.0, 24.0, 13.0, 11.0, 28.0, 52.0, 54.0, 75.0, 61.0, 87.0, 87.0, 98.0, 70.0, 65.0, 56.0, 48.0, 36.0, 29.0, 24.0, 8.0, 8.0, 7.0, 6.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.06640625, -4.91937255859375, -4.7723388671875, -4.62530517578125, -4.478271484375, -4.33123779296875, -4.1842041015625, -4.03717041015625, -3.89013671875, -3.74310302734375, -3.5960693359375, -3.44903564453125, -3.302001953125, -3.15496826171875, -3.0079345703125, -2.86090087890625, -2.7138671875, -2.56683349609375, -2.4197998046875, -2.27276611328125, -2.125732421875, -1.97869873046875, -1.8316650390625, -1.68463134765625, -1.53759765625, -1.39056396484375, -1.2435302734375, -1.09649658203125, -0.949462890625, -0.80242919921875, -0.6553955078125, -0.50836181640625, -0.361328125, -0.21429443359375, -0.0672607421875, 0.07977294921875, 0.226806640625, 0.37384033203125, 0.5208740234375, 0.66790771484375, 0.81494140625, 0.96197509765625, 1.1090087890625, 1.25604248046875, 1.403076171875, 1.55010986328125, 1.6971435546875, 1.84417724609375, 1.9912109375, 2.13824462890625, 2.2852783203125, 2.43231201171875, 2.579345703125, 2.72637939453125, 2.8734130859375, 3.02044677734375, 3.16748046875, 3.31451416015625, 3.4615478515625, 3.60858154296875, 3.755615234375, 3.90264892578125, 4.0496826171875, 4.19671630859375, 4.34375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 20.0, 43.0, 75.0, 154.0, 289.0, 202.0, 94.0, 45.0, 22.0, 18.0, 7.0, 5.0, 0.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.7164306640625, -93.60334014892578, -89.49024963378906, -85.37715148925781, -81.2640609741211, -77.15097045898438, -73.03787231445312, -68.9247817993164, -64.81169128417969, -60.69860076904297, -56.585506439208984, -52.472412109375, -48.35932159423828, -44.24623107910156, -40.13313674926758, -36.020042419433594, -31.906951904296875, -27.793859481811523, -23.680767059326172, -19.56767463684082, -15.454582214355469, -11.341489791870117, -7.228397369384766, -3.115304946899414, 0.9977874755859375, 5.110879898071289, 9.22397232055664, 13.337064743041992, 17.450157165527344, 21.563249588012695, 25.676342010498047, 29.7894344329834, 33.90252685546875, 38.01561737060547, 42.12871170043945, 46.24180603027344, 50.354896545410156, 54.467987060546875, 58.58108139038086, 62.694175720214844, 66.80726623535156, 70.92035675048828, 75.033447265625, 79.14654541015625, 83.25963592529297, 87.37272644042969, 91.48582458496094, 95.59891510009766, 99.71200561523438, 103.8250961303711, 107.93818664550781, 112.05128479003906, 116.16437530517578, 120.2774658203125, 124.39056396484375, 128.50364685058594, 132.6167449951172, 136.72984313964844, 140.84292602539062, 144.95602416992188, 149.06912231445312, 153.1822052001953, 157.29530334472656, 161.40838623046875, 165.521484375]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 3.0, 6.0, 6.0, 6.0, 7.0, 14.0, 15.0, 18.0, 10.0, 19.0, 21.0, 30.0, 32.0, 25.0, 25.0, 31.0, 40.0, 47.0, 73.0, 81.0, 72.0, 56.0, 58.0, 46.0, 33.0, 31.0, 27.0, 27.0, 25.0, 21.0, 16.0, 10.0, 12.0, 10.0, 10.0, 7.0, 7.0, 8.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.0448226928711, -75.50323486328125, -72.96163940429688, -70.42005157470703, -67.87845611572266, -65.33686828613281, -62.7952766418457, -60.253684997558594, -57.712093353271484, -55.170501708984375, -52.628910064697266, -50.087318420410156, -47.54573059082031, -45.00413513183594, -42.462547302246094, -39.920955657958984, -37.379364013671875, -34.837772369384766, -32.296180725097656, -29.75459098815918, -27.21299934387207, -24.67140769958496, -22.129817962646484, -19.588226318359375, -17.046634674072266, -14.505043029785156, -11.963452339172363, -9.42186164855957, -6.880270004272461, -4.338678359985352, -1.7970876693725586, 0.7445030212402344, 3.2860946655273438, 5.827685832977295, 8.369277000427246, 10.910867691040039, 13.452459335327148, 15.994050979614258, 18.535640716552734, 21.077232360839844, 23.618824005126953, 26.160415649414062, 28.702007293701172, 31.24359703063965, 33.785186767578125, 36.3267822265625, 38.868370056152344, 41.40996170043945, 43.95155334472656, 46.49314498901367, 49.03473663330078, 51.57632827758789, 54.117919921875, 56.659507751464844, 59.20109939575195, 61.74269104003906, 64.28428649902344, 66.82587432861328, 69.36746978759766, 71.9090576171875, 74.45065307617188, 76.99224090576172, 79.5338363647461, 82.07542419433594, 84.61701202392578]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 7.0, 14.0, 16.0, 26.0, 37.0, 44.0, 97.0, 136.0, 203.0, 378.0, 776.0, 1326.0, 2583.0, 5434.0, 12464.0, 34293.0, 138100.0, 849640.0, 2384883.0, 609903.0, 105786.0, 27706.0, 10523.0, 4636.0, 2321.0, 1225.0, 683.0, 390.0, 216.0, 144.0, 92.0, 59.0, 44.0, 22.0, 22.0, 20.0, 9.0, 11.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.58203125, -6.37896728515625, -6.1759033203125, -5.97283935546875, -5.769775390625, -5.56671142578125, -5.3636474609375, -5.16058349609375, -4.95751953125, -4.75445556640625, -4.5513916015625, -4.34832763671875, -4.145263671875, -3.94219970703125, -3.7391357421875, -3.53607177734375, -3.3330078125, -3.12994384765625, -2.9268798828125, -2.72381591796875, -2.520751953125, -2.31768798828125, -2.1146240234375, -1.91156005859375, -1.70849609375, -1.50543212890625, -1.3023681640625, -1.09930419921875, -0.896240234375, -0.69317626953125, -0.4901123046875, -0.28704833984375, -0.083984375, 0.11907958984375, 0.3221435546875, 0.52520751953125, 0.728271484375, 0.93133544921875, 1.1343994140625, 1.33746337890625, 1.54052734375, 1.74359130859375, 1.9466552734375, 2.14971923828125, 2.352783203125, 2.55584716796875, 2.7589111328125, 2.96197509765625, 3.1650390625, 3.36810302734375, 3.5711669921875, 3.77423095703125, 3.977294921875, 4.18035888671875, 4.3834228515625, 4.58648681640625, 4.78955078125, 4.99261474609375, 5.1956787109375, 5.39874267578125, 5.601806640625, 5.80487060546875, 6.0079345703125, 6.21099853515625, 6.4140625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 7.0, 15.0, 10.0, 10.0, 17.0, 20.0, 25.0, 31.0, 33.0, 34.0, 37.0, 60.0, 59.0, 46.0, 60.0, 59.0, 55.0, 53.0, 58.0, 51.0, 26.0, 46.0, 39.0, 27.0, 30.0, 23.0, 15.0, 7.0, 18.0, 7.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.17803955078125, -4.0006103515625, -3.82318115234375, -3.645751953125, -3.46832275390625, -3.2908935546875, -3.11346435546875, -2.93603515625, -2.75860595703125, -2.5811767578125, -2.40374755859375, -2.226318359375, -2.04888916015625, -1.8714599609375, -1.69403076171875, -1.5166015625, -1.33917236328125, -1.1617431640625, -0.98431396484375, -0.806884765625, -0.62945556640625, -0.4520263671875, -0.27459716796875, -0.09716796875, 0.08026123046875, 0.2576904296875, 0.43511962890625, 0.612548828125, 0.78997802734375, 0.9674072265625, 1.14483642578125, 1.322265625, 1.49969482421875, 1.6771240234375, 1.85455322265625, 2.031982421875, 2.20941162109375, 2.3868408203125, 2.56427001953125, 2.74169921875, 2.91912841796875, 3.0965576171875, 3.27398681640625, 3.451416015625, 3.62884521484375, 3.8062744140625, 3.98370361328125, 4.1611328125, 4.33856201171875, 4.5159912109375, 4.69342041015625, 4.870849609375, 5.04827880859375, 5.2257080078125, 5.40313720703125, 5.58056640625, 5.75799560546875, 5.9354248046875, 6.11285400390625, 6.290283203125, 6.46771240234375, 6.6451416015625, 6.82257080078125, 7.0]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 11.0, 14.0, 19.0, 38.0, 102.0, 237.0, 828.0, 4525.0, 78788.0, 4046658.0, 57484.0, 4251.0, 873.0, 238.0, 103.0, 48.0, 29.0, 16.0, 8.0, 6.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.875, -40.62353515625, -39.3720703125, -38.12060546875, -36.869140625, -35.61767578125, -34.3662109375, -33.11474609375, -31.86328125, -30.61181640625, -29.3603515625, -28.10888671875, -26.857421875, -25.60595703125, -24.3544921875, -23.10302734375, -21.8515625, -20.60009765625, -19.3486328125, -18.09716796875, -16.845703125, -15.59423828125, -14.3427734375, -13.09130859375, -11.83984375, -10.58837890625, -9.3369140625, -8.08544921875, -6.833984375, -5.58251953125, -4.3310546875, -3.07958984375, -1.828125, -0.57666015625, 0.6748046875, 1.92626953125, 3.177734375, 4.42919921875, 5.6806640625, 6.93212890625, 8.18359375, 9.43505859375, 10.6865234375, 11.93798828125, 13.189453125, 14.44091796875, 15.6923828125, 16.94384765625, 18.1953125, 19.44677734375, 20.6982421875, 21.94970703125, 23.201171875, 24.45263671875, 25.7041015625, 26.95556640625, 28.20703125, 29.45849609375, 30.7099609375, 31.96142578125, 33.212890625, 34.46435546875, 35.7158203125, 36.96728515625, 38.21875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 5.0, 9.0, 25.0, 36.0, 50.0, 74.0, 132.0, 273.0, 714.0, 1158.0, 820.0, 369.0, 149.0, 87.0, 52.0, 29.0, 19.0, 16.0, 12.0, 9.0, 4.0, 9.0, 5.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.1038818359375, -12.434326171875, -11.7647705078125, -11.09521484375, -10.4256591796875, -9.756103515625, -9.0865478515625, -8.4169921875, -7.7474365234375, -7.077880859375, -6.4083251953125, -5.73876953125, -5.0692138671875, -4.399658203125, -3.7301025390625, -3.060546875, -2.3909912109375, -1.721435546875, -1.0518798828125, -0.38232421875, 0.2872314453125, 0.956787109375, 1.6263427734375, 2.2958984375, 2.9654541015625, 3.635009765625, 4.3045654296875, 4.97412109375, 5.6436767578125, 6.313232421875, 6.9827880859375, 7.65234375, 8.3218994140625, 8.991455078125, 9.6610107421875, 10.33056640625, 11.0001220703125, 11.669677734375, 12.3392333984375, 13.0087890625, 13.6783447265625, 14.347900390625, 15.0174560546875, 15.68701171875, 16.3565673828125, 17.026123046875, 17.6956787109375, 18.365234375, 19.0347900390625, 19.704345703125, 20.3739013671875, 21.04345703125, 21.7130126953125, 22.382568359375, 23.0521240234375, 23.7216796875, 24.3912353515625, 25.060791015625, 25.7303466796875, 26.39990234375, 27.0694580078125, 27.739013671875, 28.4085693359375, 29.078125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 13.0, 14.0, 40.0, 129.0, 202.0, 248.0, 182.0, 87.0, 37.0, 19.0, 10.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.34624481201172, -87.62030792236328, -80.89436340332031, -74.16842651367188, -67.44248962402344, -60.71654510498047, -53.99060821533203, -47.26466751098633, -40.538726806640625, -33.81278610229492, -27.08684730529785, -20.36090850830078, -13.634967803955078, -6.909027099609375, -0.1830902099609375, 6.542850494384766, 13.268791198730469, 19.994731903076172, 26.720670700073242, 33.44660949707031, 40.172550201416016, 46.89849090576172, 53.624427795410156, 60.35036849975586, 67.07630920410156, 73.80224609375, 80.52819061279297, 87.2541275024414, 93.98007202148438, 100.70600891113281, 107.43194580078125, 114.15788269042969, 120.88381958007812, 127.60975646972656, 134.335693359375, 141.0616455078125, 147.78758239746094, 154.51351928710938, 161.2394561767578, 167.96539306640625, 174.69134521484375, 181.4172821044922, 188.14321899414062, 194.86917114257812, 201.59510803222656, 208.321044921875, 215.04698181152344, 221.77291870117188, 228.4988555908203, 235.22479248046875, 241.9507293701172, 248.67666625976562, 255.40261840820312, 262.1285400390625, 268.8544921875, 275.5804443359375, 282.3063659667969, 289.0323181152344, 295.75823974609375, 302.48419189453125, 309.2101135253906, 315.9360656738281, 322.6619873046875, 329.387939453125, 336.1138916015625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 4.0, 5.0, 6.0, 15.0, 11.0, 16.0, 24.0, 25.0, 29.0, 37.0, 54.0, 42.0, 32.0, 44.0, 48.0, 40.0, 37.0, 50.0, 42.0, 39.0, 41.0, 37.0, 46.0, 39.0, 36.0, 34.0, 30.0, 30.0, 23.0, 25.0, 12.0, 10.0, 7.0, 5.0, 2.0, 6.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.89161682128906, -66.52911376953125, -64.16661834716797, -61.804115295410156, -59.44161605834961, -57.07911682128906, -54.71661376953125, -52.3541145324707, -49.991615295410156, -47.62911605834961, -45.2666130065918, -42.90411376953125, -40.5416145324707, -38.179115295410156, -35.816612243652344, -33.4541130065918, -31.091609954833984, -28.729108810424805, -26.366609573364258, -24.004108428955078, -21.64160919189453, -19.27910804748535, -16.916606903076172, -14.554107666015625, -12.191606521606445, -9.829106330871582, -7.4666056632995605, -5.104104995727539, -2.741604804992676, -0.3791046142578125, 1.9833965301513672, 4.345895767211914, 6.708396911621094, 9.070897102355957, 11.43339729309082, 13.7958984375, 16.158397674560547, 18.520898818969727, 20.883399963378906, 23.245899200439453, 25.608400344848633, 27.970901489257812, 30.33340072631836, 32.695899963378906, 35.05840301513672, 37.420902252197266, 39.78340148925781, 42.145904541015625, 44.50840377807617, 46.87090301513672, 49.23340606689453, 51.59590530395508, 53.958404541015625, 56.32090759277344, 58.683406829833984, 61.04590606689453, 63.408409118652344, 65.77091217041016, 68.13340759277344, 70.49591064453125, 72.85841369628906, 75.22090911865234, 77.58341217041016, 79.94590759277344, 82.30841064453125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 11.0, 17.0, 25.0, 38.0, 47.0, 58.0, 67.0, 125.0, 168.0, 232.0, 339.0, 468.0, 761.0, 1053.0, 1841.0, 3019.0, 5542.0, 10594.0, 21729.0, 53042.0, 149806.0, 381375.0, 261126.0, 89428.0, 34186.0, 15041.0, 7494.0, 4073.0, 2398.0, 1479.0, 930.0, 632.0, 432.0, 246.0, 213.0, 134.0, 109.0, 72.0, 46.0, 38.0, 29.0, 26.0, 17.0, 13.0, 10.0, 7.0, 6.0, 1.0, 3.0, 3.0], "bins": [-6.51953125, -6.33721923828125, -6.1549072265625, -5.97259521484375, -5.790283203125, -5.60797119140625, -5.4256591796875, -5.24334716796875, -5.06103515625, -4.87872314453125, -4.6964111328125, -4.51409912109375, -4.331787109375, -4.14947509765625, -3.9671630859375, -3.78485107421875, -3.6025390625, -3.42022705078125, -3.2379150390625, -3.05560302734375, -2.873291015625, -2.69097900390625, -2.5086669921875, -2.32635498046875, -2.14404296875, -1.96173095703125, -1.7794189453125, -1.59710693359375, -1.414794921875, -1.23248291015625, -1.0501708984375, -0.86785888671875, -0.685546875, -0.50323486328125, -0.3209228515625, -0.13861083984375, 0.043701171875, 0.22601318359375, 0.4083251953125, 0.59063720703125, 0.77294921875, 0.95526123046875, 1.1375732421875, 1.31988525390625, 1.502197265625, 1.68450927734375, 1.8668212890625, 2.04913330078125, 2.2314453125, 2.41375732421875, 2.5960693359375, 2.77838134765625, 2.960693359375, 3.14300537109375, 3.3253173828125, 3.50762939453125, 3.68994140625, 3.87225341796875, 4.0545654296875, 4.23687744140625, 4.419189453125, 4.60150146484375, 4.7838134765625, 4.96612548828125, 5.1484375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 13.0, 10.0, 14.0, 15.0, 17.0, 19.0, 20.0, 24.0, 35.0, 47.0, 42.0, 63.0, 50.0, 58.0, 80.0, 70.0, 60.0, 58.0, 46.0, 57.0, 38.0, 32.0, 29.0, 21.0, 19.0, 14.0, 16.0, 11.0, 4.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.19921875, -5.97735595703125, -5.7554931640625, -5.53363037109375, -5.311767578125, -5.08990478515625, -4.8680419921875, -4.64617919921875, -4.42431640625, -4.20245361328125, -3.9805908203125, -3.75872802734375, -3.536865234375, -3.31500244140625, -3.0931396484375, -2.87127685546875, -2.6494140625, -2.42755126953125, -2.2056884765625, -1.98382568359375, -1.761962890625, -1.54010009765625, -1.3182373046875, -1.09637451171875, -0.87451171875, -0.65264892578125, -0.4307861328125, -0.20892333984375, 0.012939453125, 0.23480224609375, 0.4566650390625, 0.67852783203125, 0.900390625, 1.12225341796875, 1.3441162109375, 1.56597900390625, 1.787841796875, 2.00970458984375, 2.2315673828125, 2.45343017578125, 2.67529296875, 2.89715576171875, 3.1190185546875, 3.34088134765625, 3.562744140625, 3.78460693359375, 4.0064697265625, 4.22833251953125, 4.4501953125, 4.67205810546875, 4.8939208984375, 5.11578369140625, 5.337646484375, 5.55950927734375, 5.7813720703125, 6.00323486328125, 6.22509765625, 6.44696044921875, 6.6688232421875, 6.89068603515625, 7.112548828125, 7.33441162109375, 7.5562744140625, 7.77813720703125, 8.0]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 13.0, 11.0, 19.0, 23.0, 31.0, 38.0, 87.0, 95.0, 166.0, 311.0, 532.0, 1145.0, 3051.0, 11898.0, 97317.0, 844555.0, 73966.0, 10206.0, 2778.0, 1025.0, 497.0, 290.0, 160.0, 100.0, 69.0, 58.0, 30.0, 19.0, 11.0, 11.0, 12.0, 6.0, 8.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.654541015625, -17.07470703125, -16.494873046875, -15.9150390625, -15.335205078125, -14.75537109375, -14.175537109375, -13.595703125, -13.015869140625, -12.43603515625, -11.856201171875, -11.2763671875, -10.696533203125, -10.11669921875, -9.536865234375, -8.95703125, -8.377197265625, -7.79736328125, -7.217529296875, -6.6376953125, -6.057861328125, -5.47802734375, -4.898193359375, -4.318359375, -3.738525390625, -3.15869140625, -2.578857421875, -1.9990234375, -1.419189453125, -0.83935546875, -0.259521484375, 0.3203125, 0.900146484375, 1.47998046875, 2.059814453125, 2.6396484375, 3.219482421875, 3.79931640625, 4.379150390625, 4.958984375, 5.538818359375, 6.11865234375, 6.698486328125, 7.2783203125, 7.858154296875, 8.43798828125, 9.017822265625, 9.59765625, 10.177490234375, 10.75732421875, 11.337158203125, 11.9169921875, 12.496826171875, 13.07666015625, 13.656494140625, 14.236328125, 14.816162109375, 15.39599609375, 15.975830078125, 16.5556640625, 17.135498046875, 17.71533203125, 18.295166015625, 18.875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 8.0, 8.0, 9.0, 9.0, 10.0, 13.0, 20.0, 12.0, 25.0, 25.0, 33.0, 36.0, 42.0, 44.0, 41.0, 56.0, 55.0, 88.0, 54.0, 63.0, 54.0, 51.0, 47.0, 33.0, 25.0, 31.0, 15.0, 21.0, 12.0, 15.0, 9.0, 10.0, 8.0, 2.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.15625, -23.3564453125, -22.556640625, -21.7568359375, -20.95703125, -20.1572265625, -19.357421875, -18.5576171875, -17.7578125, -16.9580078125, -16.158203125, -15.3583984375, -14.55859375, -13.7587890625, -12.958984375, -12.1591796875, -11.359375, -10.5595703125, -9.759765625, -8.9599609375, -8.16015625, -7.3603515625, -6.560546875, -5.7607421875, -4.9609375, -4.1611328125, -3.361328125, -2.5615234375, -1.76171875, -0.9619140625, -0.162109375, 0.6376953125, 1.4375, 2.2373046875, 3.037109375, 3.8369140625, 4.63671875, 5.4365234375, 6.236328125, 7.0361328125, 7.8359375, 8.6357421875, 9.435546875, 10.2353515625, 11.03515625, 11.8349609375, 12.634765625, 13.4345703125, 14.234375, 15.0341796875, 15.833984375, 16.6337890625, 17.43359375, 18.2333984375, 19.033203125, 19.8330078125, 20.6328125, 21.4326171875, 22.232421875, 23.0322265625, 23.83203125, 24.6318359375, 25.431640625, 26.2314453125, 27.03125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 10.0, 21.0, 15.0, 25.0, 47.0, 87.0, 118.0, 186.0, 351.0, 589.0, 1227.0, 2491.0, 6636.0, 21031.0, 100217.0, 742239.0, 133612.0, 25903.0, 7792.0, 2943.0, 1417.0, 687.0, 374.0, 212.0, 123.0, 70.0, 52.0, 23.0, 19.0, 12.0, 12.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6875, -4.51751708984375, -4.3475341796875, -4.17755126953125, -4.007568359375, -3.83758544921875, -3.6676025390625, -3.49761962890625, -3.32763671875, -3.15765380859375, -2.9876708984375, -2.81768798828125, -2.647705078125, -2.47772216796875, -2.3077392578125, -2.13775634765625, -1.9677734375, -1.79779052734375, -1.6278076171875, -1.45782470703125, -1.287841796875, -1.11785888671875, -0.9478759765625, -0.77789306640625, -0.60791015625, -0.43792724609375, -0.2679443359375, -0.09796142578125, 0.072021484375, 0.24200439453125, 0.4119873046875, 0.58197021484375, 0.751953125, 0.92193603515625, 1.0919189453125, 1.26190185546875, 1.431884765625, 1.60186767578125, 1.7718505859375, 1.94183349609375, 2.11181640625, 2.28179931640625, 2.4517822265625, 2.62176513671875, 2.791748046875, 2.96173095703125, 3.1317138671875, 3.30169677734375, 3.4716796875, 3.64166259765625, 3.8116455078125, 3.98162841796875, 4.151611328125, 4.32159423828125, 4.4915771484375, 4.66156005859375, 4.83154296875, 5.00152587890625, 5.1715087890625, 5.34149169921875, 5.511474609375, 5.68145751953125, 5.8514404296875, 6.02142333984375, 6.19140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 9.0, 7.0, 19.0, 18.0, 31.0, 43.0, 80.0, 125.0, 210.0, 183.0, 109.0, 58.0, 31.0, 24.0, 16.0, 13.0, 4.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00290679931640625, -0.0028354376554489136, -0.002764075994491577, -0.0026927143335342407, -0.0026213526725769043, -0.002549991011619568, -0.0024786293506622314, -0.002407267689704895, -0.0023359060287475586, -0.002264544367790222, -0.0021931827068328857, -0.0021218210458755493, -0.002050459384918213, -0.0019790977239608765, -0.00190773606300354, -0.0018363744020462036, -0.0017650127410888672, -0.0016936510801315308, -0.0016222894191741943, -0.001550927758216858, -0.0014795660972595215, -0.001408204436302185, -0.0013368427753448486, -0.0012654811143875122, -0.0011941194534301758, -0.0011227577924728394, -0.001051396131515503, -0.0009800344705581665, -0.0009086728096008301, -0.0008373111486434937, -0.0007659494876861572, -0.0006945878267288208, -0.0006232261657714844, -0.000551864504814148, -0.0004805028438568115, -0.0004091411828994751, -0.00033777952194213867, -0.00026641786098480225, -0.00019505620002746582, -0.0001236945390701294, -5.233287811279297e-05, 1.9028782844543457e-05, 9.039044380187988e-05, 0.0001617521047592163, 0.00023311376571655273, 0.00030447542667388916, 0.0003758370876312256, 0.000447198748588562, 0.0005185604095458984, 0.0005899220705032349, 0.0006612837314605713, 0.0007326453924179077, 0.0008040070533752441, 0.0008753687143325806, 0.000946730375289917, 0.0010180920362472534, 0.0010894536972045898, 0.0011608153581619263, 0.0012321770191192627, 0.0013035386800765991, 0.0013749003410339355, 0.001446262001991272, 0.0015176236629486084, 0.0015889853239059448, 0.0016603469848632812]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 9.0, 9.0, 10.0, 19.0, 32.0, 44.0, 84.0, 113.0, 191.0, 322.0, 542.0, 1166.0, 2491.0, 6179.0, 18041.0, 76710.0, 690576.0, 199138.0, 35342.0, 10231.0, 3767.0, 1679.0, 788.0, 445.0, 244.0, 138.0, 72.0, 52.0, 41.0, 34.0, 12.0, 8.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.09375, -5.91839599609375, -5.7430419921875, -5.56768798828125, -5.392333984375, -5.21697998046875, -5.0416259765625, -4.86627197265625, -4.69091796875, -4.51556396484375, -4.3402099609375, -4.16485595703125, -3.989501953125, -3.81414794921875, -3.6387939453125, -3.46343994140625, -3.2880859375, -3.11273193359375, -2.9373779296875, -2.76202392578125, -2.586669921875, -2.41131591796875, -2.2359619140625, -2.06060791015625, -1.88525390625, -1.70989990234375, -1.5345458984375, -1.35919189453125, -1.183837890625, -1.00848388671875, -0.8331298828125, -0.65777587890625, -0.482421875, -0.30706787109375, -0.1317138671875, 0.04364013671875, 0.218994140625, 0.39434814453125, 0.5697021484375, 0.74505615234375, 0.92041015625, 1.09576416015625, 1.2711181640625, 1.44647216796875, 1.621826171875, 1.79718017578125, 1.9725341796875, 2.14788818359375, 2.3232421875, 2.49859619140625, 2.6739501953125, 2.84930419921875, 3.024658203125, 3.20001220703125, 3.3753662109375, 3.55072021484375, 3.72607421875, 3.90142822265625, 4.0767822265625, 4.25213623046875, 4.427490234375, 4.60284423828125, 4.7781982421875, 4.95355224609375, 5.12890625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 11.0, 8.0, 11.0, 11.0, 15.0, 35.0, 49.0, 74.0, 100.0, 158.0, 150.0, 131.0, 73.0, 52.0, 37.0, 31.0, 15.0, 10.0, 8.0, 3.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.21875, -8.0089111328125, -7.799072265625, -7.5892333984375, -7.37939453125, -7.1695556640625, -6.959716796875, -6.7498779296875, -6.5400390625, -6.3302001953125, -6.120361328125, -5.9105224609375, -5.70068359375, -5.4908447265625, -5.281005859375, -5.0711669921875, -4.861328125, -4.6514892578125, -4.441650390625, -4.2318115234375, -4.02197265625, -3.8121337890625, -3.602294921875, -3.3924560546875, -3.1826171875, -2.9727783203125, -2.762939453125, -2.5531005859375, -2.34326171875, -2.1334228515625, -1.923583984375, -1.7137451171875, -1.50390625, -1.2940673828125, -1.084228515625, -0.8743896484375, -0.66455078125, -0.4547119140625, -0.244873046875, -0.0350341796875, 0.1748046875, 0.3846435546875, 0.594482421875, 0.8043212890625, 1.01416015625, 1.2239990234375, 1.433837890625, 1.6436767578125, 1.853515625, 2.0633544921875, 2.273193359375, 2.4830322265625, 2.69287109375, 2.9027099609375, 3.112548828125, 3.3223876953125, 3.5322265625, 3.7420654296875, 3.951904296875, 4.1617431640625, 4.37158203125, 4.5814208984375, 4.791259765625, 5.0010986328125, 5.2109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 10.0, 18.0, 40.0, 89.0, 171.0, 360.0, 142.0, 73.0, 49.0, 10.0, 13.0, 4.0, 7.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.34686279296875, -160.685302734375, -156.02374267578125, -151.3621826171875, -146.70062255859375, -142.03904724121094, -137.3774871826172, -132.71592712402344, -128.0543670654297, -123.39280700683594, -118.73124694824219, -114.0696792602539, -109.40811920166016, -104.7465591430664, -100.08499145507812, -95.42343139648438, -90.76187133789062, -86.10031127929688, -81.43875122070312, -76.77718353271484, -72.1156234741211, -67.45406341552734, -62.79249954223633, -58.13093566894531, -53.46937561035156, -48.80781555175781, -44.1462516784668, -39.48468780517578, -34.82312774658203, -30.16156578063965, -25.500003814697266, -20.83843994140625, -16.1768798828125, -11.515317916870117, -6.853755950927734, -2.1921939849853516, 2.4693679809570312, 7.130929946899414, 11.792491912841797, 16.454055786132812, 21.115615844726562, 25.777177810668945, 30.438739776611328, 35.100303649902344, 39.761863708496094, 44.423423767089844, 49.08498764038086, 53.746551513671875, 58.408111572265625, 63.069671630859375, 67.73123168945312, 72.3927993774414, 77.05435943603516, 81.7159194946289, 86.37748718261719, 91.03904724121094, 95.70060729980469, 100.36216735839844, 105.02372741699219, 109.68529510498047, 114.34685516357422, 119.00841522216797, 123.66998291015625, 128.33154296875, 132.99310302734375]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 9.0, 6.0, 11.0, 10.0, 8.0, 12.0, 21.0, 19.0, 20.0, 18.0, 15.0, 24.0, 30.0, 30.0, 35.0, 46.0, 73.0, 86.0, 105.0, 48.0, 59.0, 33.0, 36.0, 27.0, 33.0, 28.0, 24.0, 14.0, 21.0, 17.0, 12.0, 16.0, 13.0, 11.0, 5.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-88.90167236328125, -86.29511260986328, -83.68855285644531, -81.08200073242188, -78.4754409790039, -75.86888122558594, -73.2623291015625, -70.65576934814453, -68.04920959472656, -65.4426498413086, -62.83609390258789, -60.22953796386719, -57.62297821044922, -55.01641845703125, -52.40986251831055, -49.803306579589844, -47.196746826171875, -44.590187072753906, -41.9836311340332, -39.3770751953125, -36.77051544189453, -34.16395568847656, -31.55739974975586, -28.950841903686523, -26.344284057617188, -23.73772621154785, -21.131168365478516, -18.52461051940918, -15.918052673339844, -13.311494827270508, -10.704936981201172, -8.098379135131836, -5.4918212890625, -2.885263442993164, -0.2787055969238281, 2.327852249145508, 4.934410095214844, 7.54096794128418, 10.147525787353516, 12.754083633422852, 15.360641479492188, 17.967199325561523, 20.57375717163086, 23.180315017700195, 25.78687286376953, 28.393430709838867, 30.999988555908203, 33.606544494628906, 36.213104248046875, 38.819664001464844, 41.42621994018555, 44.03277587890625, 46.63933563232422, 49.24589538574219, 51.85245132446289, 54.459007263183594, 57.06556701660156, 59.67212677001953, 62.278682708740234, 64.88523864746094, 67.4917984008789, 70.09835815429688, 72.70491027832031, 75.31147003173828, 77.91802978515625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 14.0, 17.0, 17.0, 25.0, 43.0, 46.0, 80.0, 125.0, 183.0, 395.0, 689.0, 1172.0, 2340.0, 5014.0, 12246.0, 36839.0, 157362.0, 962821.0, 2360745.0, 522584.0, 90876.0, 23878.0, 8785.0, 3874.0, 1833.0, 870.0, 541.0, 326.0, 192.0, 114.0, 67.0, 54.0, 38.0, 21.0, 16.0, 7.0, 9.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.77734375, -6.53814697265625, -6.2989501953125, -6.05975341796875, -5.820556640625, -5.58135986328125, -5.3421630859375, -5.10296630859375, -4.86376953125, -4.62457275390625, -4.3853759765625, -4.14617919921875, -3.906982421875, -3.66778564453125, -3.4285888671875, -3.18939208984375, -2.9501953125, -2.71099853515625, -2.4718017578125, -2.23260498046875, -1.993408203125, -1.75421142578125, -1.5150146484375, -1.27581787109375, -1.03662109375, -0.79742431640625, -0.5582275390625, -0.31903076171875, -0.079833984375, 0.15936279296875, 0.3985595703125, 0.63775634765625, 0.876953125, 1.11614990234375, 1.3553466796875, 1.59454345703125, 1.833740234375, 2.07293701171875, 2.3121337890625, 2.55133056640625, 2.79052734375, 3.02972412109375, 3.2689208984375, 3.50811767578125, 3.747314453125, 3.98651123046875, 4.2257080078125, 4.46490478515625, 4.7041015625, 4.94329833984375, 5.1824951171875, 5.42169189453125, 5.660888671875, 5.90008544921875, 6.1392822265625, 6.37847900390625, 6.61767578125, 6.85687255859375, 7.0960693359375, 7.33526611328125, 7.574462890625, 7.81365966796875, 8.0528564453125, 8.29205322265625, 8.53125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 11.0, 20.0, 17.0, 25.0, 31.0, 36.0, 35.0, 44.0, 54.0, 53.0, 62.0, 54.0, 81.0, 50.0, 69.0, 68.0, 55.0, 39.0, 38.0, 35.0, 22.0, 18.0, 15.0, 16.0, 9.0, 7.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3828125, -5.161376953125, -4.93994140625, -4.718505859375, -4.4970703125, -4.275634765625, -4.05419921875, -3.832763671875, -3.611328125, -3.389892578125, -3.16845703125, -2.947021484375, -2.7255859375, -2.504150390625, -2.28271484375, -2.061279296875, -1.83984375, -1.618408203125, -1.39697265625, -1.175537109375, -0.9541015625, -0.732666015625, -0.51123046875, -0.289794921875, -0.068359375, 0.153076171875, 0.37451171875, 0.595947265625, 0.8173828125, 1.038818359375, 1.26025390625, 1.481689453125, 1.703125, 1.924560546875, 2.14599609375, 2.367431640625, 2.5888671875, 2.810302734375, 3.03173828125, 3.253173828125, 3.474609375, 3.696044921875, 3.91748046875, 4.138916015625, 4.3603515625, 4.581787109375, 4.80322265625, 5.024658203125, 5.24609375, 5.467529296875, 5.68896484375, 5.910400390625, 6.1318359375, 6.353271484375, 6.57470703125, 6.796142578125, 7.017578125, 7.239013671875, 7.46044921875, 7.681884765625, 7.9033203125, 8.124755859375, 8.34619140625, 8.567626953125, 8.7890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 7.0, 20.0, 32.0, 44.0, 93.0, 175.0, 352.0, 880.0, 2995.0, 16406.0, 350530.0, 3755238.0, 58132.0, 6617.0, 1588.0, 591.0, 232.0, 136.0, 64.0, 48.0, 24.0, 26.0, 15.0, 6.0, 7.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.953125, -22.044677734375, -21.13623046875, -20.227783203125, -19.3193359375, -18.410888671875, -17.50244140625, -16.593994140625, -15.685546875, -14.777099609375, -13.86865234375, -12.960205078125, -12.0517578125, -11.143310546875, -10.23486328125, -9.326416015625, -8.41796875, -7.509521484375, -6.60107421875, -5.692626953125, -4.7841796875, -3.875732421875, -2.96728515625, -2.058837890625, -1.150390625, -0.241943359375, 0.66650390625, 1.574951171875, 2.4833984375, 3.391845703125, 4.30029296875, 5.208740234375, 6.1171875, 7.025634765625, 7.93408203125, 8.842529296875, 9.7509765625, 10.659423828125, 11.56787109375, 12.476318359375, 13.384765625, 14.293212890625, 15.20166015625, 16.110107421875, 17.0185546875, 17.927001953125, 18.83544921875, 19.743896484375, 20.65234375, 21.560791015625, 22.46923828125, 23.377685546875, 24.2861328125, 25.194580078125, 26.10302734375, 27.011474609375, 27.919921875, 28.828369140625, 29.73681640625, 30.645263671875, 31.5537109375, 32.462158203125, 33.37060546875, 34.279052734375, 35.1875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 7.0, 7.0, 4.0, 8.0, 9.0, 10.0, 13.0, 17.0, 22.0, 37.0, 64.0, 85.0, 132.0, 191.0, 420.0, 712.0, 882.0, 618.0, 310.0, 182.0, 109.0, 80.0, 41.0, 34.0, 22.0, 14.0, 13.0, 7.0, 8.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.34375, -13.798095703125, -13.25244140625, -12.706787109375, -12.1611328125, -11.615478515625, -11.06982421875, -10.524169921875, -9.978515625, -9.432861328125, -8.88720703125, -8.341552734375, -7.7958984375, -7.250244140625, -6.70458984375, -6.158935546875, -5.61328125, -5.067626953125, -4.52197265625, -3.976318359375, -3.4306640625, -2.885009765625, -2.33935546875, -1.793701171875, -1.248046875, -0.702392578125, -0.15673828125, 0.388916015625, 0.9345703125, 1.480224609375, 2.02587890625, 2.571533203125, 3.1171875, 3.662841796875, 4.20849609375, 4.754150390625, 5.2998046875, 5.845458984375, 6.39111328125, 6.936767578125, 7.482421875, 8.028076171875, 8.57373046875, 9.119384765625, 9.6650390625, 10.210693359375, 10.75634765625, 11.302001953125, 11.84765625, 12.393310546875, 12.93896484375, 13.484619140625, 14.0302734375, 14.575927734375, 15.12158203125, 15.667236328125, 16.212890625, 16.758544921875, 17.30419921875, 17.849853515625, 18.3955078125, 18.941162109375, 19.48681640625, 20.032470703125, 20.578125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 8.0, 12.0, 27.0, 44.0, 85.0, 149.0, 189.0, 178.0, 124.0, 77.0, 31.0, 32.0, 15.0, 9.0, 4.0, 2.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.3233642578125, -142.38999938964844, -137.45664978027344, -132.52328491210938, -127.58993530273438, -122.65657043457031, -117.72321319580078, -112.78985595703125, -107.85649871826172, -102.92314147949219, -97.98978424072266, -93.05642700195312, -88.12306213378906, -83.18971252441406, -78.25634765625, -73.32299041748047, -68.38963317871094, -63.456275939941406, -58.522918701171875, -53.58955764770508, -48.65620040893555, -43.722843170166016, -38.78948211669922, -33.85612487792969, -28.922767639160156, -23.989410400390625, -19.05605125427246, -14.122693061828613, -9.189334869384766, -4.255977630615234, 0.6773815155029297, 5.610740661621094, 10.544097900390625, 15.477456092834473, 20.41081428527832, 25.344173431396484, 30.277530670166016, 35.21088790893555, 40.144248962402344, 45.077606201171875, 50.010963439941406, 54.94432067871094, 59.87767791748047, 64.81103515625, 69.74440002441406, 74.67774963378906, 79.61111450195312, 84.54447174072266, 89.47782897949219, 94.41118621826172, 99.34454345703125, 104.27790069580078, 109.21125793457031, 114.14462280273438, 119.0779800415039, 124.01133728027344, 128.9447021484375, 133.87806701660156, 138.81141662597656, 143.74478149414062, 148.67813110351562, 153.6114959716797, 158.5448455810547, 163.47821044921875, 168.41156005859375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 2.0, 4.0, 5.0, 8.0, 7.0, 10.0, 11.0, 10.0, 13.0, 19.0, 24.0, 21.0, 29.0, 29.0, 30.0, 37.0, 41.0, 27.0, 36.0, 35.0, 38.0, 50.0, 39.0, 49.0, 47.0, 49.0, 38.0, 44.0, 27.0, 28.0, 25.0, 23.0, 24.0, 19.0, 16.0, 14.0, 9.0, 8.0, 11.0, 7.0, 7.0, 7.0, 7.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-61.42251968383789, -59.467926025390625, -57.513328552246094, -55.55873107910156, -53.6041374206543, -51.64954376220703, -49.6949462890625, -47.74034881591797, -45.7857551574707, -43.83116149902344, -41.876564025878906, -39.921966552734375, -37.96737289428711, -36.012779235839844, -34.05818176269531, -32.10358428955078, -30.148990631103516, -28.194395065307617, -26.23979949951172, -24.28520393371582, -22.330608367919922, -20.376012802124023, -18.421417236328125, -16.466821670532227, -14.512226104736328, -12.55763053894043, -10.603034973144531, -8.648439407348633, -6.693843841552734, -4.739248275756836, -2.7846527099609375, -0.8300571441650391, 1.1245346069335938, 3.079130172729492, 5.033725738525391, 6.988321304321289, 8.942916870117188, 10.897512435913086, 12.852108001708984, 14.806703567504883, 16.76129913330078, 18.71589469909668, 20.670490264892578, 22.625085830688477, 24.579681396484375, 26.534276962280273, 28.488872528076172, 30.44346809387207, 32.39806365966797, 34.3526611328125, 36.307254791259766, 38.26184844970703, 40.21644592285156, 42.171043395996094, 44.12563705444336, 46.080230712890625, 48.034828186035156, 49.98942565917969, 51.94401931762695, 53.89861297607422, 55.85321044921875, 57.80780792236328, 59.76240158081055, 61.71699523925781, 63.671592712402344]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 11.0, 7.0, 26.0, 23.0, 44.0, 59.0, 97.0, 134.0, 224.0, 368.0, 587.0, 959.0, 1720.0, 3044.0, 6278.0, 13809.0, 34949.0, 105248.0, 389963.0, 342571.0, 91724.0, 31363.0, 12701.0, 5792.0, 2817.0, 1515.0, 889.0, 562.0, 393.0, 221.0, 147.0, 100.0, 63.0, 48.0, 19.0, 22.0, 15.0, 8.0, 9.0, 5.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.109375, -8.84869384765625, -8.5880126953125, -8.32733154296875, -8.066650390625, -7.80596923828125, -7.5452880859375, -7.28460693359375, -7.02392578125, -6.76324462890625, -6.5025634765625, -6.24188232421875, -5.981201171875, -5.72052001953125, -5.4598388671875, -5.19915771484375, -4.9384765625, -4.67779541015625, -4.4171142578125, -4.15643310546875, -3.895751953125, -3.63507080078125, -3.3743896484375, -3.11370849609375, -2.85302734375, -2.59234619140625, -2.3316650390625, -2.07098388671875, -1.810302734375, -1.54962158203125, -1.2889404296875, -1.02825927734375, -0.767578125, -0.50689697265625, -0.2462158203125, 0.01446533203125, 0.275146484375, 0.53582763671875, 0.7965087890625, 1.05718994140625, 1.31787109375, 1.57855224609375, 1.8392333984375, 2.09991455078125, 2.360595703125, 2.62127685546875, 2.8819580078125, 3.14263916015625, 3.4033203125, 3.66400146484375, 3.9246826171875, 4.18536376953125, 4.446044921875, 4.70672607421875, 4.9674072265625, 5.22808837890625, 5.48876953125, 5.74945068359375, 6.0101318359375, 6.27081298828125, 6.531494140625, 6.79217529296875, 7.0528564453125, 7.31353759765625, 7.57421875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 11.0, 12.0, 16.0, 9.0, 22.0, 21.0, 33.0, 35.0, 55.0, 48.0, 45.0, 50.0, 49.0, 59.0, 55.0, 55.0, 61.0, 45.0, 56.0, 39.0, 28.0, 44.0, 33.0, 24.0, 17.0, 19.0, 10.0, 9.0, 5.0, 4.0, 4.0, 5.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37890625, -6.13714599609375, -5.8953857421875, -5.65362548828125, -5.411865234375, -5.17010498046875, -4.9283447265625, -4.68658447265625, -4.44482421875, -4.20306396484375, -3.9613037109375, -3.71954345703125, -3.477783203125, -3.23602294921875, -2.9942626953125, -2.75250244140625, -2.5107421875, -2.26898193359375, -2.0272216796875, -1.78546142578125, -1.543701171875, -1.30194091796875, -1.0601806640625, -0.81842041015625, -0.57666015625, -0.33489990234375, -0.0931396484375, 0.14862060546875, 0.390380859375, 0.63214111328125, 0.8739013671875, 1.11566162109375, 1.357421875, 1.59918212890625, 1.8409423828125, 2.08270263671875, 2.324462890625, 2.56622314453125, 2.8079833984375, 3.04974365234375, 3.29150390625, 3.53326416015625, 3.7750244140625, 4.01678466796875, 4.258544921875, 4.50030517578125, 4.7420654296875, 4.98382568359375, 5.2255859375, 5.46734619140625, 5.7091064453125, 5.95086669921875, 6.192626953125, 6.43438720703125, 6.6761474609375, 6.91790771484375, 7.15966796875, 7.40142822265625, 7.6431884765625, 7.88494873046875, 8.126708984375, 8.36846923828125, 8.6102294921875, 8.85198974609375, 9.09375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 3.0, 6.0, 11.0, 14.0, 14.0, 24.0, 25.0, 34.0, 34.0, 65.0, 111.0, 158.0, 234.0, 330.0, 613.0, 1036.0, 2163.0, 5277.0, 17476.0, 99019.0, 806494.0, 89004.0, 16584.0, 5110.0, 2130.0, 985.0, 553.0, 322.0, 197.0, 134.0, 119.0, 61.0, 55.0, 32.0, 27.0, 22.0, 19.0, 12.0, 8.0, 6.0, 5.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.21875, -15.7193603515625, -15.219970703125, -14.7205810546875, -14.22119140625, -13.7218017578125, -13.222412109375, -12.7230224609375, -12.2236328125, -11.7242431640625, -11.224853515625, -10.7254638671875, -10.22607421875, -9.7266845703125, -9.227294921875, -8.7279052734375, -8.228515625, -7.7291259765625, -7.229736328125, -6.7303466796875, -6.23095703125, -5.7315673828125, -5.232177734375, -4.7327880859375, -4.2333984375, -3.7340087890625, -3.234619140625, -2.7352294921875, -2.23583984375, -1.7364501953125, -1.237060546875, -0.7376708984375, -0.23828125, 0.2611083984375, 0.760498046875, 1.2598876953125, 1.75927734375, 2.2586669921875, 2.758056640625, 3.2574462890625, 3.7568359375, 4.2562255859375, 4.755615234375, 5.2550048828125, 5.75439453125, 6.2537841796875, 6.753173828125, 7.2525634765625, 7.751953125, 8.2513427734375, 8.750732421875, 9.2501220703125, 9.74951171875, 10.2489013671875, 10.748291015625, 11.2476806640625, 11.7470703125, 12.2464599609375, 12.745849609375, 13.2452392578125, 13.74462890625, 14.2440185546875, 14.743408203125, 15.2427978515625, 15.7421875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 13.0, 8.0, 9.0, 7.0, 12.0, 17.0, 18.0, 18.0, 26.0, 26.0, 42.0, 37.0, 43.0, 47.0, 54.0, 60.0, 39.0, 47.0, 67.0, 57.0, 51.0, 46.0, 45.0, 31.0, 25.0, 19.0, 25.0, 18.0, 20.0, 11.0, 4.0, 5.0, 11.0, 14.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.265625, -24.430908203125, -23.59619140625, -22.761474609375, -21.9267578125, -21.092041015625, -20.25732421875, -19.422607421875, -18.587890625, -17.753173828125, -16.91845703125, -16.083740234375, -15.2490234375, -14.414306640625, -13.57958984375, -12.744873046875, -11.91015625, -11.075439453125, -10.24072265625, -9.406005859375, -8.5712890625, -7.736572265625, -6.90185546875, -6.067138671875, -5.232421875, -4.397705078125, -3.56298828125, -2.728271484375, -1.8935546875, -1.058837890625, -0.22412109375, 0.610595703125, 1.4453125, 2.280029296875, 3.11474609375, 3.949462890625, 4.7841796875, 5.618896484375, 6.45361328125, 7.288330078125, 8.123046875, 8.957763671875, 9.79248046875, 10.627197265625, 11.4619140625, 12.296630859375, 13.13134765625, 13.966064453125, 14.80078125, 15.635498046875, 16.47021484375, 17.304931640625, 18.1396484375, 18.974365234375, 19.80908203125, 20.643798828125, 21.478515625, 22.313232421875, 23.14794921875, 23.982666015625, 24.8173828125, 25.652099609375, 26.48681640625, 27.321533203125, 28.15625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 10.0, 11.0, 14.0, 31.0, 35.0, 74.0, 141.0, 252.0, 510.0, 1202.0, 3189.0, 9508.0, 38351.0, 263546.0, 661400.0, 51602.0, 12108.0, 3794.0, 1466.0, 604.0, 295.0, 139.0, 93.0, 58.0, 31.0, 21.0, 11.0, 7.0, 4.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.09765625, -4.9564208984375, -4.815185546875, -4.6739501953125, -4.53271484375, -4.3914794921875, -4.250244140625, -4.1090087890625, -3.9677734375, -3.8265380859375, -3.685302734375, -3.5440673828125, -3.40283203125, -3.2615966796875, -3.120361328125, -2.9791259765625, -2.837890625, -2.6966552734375, -2.555419921875, -2.4141845703125, -2.27294921875, -2.1317138671875, -1.990478515625, -1.8492431640625, -1.7080078125, -1.5667724609375, -1.425537109375, -1.2843017578125, -1.14306640625, -1.0018310546875, -0.860595703125, -0.7193603515625, -0.578125, -0.4368896484375, -0.295654296875, -0.1544189453125, -0.01318359375, 0.1280517578125, 0.269287109375, 0.4105224609375, 0.5517578125, 0.6929931640625, 0.834228515625, 0.9754638671875, 1.11669921875, 1.2579345703125, 1.399169921875, 1.5404052734375, 1.681640625, 1.8228759765625, 1.964111328125, 2.1053466796875, 2.24658203125, 2.3878173828125, 2.529052734375, 2.6702880859375, 2.8115234375, 2.9527587890625, 3.093994140625, 3.2352294921875, 3.37646484375, 3.5177001953125, 3.658935546875, 3.8001708984375, 3.94140625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 9.0, 4.0, 3.0, 2.0, 6.0, 4.0, 10.0, 22.0, 31.0, 39.0, 75.0, 128.0, 214.0, 194.0, 112.0, 53.0, 29.0, 16.0, 17.0, 11.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002197265625, -0.0021302998065948486, -0.0020633339881896973, -0.001996368169784546, -0.0019294023513793945, -0.0018624365329742432, -0.0017954707145690918, -0.0017285048961639404, -0.001661539077758789, -0.0015945732593536377, -0.0015276074409484863, -0.001460641622543335, -0.0013936758041381836, -0.0013267099857330322, -0.0012597441673278809, -0.0011927783489227295, -0.0011258125305175781, -0.0010588467121124268, -0.0009918808937072754, -0.000924915075302124, -0.0008579492568969727, -0.0007909834384918213, -0.0007240176200866699, -0.0006570518016815186, -0.0005900859832763672, -0.0005231201648712158, -0.00045615434646606445, -0.0003891885280609131, -0.0003222227096557617, -0.00025525689125061035, -0.00018829107284545898, -0.00012132525444030762, -5.435943603515625e-05, 1.2606382369995117e-05, 7.957220077514648e-05, 0.00014653801918029785, 0.00021350383758544922, 0.0002804696559906006, 0.00034743547439575195, 0.0004144012928009033, 0.0004813671112060547, 0.0005483329296112061, 0.0006152987480163574, 0.0006822645664215088, 0.0007492303848266602, 0.0008161962032318115, 0.0008831620216369629, 0.0009501278400421143, 0.0010170936584472656, 0.001084059476852417, 0.0011510252952575684, 0.0012179911136627197, 0.001284956932067871, 0.0013519227504730225, 0.0014188885688781738, 0.0014858543872833252, 0.0015528202056884766, 0.001619786024093628, 0.0016867518424987793, 0.0017537176609039307, 0.001820683479309082, 0.0018876492977142334, 0.0019546151161193848, 0.002021580934524536, 0.0020885467529296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 14.0, 14.0, 24.0, 27.0, 43.0, 57.0, 101.0, 149.0, 254.0, 438.0, 767.0, 1303.0, 2641.0, 5574.0, 13485.0, 36877.0, 116738.0, 635018.0, 157916.0, 46677.0, 16810.0, 6810.0, 3066.0, 1570.0, 876.0, 484.0, 290.0, 178.0, 104.0, 77.0, 42.0, 36.0, 24.0, 15.0, 13.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.780181884765625, -2.67950439453125, -2.578826904296875, -2.4781494140625, -2.377471923828125, -2.27679443359375, -2.176116943359375, -2.075439453125, -1.974761962890625, -1.87408447265625, -1.773406982421875, -1.6727294921875, -1.572052001953125, -1.47137451171875, -1.370697021484375, -1.27001953125, -1.169342041015625, -1.06866455078125, -0.967987060546875, -0.8673095703125, -0.766632080078125, -0.66595458984375, -0.565277099609375, -0.464599609375, -0.363922119140625, -0.26324462890625, -0.162567138671875, -0.0618896484375, 0.038787841796875, 0.13946533203125, 0.240142822265625, 0.3408203125, 0.441497802734375, 0.54217529296875, 0.642852783203125, 0.7435302734375, 0.844207763671875, 0.94488525390625, 1.045562744140625, 1.146240234375, 1.246917724609375, 1.34759521484375, 1.448272705078125, 1.5489501953125, 1.649627685546875, 1.75030517578125, 1.850982666015625, 1.95166015625, 2.052337646484375, 2.15301513671875, 2.253692626953125, 2.3543701171875, 2.455047607421875, 2.55572509765625, 2.656402587890625, 2.757080078125, 2.857757568359375, 2.95843505859375, 3.059112548828125, 3.1597900390625, 3.260467529296875, 3.36114501953125, 3.461822509765625, 3.5625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 13.0, 5.0, 8.0, 6.0, 13.0, 21.0, 23.0, 16.0, 23.0, 53.0, 58.0, 59.0, 75.0, 93.0, 94.0, 69.0, 61.0, 49.0, 45.0, 40.0, 36.0, 18.0, 25.0, 17.0, 20.0, 18.0, 14.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.810546875, -3.6915283203125, -3.572509765625, -3.4534912109375, -3.33447265625, -3.2154541015625, -3.096435546875, -2.9774169921875, -2.8583984375, -2.7393798828125, -2.620361328125, -2.5013427734375, -2.38232421875, -2.2633056640625, -2.144287109375, -2.0252685546875, -1.90625, -1.7872314453125, -1.668212890625, -1.5491943359375, -1.43017578125, -1.3111572265625, -1.192138671875, -1.0731201171875, -0.9541015625, -0.8350830078125, -0.716064453125, -0.5970458984375, -0.47802734375, -0.3590087890625, -0.239990234375, -0.1209716796875, -0.001953125, 0.1170654296875, 0.236083984375, 0.3551025390625, 0.47412109375, 0.5931396484375, 0.712158203125, 0.8311767578125, 0.9501953125, 1.0692138671875, 1.188232421875, 1.3072509765625, 1.42626953125, 1.5452880859375, 1.664306640625, 1.7833251953125, 1.90234375, 2.0213623046875, 2.140380859375, 2.2593994140625, 2.37841796875, 2.4974365234375, 2.616455078125, 2.7354736328125, 2.8544921875, 2.9735107421875, 3.092529296875, 3.2115478515625, 3.33056640625, 3.4495849609375, 3.568603515625, 3.6876220703125, 3.806640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 6.0, 17.0, 30.0, 78.0, 146.0, 449.0, 171.0, 70.0, 17.0, 4.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.17439270019531, -83.95804595947266, -77.74170684814453, -71.52536010742188, -65.30902099609375, -59.092674255371094, -52.87632751464844, -46.65998458862305, -40.443641662597656, -34.227298736572266, -28.010953903198242, -21.79460906982422, -15.578266143798828, -9.361923217773438, -3.1455764770507812, 3.0707664489746094, 9.287109375, 15.503453254699707, 21.719797134399414, 27.936141967773438, 34.15248489379883, 40.36882781982422, 46.585174560546875, 52.801517486572266, 59.017860412597656, 65.23420715332031, 71.45054626464844, 77.6668930053711, 83.88323974609375, 90.09957885742188, 96.31592559814453, 102.53227233886719, 108.74862670898438, 114.96497344970703, 121.18131256103516, 127.39765930175781, 133.61399841308594, 139.83035278320312, 146.04669189453125, 152.26303100585938, 158.4793701171875, 164.69570922851562, 170.9120635986328, 177.12840270996094, 183.34474182128906, 189.56109619140625, 195.77743530273438, 201.9937744140625, 208.2101287841797, 214.4264678955078, 220.642822265625, 226.85916137695312, 233.07550048828125, 239.29183959960938, 245.50819396972656, 251.7245330810547, 257.9408874511719, 264.1572265625, 270.3735656738281, 276.58990478515625, 282.8062744140625, 289.0226135253906, 295.23895263671875, 301.4552917480469, 307.671630859375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [3.0, 5.0, 0.0, 5.0, 0.0, 4.0, 5.0, 5.0, 9.0, 4.0, 14.0, 11.0, 12.0, 14.0, 11.0, 15.0, 16.0, 26.0, 20.0, 22.0, 29.0, 35.0, 30.0, 45.0, 62.0, 100.0, 109.0, 94.0, 42.0, 29.0, 31.0, 26.0, 26.0, 25.0, 20.0, 8.0, 21.0, 14.0, 8.0, 12.0, 7.0, 7.0, 6.0, 6.0, 2.0, 2.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-80.78650665283203, -77.7035903930664, -74.62068176269531, -71.53776550292969, -68.45484924316406, -65.37194061279297, -62.289024353027344, -59.206111907958984, -56.123199462890625, -53.040287017822266, -49.957374572753906, -46.87445831298828, -43.79154586791992, -40.70863342285156, -37.62571716308594, -34.54280471801758, -31.45989227294922, -28.37697982788086, -25.294065475463867, -22.211151123046875, -19.128238677978516, -16.045326232910156, -12.962411880493164, -9.879497528076172, -6.7965850830078125, -3.7136716842651367, -0.6307582855224609, 2.452155113220215, 5.535068511962891, 8.617981910705566, 11.700895309448242, 14.783809661865234, 17.866722106933594, 20.949634552001953, 24.032548904418945, 27.115463256835938, 30.198375701904297, 33.281288146972656, 36.36420440673828, 39.44711685180664, 42.530029296875, 45.61294174194336, 48.69585418701172, 51.778770446777344, 54.8616828918457, 57.94459533691406, 61.02751159667969, 64.11042785644531, 67.1933364868164, 70.27625274658203, 73.35916137695312, 76.44207763671875, 79.52499389648438, 82.60790252685547, 85.6908187866211, 88.77372741699219, 91.85664367675781, 94.93955993652344, 98.02246856689453, 101.10538482666016, 104.18829345703125, 107.27120971679688, 110.3541259765625, 113.43704223632812, 116.51995086669922]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 7.0, 2.0, 8.0, 10.0, 12.0, 28.0, 37.0, 47.0, 67.0, 93.0, 117.0, 208.0, 349.0, 533.0, 860.0, 1493.0, 2579.0, 4868.0, 9792.0, 23159.0, 65934.0, 236418.0, 891748.0, 1901195.0, 764337.0, 194284.0, 55679.0, 20634.0, 9132.0, 4519.0, 2329.0, 1387.0, 874.0, 515.0, 342.0, 188.0, 150.0, 102.0, 62.0, 64.0, 39.0, 34.0, 7.0, 16.0, 4.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0], "bins": [-10.5, -10.21185302734375, -9.9237060546875, -9.63555908203125, -9.347412109375, -9.05926513671875, -8.7711181640625, -8.48297119140625, -8.19482421875, -7.90667724609375, -7.6185302734375, -7.33038330078125, -7.042236328125, -6.75408935546875, -6.4659423828125, -6.17779541015625, -5.8896484375, -5.60150146484375, -5.3133544921875, -5.02520751953125, -4.737060546875, -4.44891357421875, -4.1607666015625, -3.87261962890625, -3.58447265625, -3.29632568359375, -3.0081787109375, -2.72003173828125, -2.431884765625, -2.14373779296875, -1.8555908203125, -1.56744384765625, -1.279296875, -0.99114990234375, -0.7030029296875, -0.41485595703125, -0.126708984375, 0.16143798828125, 0.4495849609375, 0.73773193359375, 1.02587890625, 1.31402587890625, 1.6021728515625, 1.89031982421875, 2.178466796875, 2.46661376953125, 2.7547607421875, 3.04290771484375, 3.3310546875, 3.61920166015625, 3.9073486328125, 4.19549560546875, 4.483642578125, 4.77178955078125, 5.0599365234375, 5.34808349609375, 5.63623046875, 5.92437744140625, 6.2125244140625, 6.50067138671875, 6.788818359375, 7.07696533203125, 7.3651123046875, 7.65325927734375, 7.94140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 12.0, 5.0, 14.0, 8.0, 16.0, 11.0, 16.0, 18.0, 22.0, 33.0, 27.0, 23.0, 37.0, 39.0, 59.0, 55.0, 50.0, 46.0, 54.0, 45.0, 44.0, 42.0, 45.0, 44.0, 30.0, 29.0, 23.0, 19.0, 21.0, 23.0, 15.0, 11.0, 10.0, 14.0, 7.0, 5.0, 6.0, 5.0, 6.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.546875, -6.35498046875, -6.1630859375, -5.97119140625, -5.779296875, -5.58740234375, -5.3955078125, -5.20361328125, -5.01171875, -4.81982421875, -4.6279296875, -4.43603515625, -4.244140625, -4.05224609375, -3.8603515625, -3.66845703125, -3.4765625, -3.28466796875, -3.0927734375, -2.90087890625, -2.708984375, -2.51708984375, -2.3251953125, -2.13330078125, -1.94140625, -1.74951171875, -1.5576171875, -1.36572265625, -1.173828125, -0.98193359375, -0.7900390625, -0.59814453125, -0.40625, -0.21435546875, -0.0224609375, 0.16943359375, 0.361328125, 0.55322265625, 0.7451171875, 0.93701171875, 1.12890625, 1.32080078125, 1.5126953125, 1.70458984375, 1.896484375, 2.08837890625, 2.2802734375, 2.47216796875, 2.6640625, 2.85595703125, 3.0478515625, 3.23974609375, 3.431640625, 3.62353515625, 3.8154296875, 4.00732421875, 4.19921875, 4.39111328125, 4.5830078125, 4.77490234375, 4.966796875, 5.15869140625, 5.3505859375, 5.54248046875, 5.734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 9.0, 35.0, 86.0, 259.0, 1078.0, 8392.0, 4167758.0, 14711.0, 1319.0, 386.0, 141.0, 46.0, 20.0, 15.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-161.5, -157.201171875, -152.90234375, -148.603515625, -144.3046875, -140.005859375, -135.70703125, -131.408203125, -127.109375, -122.810546875, -118.51171875, -114.212890625, -109.9140625, -105.615234375, -101.31640625, -97.017578125, -92.71875, -88.419921875, -84.12109375, -79.822265625, -75.5234375, -71.224609375, -66.92578125, -62.626953125, -58.328125, -54.029296875, -49.73046875, -45.431640625, -41.1328125, -36.833984375, -32.53515625, -28.236328125, -23.9375, -19.638671875, -15.33984375, -11.041015625, -6.7421875, -2.443359375, 1.85546875, 6.154296875, 10.453125, 14.751953125, 19.05078125, 23.349609375, 27.6484375, 31.947265625, 36.24609375, 40.544921875, 44.84375, 49.142578125, 53.44140625, 57.740234375, 62.0390625, 66.337890625, 70.63671875, 74.935546875, 79.234375, 83.533203125, 87.83203125, 92.130859375, 96.4296875, 100.728515625, 105.02734375, 109.326171875, 113.625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 11.0, 25.0, 37.0, 100.0, 149.0, 376.0, 913.0, 1338.0, 633.0, 258.0, 134.0, 50.0, 29.0, 14.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.09375, -22.40673828125, -20.7197265625, -19.03271484375, -17.345703125, -15.65869140625, -13.9716796875, -12.28466796875, -10.59765625, -8.91064453125, -7.2236328125, -5.53662109375, -3.849609375, -2.16259765625, -0.4755859375, 1.21142578125, 2.8984375, 4.58544921875, 6.2724609375, 7.95947265625, 9.646484375, 11.33349609375, 13.0205078125, 14.70751953125, 16.39453125, 18.08154296875, 19.7685546875, 21.45556640625, 23.142578125, 24.82958984375, 26.5166015625, 28.20361328125, 29.890625, 31.57763671875, 33.2646484375, 34.95166015625, 36.638671875, 38.32568359375, 40.0126953125, 41.69970703125, 43.38671875, 45.07373046875, 46.7607421875, 48.44775390625, 50.134765625, 51.82177734375, 53.5087890625, 55.19580078125, 56.8828125, 58.56982421875, 60.2568359375, 61.94384765625, 63.630859375, 65.31787109375, 67.0048828125, 68.69189453125, 70.37890625, 72.06591796875, 73.7529296875, 75.43994140625, 77.126953125, 78.81396484375, 80.5009765625, 82.18798828125, 83.875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 7.0, 11.0, 14.0, 28.0, 34.0, 99.0, 137.0, 196.0, 188.0, 98.0, 67.0, 37.0, 24.0, 19.0, 11.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-229.7044677734375, -219.14569091796875, -208.5869140625, -198.0281524658203, -187.46937561035156, -176.9105987548828, -166.35183715820312, -155.79306030273438, -145.23428344726562, -134.67550659179688, -124.11673736572266, -113.55796813964844, -102.99919128417969, -92.44041442871094, -81.88164520263672, -71.3228759765625, -60.76409912109375, -50.205326080322266, -39.64655303955078, -29.087779998779297, -18.529006958007812, -7.970233917236328, 2.5885391235351562, 13.147308349609375, 23.706085205078125, 34.26485824584961, 44.823631286621094, 55.38240432739258, 65.94117736816406, 76.49995422363281, 87.05872344970703, 97.61749267578125, 108.17626953125, 118.73504638671875, 129.2938232421875, 139.8525848388672, 150.41136169433594, 160.9701385498047, 171.52890014648438, 182.08767700195312, 192.64645385742188, 203.20523071289062, 213.76400756835938, 224.32276916503906, 234.8815460205078, 245.44032287597656, 255.99908447265625, 266.557861328125, 277.11663818359375, 287.6754150390625, 298.23419189453125, 308.79296875, 319.35174560546875, 329.9104919433594, 340.4692687988281, 351.0280456542969, 361.5868225097656, 372.1455993652344, 382.7043762207031, 393.2631530761719, 403.8218994140625, 414.38067626953125, 424.939453125, 435.49822998046875, 446.0570068359375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 10.0, 8.0, 16.0, 13.0, 21.0, 20.0, 39.0, 55.0, 75.0, 76.0, 104.0, 91.0, 114.0, 72.0, 72.0, 65.0, 51.0, 31.0, 22.0, 9.0, 14.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-329.9376525878906, -321.8611145019531, -313.7845764160156, -305.70806884765625, -297.63153076171875, -289.55499267578125, -281.47845458984375, -273.40191650390625, -265.32537841796875, -257.24884033203125, -249.1723175048828, -241.0957794189453, -233.01925659179688, -224.94271850585938, -216.86618041992188, -208.78964233398438, -200.713134765625, -192.6365966796875, -184.56007385253906, -176.48353576660156, -168.40701293945312, -160.33047485351562, -152.25393676757812, -144.17739868164062, -136.1008758544922, -128.0243377685547, -119.94781494140625, -111.87127685546875, -103.79474639892578, -95.71821594238281, -87.64167785644531, -79.56514739990234, -71.48861694335938, -63.412086486816406, -55.33555221557617, -47.25901794433594, -39.18248748779297, -31.10595703125, -23.029422760009766, -14.952888488769531, -6.8763580322265625, 1.200174331665039, 9.27670669555664, 17.353239059448242, 25.429771423339844, 33.50630187988281, 41.58283615112305, 49.65937042236328, 57.73590087890625, 65.81243133544922, 73.88896179199219, 81.96549987792969, 90.04203033447266, 98.11856079101562, 106.19509887695312, 114.2716293334961, 122.34815979003906, 130.42469787597656, 138.501220703125, 146.5777587890625, 154.654296875, 162.73081970214844, 170.80735778808594, 178.88388061523438, 186.96041870117188]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 9.0, 10.0, 12.0, 16.0, 21.0, 35.0, 52.0, 87.0, 110.0, 202.0, 316.0, 591.0, 1012.0, 2049.0, 4566.0, 11126.0, 34221.0, 143987.0, 641705.0, 152545.0, 34947.0, 11582.0, 4664.0, 2120.0, 1098.0, 611.0, 328.0, 188.0, 112.0, 79.0, 51.0, 32.0, 14.0, 19.0, 8.0, 10.0, 6.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.59375, -11.156494140625, -10.71923828125, -10.281982421875, -9.8447265625, -9.407470703125, -8.97021484375, -8.532958984375, -8.095703125, -7.658447265625, -7.22119140625, -6.783935546875, -6.3466796875, -5.909423828125, -5.47216796875, -5.034912109375, -4.59765625, -4.160400390625, -3.72314453125, -3.285888671875, -2.8486328125, -2.411376953125, -1.97412109375, -1.536865234375, -1.099609375, -0.662353515625, -0.22509765625, 0.212158203125, 0.6494140625, 1.086669921875, 1.52392578125, 1.961181640625, 2.3984375, 2.835693359375, 3.27294921875, 3.710205078125, 4.1474609375, 4.584716796875, 5.02197265625, 5.459228515625, 5.896484375, 6.333740234375, 6.77099609375, 7.208251953125, 7.6455078125, 8.082763671875, 8.52001953125, 8.957275390625, 9.39453125, 9.831787109375, 10.26904296875, 10.706298828125, 11.1435546875, 11.580810546875, 12.01806640625, 12.455322265625, 12.892578125, 13.329833984375, 13.76708984375, 14.204345703125, 14.6416015625, 15.078857421875, 15.51611328125, 15.953369140625, 16.390625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 11.0, 6.0, 9.0, 8.0, 15.0, 20.0, 9.0, 23.0, 14.0, 26.0, 35.0, 32.0, 44.0, 43.0, 51.0, 52.0, 64.0, 51.0, 58.0, 73.0, 59.0, 48.0, 45.0, 34.0, 32.0, 25.0, 28.0, 23.0, 14.0, 13.0, 6.0, 9.0, 10.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.4609375, -9.1080322265625, -8.755126953125, -8.4022216796875, -8.04931640625, -7.6964111328125, -7.343505859375, -6.9906005859375, -6.6376953125, -6.2847900390625, -5.931884765625, -5.5789794921875, -5.22607421875, -4.8731689453125, -4.520263671875, -4.1673583984375, -3.814453125, -3.4615478515625, -3.108642578125, -2.7557373046875, -2.40283203125, -2.0499267578125, -1.697021484375, -1.3441162109375, -0.9912109375, -0.6383056640625, -0.285400390625, 0.0675048828125, 0.42041015625, 0.7733154296875, 1.126220703125, 1.4791259765625, 1.83203125, 2.1849365234375, 2.537841796875, 2.8907470703125, 3.24365234375, 3.5965576171875, 3.949462890625, 4.3023681640625, 4.6552734375, 5.0081787109375, 5.361083984375, 5.7139892578125, 6.06689453125, 6.4197998046875, 6.772705078125, 7.1256103515625, 7.478515625, 7.8314208984375, 8.184326171875, 8.5372314453125, 8.89013671875, 9.2430419921875, 9.595947265625, 9.9488525390625, 10.3017578125, 10.6546630859375, 11.007568359375, 11.3604736328125, 11.71337890625, 12.0662841796875, 12.419189453125, 12.7720947265625, 13.125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 1.0, 6.0, 5.0, 16.0, 10.0, 16.0, 14.0, 25.0, 33.0, 40.0, 62.0, 82.0, 131.0, 224.0, 429.0, 878.0, 2317.0, 9592.0, 71477.0, 905174.0, 46613.0, 7307.0, 2195.0, 846.0, 384.0, 203.0, 130.0, 82.0, 64.0, 41.0, 37.0, 23.0, 21.0, 17.0, 11.0, 9.0, 5.0, 5.0, 4.0, 7.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.123046875, -16.44921875, -15.775390625, -15.1015625, -14.427734375, -13.75390625, -13.080078125, -12.40625, -11.732421875, -11.05859375, -10.384765625, -9.7109375, -9.037109375, -8.36328125, -7.689453125, -7.015625, -6.341796875, -5.66796875, -4.994140625, -4.3203125, -3.646484375, -2.97265625, -2.298828125, -1.625, -0.951171875, -0.27734375, 0.396484375, 1.0703125, 1.744140625, 2.41796875, 3.091796875, 3.765625, 4.439453125, 5.11328125, 5.787109375, 6.4609375, 7.134765625, 7.80859375, 8.482421875, 9.15625, 9.830078125, 10.50390625, 11.177734375, 11.8515625, 12.525390625, 13.19921875, 13.873046875, 14.546875, 15.220703125, 15.89453125, 16.568359375, 17.2421875, 17.916015625, 18.58984375, 19.263671875, 19.9375, 20.611328125, 21.28515625, 21.958984375, 22.6328125, 23.306640625, 23.98046875, 24.654296875, 25.328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 10.0, 12.0, 9.0, 10.0, 15.0, 12.0, 10.0, 21.0, 28.0, 23.0, 41.0, 23.0, 38.0, 48.0, 58.0, 65.0, 85.0, 56.0, 60.0, 61.0, 65.0, 29.0, 34.0, 28.0, 24.0, 21.0, 22.0, 19.0, 17.0, 9.0, 11.0, 8.0, 7.0, 6.0, 4.0, 7.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.90625, -34.69482421875, -33.4833984375, -32.27197265625, -31.060546875, -29.84912109375, -28.6376953125, -27.42626953125, -26.21484375, -25.00341796875, -23.7919921875, -22.58056640625, -21.369140625, -20.15771484375, -18.9462890625, -17.73486328125, -16.5234375, -15.31201171875, -14.1005859375, -12.88916015625, -11.677734375, -10.46630859375, -9.2548828125, -8.04345703125, -6.83203125, -5.62060546875, -4.4091796875, -3.19775390625, -1.986328125, -0.77490234375, 0.4365234375, 1.64794921875, 2.859375, 4.07080078125, 5.2822265625, 6.49365234375, 7.705078125, 8.91650390625, 10.1279296875, 11.33935546875, 12.55078125, 13.76220703125, 14.9736328125, 16.18505859375, 17.396484375, 18.60791015625, 19.8193359375, 21.03076171875, 22.2421875, 23.45361328125, 24.6650390625, 25.87646484375, 27.087890625, 28.29931640625, 29.5107421875, 30.72216796875, 31.93359375, 33.14501953125, 34.3564453125, 35.56787109375, 36.779296875, 37.99072265625, 39.2021484375, 40.41357421875, 41.625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 10.0, 14.0, 23.0, 43.0, 50.0, 87.0, 221.0, 505.0, 1766.0, 9391.0, 219244.0, 802680.0, 11290.0, 2042.0, 621.0, 246.0, 120.0, 55.0, 45.0, 32.0, 16.0, 13.0, 3.0, 6.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.578125, -7.325927734375, -7.07373046875, -6.821533203125, -6.5693359375, -6.317138671875, -6.06494140625, -5.812744140625, -5.560546875, -5.308349609375, -5.05615234375, -4.803955078125, -4.5517578125, -4.299560546875, -4.04736328125, -3.795166015625, -3.54296875, -3.290771484375, -3.03857421875, -2.786376953125, -2.5341796875, -2.281982421875, -2.02978515625, -1.777587890625, -1.525390625, -1.273193359375, -1.02099609375, -0.768798828125, -0.5166015625, -0.264404296875, -0.01220703125, 0.239990234375, 0.4921875, 0.744384765625, 0.99658203125, 1.248779296875, 1.5009765625, 1.753173828125, 2.00537109375, 2.257568359375, 2.509765625, 2.761962890625, 3.01416015625, 3.266357421875, 3.5185546875, 3.770751953125, 4.02294921875, 4.275146484375, 4.52734375, 4.779541015625, 5.03173828125, 5.283935546875, 5.5361328125, 5.788330078125, 6.04052734375, 6.292724609375, 6.544921875, 6.797119140625, 7.04931640625, 7.301513671875, 7.5537109375, 7.805908203125, 8.05810546875, 8.310302734375, 8.5625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 8.0, 7.0, 9.0, 8.0, 4.0, 12.0, 20.0, 37.0, 34.0, 52.0, 70.0, 118.0, 143.0, 152.0, 85.0, 66.0, 26.0, 26.0, 29.0, 22.0, 12.0, 10.0, 10.0, 7.0, 5.0, 5.0, 6.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00144195556640625, -0.0014003515243530273, -0.0013587474822998047, -0.001317143440246582, -0.0012755393981933594, -0.0012339353561401367, -0.001192331314086914, -0.0011507272720336914, -0.0011091232299804688, -0.001067519187927246, -0.0010259151458740234, -0.0009843111038208008, -0.0009427070617675781, -0.0009011030197143555, -0.0008594989776611328, -0.0008178949356079102, -0.0007762908935546875, -0.0007346868515014648, -0.0006930828094482422, -0.0006514787673950195, -0.0006098747253417969, -0.0005682706832885742, -0.0005266666412353516, -0.0004850625991821289, -0.00044345855712890625, -0.0004018545150756836, -0.00036025047302246094, -0.0003186464309692383, -0.0002770423889160156, -0.00023543834686279297, -0.0001938343048095703, -0.00015223026275634766, -0.000110626220703125, -6.902217864990234e-05, -2.7418136596679688e-05, 1.4185905456542969e-05, 5.5789947509765625e-05, 9.739398956298828e-05, 0.00013899803161621094, 0.0001806020736694336, 0.00022220611572265625, 0.0002638101577758789, 0.00030541419982910156, 0.0003470182418823242, 0.0003886222839355469, 0.00043022632598876953, 0.0004718303680419922, 0.0005134344100952148, 0.0005550384521484375, 0.0005966424942016602, 0.0006382465362548828, 0.0006798505783081055, 0.0007214546203613281, 0.0007630586624145508, 0.0008046627044677734, 0.0008462667465209961, 0.0008878707885742188, 0.0009294748306274414, 0.0009710788726806641, 0.0010126829147338867, 0.0010542869567871094, 0.001095890998840332, 0.0011374950408935547, 0.0011790990829467773, 0.001220703125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 6.0, 9.0, 6.0, 6.0, 13.0, 23.0, 27.0, 28.0, 46.0, 78.0, 125.0, 249.0, 399.0, 922.0, 2176.0, 5241.0, 16516.0, 77588.0, 861708.0, 60621.0, 14165.0, 4741.0, 2008.0, 824.0, 442.0, 205.0, 129.0, 83.0, 54.0, 34.0, 19.0, 18.0, 11.0, 4.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.17578125, -5.02099609375, -4.8662109375, -4.71142578125, -4.556640625, -4.40185546875, -4.2470703125, -4.09228515625, -3.9375, -3.78271484375, -3.6279296875, -3.47314453125, -3.318359375, -3.16357421875, -3.0087890625, -2.85400390625, -2.69921875, -2.54443359375, -2.3896484375, -2.23486328125, -2.080078125, -1.92529296875, -1.7705078125, -1.61572265625, -1.4609375, -1.30615234375, -1.1513671875, -0.99658203125, -0.841796875, -0.68701171875, -0.5322265625, -0.37744140625, -0.22265625, -0.06787109375, 0.0869140625, 0.24169921875, 0.396484375, 0.55126953125, 0.7060546875, 0.86083984375, 1.015625, 1.17041015625, 1.3251953125, 1.47998046875, 1.634765625, 1.78955078125, 1.9443359375, 2.09912109375, 2.25390625, 2.40869140625, 2.5634765625, 2.71826171875, 2.873046875, 3.02783203125, 3.1826171875, 3.33740234375, 3.4921875, 3.64697265625, 3.8017578125, 3.95654296875, 4.111328125, 4.26611328125, 4.4208984375, 4.57568359375, 4.73046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 10.0, 6.0, 5.0, 13.0, 9.0, 11.0, 15.0, 15.0, 24.0, 50.0, 58.0, 100.0, 144.0, 151.0, 123.0, 72.0, 46.0, 38.0, 26.0, 21.0, 13.0, 11.0, 13.0, 4.0, 2.0, 7.0, 7.0, 1.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.54217529296875, -5.3695068359375, -5.19683837890625, -5.024169921875, -4.85150146484375, -4.6788330078125, -4.50616455078125, -4.33349609375, -4.16082763671875, -3.9881591796875, -3.81549072265625, -3.642822265625, -3.47015380859375, -3.2974853515625, -3.12481689453125, -2.9521484375, -2.77947998046875, -2.6068115234375, -2.43414306640625, -2.261474609375, -2.08880615234375, -1.9161376953125, -1.74346923828125, -1.57080078125, -1.39813232421875, -1.2254638671875, -1.05279541015625, -0.880126953125, -0.70745849609375, -0.5347900390625, -0.36212158203125, -0.189453125, -0.01678466796875, 0.1558837890625, 0.32855224609375, 0.501220703125, 0.67388916015625, 0.8465576171875, 1.01922607421875, 1.19189453125, 1.36456298828125, 1.5372314453125, 1.70989990234375, 1.882568359375, 2.05523681640625, 2.2279052734375, 2.40057373046875, 2.5732421875, 2.74591064453125, 2.9185791015625, 3.09124755859375, 3.263916015625, 3.43658447265625, 3.6092529296875, 3.78192138671875, 3.95458984375, 4.12725830078125, 4.2999267578125, 4.47259521484375, 4.645263671875, 4.81793212890625, 4.9906005859375, 5.16326904296875, 5.3359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 11.0, 5.0, 7.0, 15.0, 29.0, 63.0, 140.0, 479.0, 145.0, 60.0, 24.0, 16.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-337.5830383300781, -330.62945556640625, -323.6759033203125, -316.7223205566406, -309.76873779296875, -302.815185546875, -295.8616027832031, -288.9080505371094, -281.9544677734375, -275.0008850097656, -268.0473327636719, -261.09375, -254.1401824951172, -247.18661499023438, -240.2330322265625, -233.2794647216797, -226.32589721679688, -219.37232971191406, -212.41876220703125, -205.46517944335938, -198.51161193847656, -191.55804443359375, -184.60446166992188, -177.65089416503906, -170.69732666015625, -163.74375915527344, -156.79019165039062, -149.83660888671875, -142.88304138183594, -135.92947387695312, -128.97589111328125, -122.02232360839844, -115.06875610351562, -108.11518859863281, -101.16161346435547, -94.20803833007812, -87.25447082519531, -80.3009033203125, -73.34732818603516, -66.39375305175781, -59.440185546875, -52.48661422729492, -45.533042907714844, -38.579471588134766, -31.625900268554688, -24.67232894897461, -17.71875762939453, -10.765186309814453, -3.811614990234375, 3.141956329345703, 10.095527648925781, 17.04909896850586, 24.002670288085938, 30.956241607666016, 37.909812927246094, 44.86338424682617, 51.81695556640625, 58.77052688598633, 65.7240982055664, 72.67767333984375, 79.63124084472656, 86.58480834960938, 93.53838348388672, 100.49195861816406, 107.44552612304688]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 4.0, 5.0, 14.0, 11.0, 12.0, 13.0, 17.0, 20.0, 18.0, 24.0, 26.0, 27.0, 27.0, 71.0, 155.0, 152.0, 150.0, 63.0, 28.0, 21.0, 24.0, 18.0, 24.0, 17.0, 10.0, 8.0, 5.0, 6.0, 10.0, 3.0, 0.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.55050659179688, -150.90188598632812, -146.25326538085938, -141.60464477539062, -136.95602416992188, -132.3074188232422, -127.65879821777344, -123.01017761230469, -118.36155700683594, -113.71293640136719, -109.06431579589844, -104.41570281982422, -99.76708221435547, -95.11846160888672, -90.4698486328125, -85.82122802734375, -81.172607421875, -76.52398681640625, -71.8753662109375, -67.22675323486328, -62.57813262939453, -57.92951202392578, -53.2808952331543, -48.63227844238281, -43.98365783691406, -39.33503723144531, -34.68642044067383, -30.03780174255371, -25.389183044433594, -20.740564346313477, -16.09194564819336, -11.443328857421875, -6.7947235107421875, -2.1461048126220703, 2.502513885498047, 7.151132583618164, 11.799751281738281, 16.4483699798584, 21.096988677978516, 25.74560546875, 30.39422607421875, 35.0428466796875, 39.691463470458984, 44.34008026123047, 48.98870086669922, 53.63732147216797, 58.28593826293945, 62.93455505371094, 67.58317565917969, 72.23179626464844, 76.88041687011719, 81.5290298461914, 86.17765045166016, 90.8262710571289, 95.47488403320312, 100.12350463867188, 104.77212524414062, 109.42074584960938, 114.06936645507812, 118.71797943115234, 123.3666000366211, 128.0152130126953, 132.66383361816406, 137.3124542236328, 141.96107482910156]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 5.0, 4.0, 7.0, 11.0, 12.0, 10.0, 19.0, 21.0, 22.0, 26.0, 33.0, 38.0, 77.0, 93.0, 232.0, 101.0, 54.0, 32.0, 45.0, 30.0, 14.0, 24.0, 16.0, 10.0, 16.0, 14.0, 6.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.7265625, -13.339599609375, -12.95263671875, -12.565673828125, -12.1787109375, -11.791748046875, -11.40478515625, -11.017822265625, -10.630859375, -10.243896484375, -9.85693359375, -9.469970703125, -9.0830078125, -8.696044921875, -8.30908203125, -7.922119140625, -7.53515625, -7.148193359375, -6.76123046875, -6.374267578125, -5.9873046875, -5.600341796875, -5.21337890625, -4.826416015625, -4.439453125, -4.052490234375, -3.66552734375, -3.278564453125, -2.8916015625, -2.504638671875, -2.11767578125, -1.730712890625, -1.34375, -0.956787109375, -0.56982421875, -0.182861328125, 0.2041015625, 0.591064453125, 0.97802734375, 1.364990234375, 1.751953125, 2.138916015625, 2.52587890625, 2.912841796875, 3.2998046875, 3.686767578125, 4.07373046875, 4.460693359375, 4.84765625, 5.234619140625, 5.62158203125, 6.008544921875, 6.3955078125, 6.782470703125, 7.16943359375, 7.556396484375, 7.943359375, 8.330322265625, 8.71728515625, 9.104248046875, 9.4912109375, 9.878173828125, 10.26513671875, 10.652099609375, 11.0390625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 3.0, 8.0, 7.0, 8.0, 12.0, 24.0, 29.0, 44.0, 50.0, 108.0, 180.0, 435.0, 1215.0, 5146.0, 178441.0, 8193976.0, 6530.0, 1433.0, 469.0, 202.0, 87.0, 59.0, 39.0, 23.0, 13.0, 9.0, 7.0, 11.0, 13.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.58132934570312, -64.77389526367188, -61.966461181640625, -59.15903091430664, -56.35159683227539, -53.54416275024414, -50.736732482910156, -47.929298400878906, -45.121864318847656, -42.314430236816406, -39.506996154785156, -36.69956588745117, -33.89213180541992, -31.084697723388672, -28.277265548706055, -25.469833374023438, -22.662399291992188, -19.854965209960938, -17.04753303527832, -14.240099906921387, -11.432666778564453, -8.62523365020752, -5.817800521850586, -3.0103683471679688, -0.20293426513671875, 2.604498863220215, 5.411931991577148, 8.219365119934082, 11.026798248291016, 13.83423137664795, 16.641664505004883, 19.4490966796875, 22.25652313232422, 25.06395721435547, 27.871389389038086, 30.678821563720703, 33.48625564575195, 36.2936897277832, 39.10111999511719, 41.90855407714844, 44.71598815917969, 47.52342224121094, 50.33085632324219, 53.13828659057617, 55.94572067260742, 58.75315475463867, 61.560585021972656, 64.3680191040039, 67.17545318603516, 69.9828872680664, 72.79032135009766, 75.5977554321289, 78.40518188476562, 81.21261596679688, 84.02005004882812, 86.82748413085938, 89.63491821289062, 92.44235229492188, 95.24978637695312, 98.05722045898438, 100.86465454101562, 103.67208099365234, 106.4795150756836, 109.28694915771484, 112.0943832397461]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 6.0, 1.0, 3.0, 4.0, 8.0, 7.0, 6.0, 8.0, 5.0, 4.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-120.12277221679688, -117.27487182617188, -114.42697143554688, -111.57906341552734, -108.73116302490234, -105.88326263427734, -103.03535461425781, -100.18745422363281, -97.33955383300781, -94.49165344238281, -91.64375305175781, -88.79584503173828, -85.94794464111328, -83.10004425048828, -80.25213623046875, -77.40423583984375, -74.55633544921875, -71.70843505859375, -68.86053466796875, -66.01262664794922, -63.16472625732422, -60.31682586669922, -57.46892166137695, -54.62101745605469, -51.77311706542969, -48.92521667480469, -46.07731246948242, -43.229408264160156, -40.381507873535156, -37.533607482910156, -34.68570327758789, -31.837800979614258, -28.98989486694336, -26.141992568969727, -23.294090270996094, -20.44618797302246, -17.598285675048828, -14.750383377075195, -11.902481079101562, -9.05457878112793, -6.206676483154297, -3.358774185180664, -0.5108718872070312, 2.3370304107666016, 5.184932708740234, 8.032835006713867, 10.8807373046875, 13.728639602661133, 16.576541900634766, 19.4244441986084, 22.27234649658203, 25.120248794555664, 27.968151092529297, 30.81605339050293, 33.66395568847656, 36.51185607910156, 39.35976028442383, 42.207664489746094, 45.055564880371094, 47.903465270996094, 50.75136947631836, 53.599273681640625, 56.447174072265625, 59.295074462890625, 62.14297866821289]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 4.0, 7.0, 7.0, 3.0, 5.0, 6.0, 7.0, 9.0, 19.0, 18.0, 28.0, 27.0, 34.0, 54.0, 52.0, 83.0, 69.0, 76.0, 54.0, 55.0, 82.0, 46.0, 60.0, 47.0, 36.0, 24.0, 18.0, 19.0, 12.0, 10.0, 11.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.6484375, -7.41259765625, -7.1767578125, -6.94091796875, -6.705078125, -6.46923828125, -6.2333984375, -5.99755859375, -5.76171875, -5.52587890625, -5.2900390625, -5.05419921875, -4.818359375, -4.58251953125, -4.3466796875, -4.11083984375, -3.875, -3.63916015625, -3.4033203125, -3.16748046875, -2.931640625, -2.69580078125, -2.4599609375, -2.22412109375, -1.98828125, -1.75244140625, -1.5166015625, -1.28076171875, -1.044921875, -0.80908203125, -0.5732421875, -0.33740234375, -0.1015625, 0.13427734375, 0.3701171875, 0.60595703125, 0.841796875, 1.07763671875, 1.3134765625, 1.54931640625, 1.78515625, 2.02099609375, 2.2568359375, 2.49267578125, 2.728515625, 2.96435546875, 3.2001953125, 3.43603515625, 3.671875, 3.90771484375, 4.1435546875, 4.37939453125, 4.615234375, 4.85107421875, 5.0869140625, 5.32275390625, 5.55859375, 5.79443359375, 6.0302734375, 6.26611328125, 6.501953125, 6.73779296875, 6.9736328125, 7.20947265625, 7.4453125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 8.0, 8.0, 14.0, 30.0, 31.0, 53.0, 90.0, 144.0, 227.0, 446.0, 877.0, 1805.0, 4496.0, 12148.0, 40321.0, 152685.0, 215558.0, 65269.0, 18960.0, 6450.0, 2560.0, 1056.0, 451.0, 258.0, 130.0, 71.0, 31.0, 23.0, 13.0, 7.0, 14.0, 6.0, 4.0, 8.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-84.75, -82.1953125, -79.640625, -77.0859375, -74.53125, -71.9765625, -69.421875, -66.8671875, -64.3125, -61.7578125, -59.203125, -56.6484375, -54.09375, -51.5390625, -48.984375, -46.4296875, -43.875, -41.3203125, -38.765625, -36.2109375, -33.65625, -31.1015625, -28.546875, -25.9921875, -23.4375, -20.8828125, -18.328125, -15.7734375, -13.21875, -10.6640625, -8.109375, -5.5546875, -3.0, -0.4453125, 2.109375, 4.6640625, 7.21875, 9.7734375, 12.328125, 14.8828125, 17.4375, 19.9921875, 22.546875, 25.1015625, 27.65625, 30.2109375, 32.765625, 35.3203125, 37.875, 40.4296875, 42.984375, 45.5390625, 48.09375, 50.6484375, 53.203125, 55.7578125, 58.3125, 60.8671875, 63.421875, 65.9765625, 68.53125, 71.0859375, 73.640625, 76.1953125, 78.75]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 9.0, 0.0, 3.0, 7.0, 13.0, 6.0, 7.0, 7.0, 14.0, 19.0, 18.0, 20.0, 29.0, 49.0, 32.0, 46.0, 44.0, 56.0, 100.0, 79.0, 60.0, 58.0, 60.0, 45.0, 51.0, 31.0, 25.0, 20.0, 26.0, 11.0, 12.0, 14.0, 6.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.078125, -10.7532958984375, -10.428466796875, -10.1036376953125, -9.77880859375, -9.4539794921875, -9.129150390625, -8.8043212890625, -8.4794921875, -8.1546630859375, -7.829833984375, -7.5050048828125, -7.18017578125, -6.8553466796875, -6.530517578125, -6.2056884765625, -5.880859375, -5.5560302734375, -5.231201171875, -4.9063720703125, -4.58154296875, -4.2567138671875, -3.931884765625, -3.6070556640625, -3.2822265625, -2.9573974609375, -2.632568359375, -2.3077392578125, -1.98291015625, -1.6580810546875, -1.333251953125, -1.0084228515625, -0.68359375, -0.3587646484375, -0.033935546875, 0.2908935546875, 0.61572265625, 0.9405517578125, 1.265380859375, 1.5902099609375, 1.9150390625, 2.2398681640625, 2.564697265625, 2.8895263671875, 3.21435546875, 3.5391845703125, 3.864013671875, 4.1888427734375, 4.513671875, 4.8385009765625, 5.163330078125, 5.4881591796875, 5.81298828125, 6.1378173828125, 6.462646484375, 6.7874755859375, 7.1123046875, 7.4371337890625, 7.761962890625, 8.0867919921875, 8.41162109375, 8.7364501953125, 9.061279296875, 9.3861083984375, 9.7109375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 22.0, 36.0, 78.0, 120.0, 91.0, 43.0, 29.0, 15.0, 6.0, 12.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.23785400390625, -137.8482208251953, -134.4585723876953, -131.06893920898438, -127.6792984008789, -124.28966522216797, -120.9000244140625, -117.51039123535156, -114.1207504272461, -110.73110961914062, -107.34147644042969, -103.95183563232422, -100.56219482421875, -97.17256164550781, -93.78292083740234, -90.39328002929688, -87.00364685058594, -83.61400604248047, -80.22437286376953, -76.83473205566406, -73.4450912475586, -70.05545806884766, -66.66581726074219, -63.276180267333984, -59.88653564453125, -56.49689865112305, -53.10725784301758, -49.717620849609375, -46.32798385620117, -42.93834686279297, -39.5487060546875, -36.1590690612793, -32.769432067871094, -29.379793167114258, -25.990156173706055, -22.60051727294922, -19.210880279541016, -15.82124137878418, -12.431602478027344, -9.04196548461914, -5.652326583862305, -2.262688398361206, 1.1269497871398926, 4.51658821105957, 7.90622615814209, 11.29586410522461, 14.685503005981445, 18.07513999938965, 21.464778900146484, 24.85441780090332, 28.244054794311523, 31.63369369506836, 35.02333068847656, 38.41297149658203, 41.802608489990234, 45.19224548339844, 48.581886291503906, 51.97152328491211, 55.36116409301758, 58.75080108642578, 62.140438079833984, 65.53007507324219, 68.91971588134766, 72.30935668945312, 75.69898986816406]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 3.0, 6.0, 11.0, 14.0, 49.0, 87.0, 114.0, 78.0, 35.0, 15.0, 6.0, 8.0, 5.0, 6.0, 7.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.50379180908203, -52.434173583984375, -50.364559173583984, -48.294944763183594, -46.22532653808594, -44.15570831298828, -42.08609390258789, -40.0164794921875, -37.946861267089844, -35.87724304199219, -33.8076286315918, -31.738012313842773, -29.66839599609375, -27.598779678344727, -25.529163360595703, -23.45954704284668, -21.389930725097656, -19.320314407348633, -17.25069808959961, -15.181081771850586, -13.111465454101562, -11.041849136352539, -8.972232818603516, -6.902616500854492, -4.833000183105469, -2.7633838653564453, -0.6937675476074219, 1.3758487701416016, 3.445465087890625, 5.515081405639648, 7.584697723388672, 9.654314041137695, 11.723922729492188, 13.793539047241211, 15.863155364990234, 17.932771682739258, 20.00238800048828, 22.072004318237305, 24.141620635986328, 26.21123695373535, 28.280853271484375, 30.3504695892334, 32.42008590698242, 34.48970031738281, 36.55931854248047, 38.628936767578125, 40.698551177978516, 42.768165588378906, 44.83778381347656, 46.90740203857422, 48.97701644897461, 51.046630859375, 53.116249084472656, 55.18586730957031, 57.2554817199707, 59.325096130371094, 61.39471435546875, 63.464332580566406, 65.53395080566406, 67.60356140136719, 69.67317962646484, 71.7427978515625, 73.81240844726562, 75.88202667236328, 77.95164489746094]}, "eval/loss": 0.7765135765075684, "eval/wer": 0.13639428798095993, "eval/runtime": 828.6657, "eval/samples_per_second": 3.188, "eval/steps_per_second": 0.399} \ No newline at end of file