diff --git "a/wandb/run-20220308_102248-3h7e1p8o/files/wandb-summary.json" "b/wandb/run-20220308_102248-3h7e1p8o/files/wandb-summary.json" --- "a/wandb/run-20220308_102248-3h7e1p8o/files/wandb-summary.json" +++ "b/wandb/run-20220308_102248-3h7e1p8o/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 5.642, "train/learning_rate": 1.2667630057803469e-05, "train/epoch": 13.45, "train/global_step": 3000, "_runtime": 56607, "_timestamp": 1646791575, "_step": 3001, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 38.0, 354.0, 29994.0, 110.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.9375, -95.0322265625, -86.126953125, -77.2216796875, -68.31640625, -59.4111328125, -50.505859375, -41.6005859375, -32.6953125, -23.7900390625, -14.884765625, -5.9794921875, 2.92578125, 11.8310546875, 20.736328125, 29.6416015625, 38.546875, 47.4521484375, 56.357421875, 65.2626953125, 74.16796875, 83.0732421875, 91.978515625, 100.8837890625, 109.7890625, 118.6943359375, 127.599609375, 136.5048828125, 145.41015625, 154.3154296875, 163.220703125, 172.1259765625, 181.03125, 189.9365234375, 198.841796875, 207.7470703125, 216.65234375, 225.5576171875, 234.462890625, 243.3681640625, 252.2734375, 261.1787109375, 270.083984375, 278.9892578125, 287.89453125, 296.7998046875, 305.705078125, 314.6103515625, 323.515625, 332.4208984375, 341.326171875, 350.2314453125, 359.13671875, 368.0419921875, 376.947265625, 385.8525390625, 394.7578125, 403.6630859375, 412.568359375, 421.4736328125, 430.37890625, 439.2841796875, 448.189453125, 457.0947265625, 466.0]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 13.0, 11.0, 26.0, 22.0, 33.0, 28.0, 41.0, 53.0, 60.0, 61.0, 63.0, 60.0, 57.0, 58.0, 58.0, 51.0, 40.0, 35.0, 43.0, 30.0, 33.0, 23.0, 17.0, 14.0, 12.0, 7.0, 12.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.668701171875, -39.467994689941406, -38.26728439331055, -37.06657791137695, -35.865867614746094, -34.6651611328125, -33.464454650878906, -32.26374816894531, -31.063037872314453, -29.862329483032227, -28.66162109375, -27.460914611816406, -26.26020622253418, -25.059497833251953, -23.85879135131836, -22.658082962036133, -21.457374572753906, -20.25666618347168, -19.055957794189453, -17.85525131225586, -16.654542922973633, -15.453834533691406, -14.253127098083496, -13.052419662475586, -11.85171127319336, -10.651002883911133, -9.450295448303223, -8.249588012695312, -7.048879623413086, -5.848171710968018, -4.647463798522949, -3.446756362915039, -2.246044158935547, -1.0453362464904785, 0.15537166595458984, 1.3560795783996582, 2.5567874908447266, 3.757495403289795, 4.958203315734863, 6.158910751342773, 7.359619140625, 8.560327529907227, 9.761034965515137, 10.961742401123047, 12.162450790405273, 13.3631591796875, 14.56386661529541, 15.76457405090332, 16.965282440185547, 18.165990829467773, 19.36669921875, 20.567405700683594, 21.76811408996582, 22.968822479248047, 24.16952896118164, 25.370237350463867, 26.570945739746094, 27.77165412902832, 28.972362518310547, 30.17306900024414, 31.373777389526367, 32.574485778808594, 33.77519226074219, 34.97589874267578, 36.17660903930664]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 7.0, 7.0, 11.0, 13.0, 17.0, 11.0, 11.0, 20.0, 30.0, 28.0, 29.0, 29.0, 27.0, 33.0, 30.0, 41.0, 33.0, 39.0, 44.0, 31.0, 36.0, 36.0, 41.0, 43.0, 44.0, 43.0, 35.0, 30.0, 22.0, 27.0, 17.0, 23.0, 14.0, 14.0, 9.0, 18.0, 12.0, 9.0, 6.0, 3.0, 7.0, 6.0, 0.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.953468322753906, -34.76715087890625, -33.58082962036133, -32.39451217651367, -31.20819091796875, -30.02187156677246, -28.835552215576172, -27.649234771728516, -26.462913513183594, -25.276594161987305, -24.090274810791016, -22.903955459594727, -21.717636108398438, -20.53131675720215, -19.34499740600586, -18.158679962158203, -16.972360610961914, -15.786041259765625, -14.599721908569336, -13.413402557373047, -12.227083206176758, -11.040763854980469, -9.854445457458496, -8.668126106262207, -7.481806755065918, -6.295487403869629, -5.10916805267334, -3.922849178314209, -2.73652982711792, -1.5502104759216309, -0.3638916015625, 0.8224277496337891, 2.008747100830078, 3.195066452026367, 4.381385803222656, 5.567704677581787, 6.754024028778076, 7.940343379974365, 9.126662254333496, 10.312981605529785, 11.499300956726074, 12.685620307922363, 13.871939659118652, 15.058258056640625, 16.244577407836914, 17.430896759033203, 18.617216110229492, 19.80353546142578, 20.98985481262207, 22.17617416381836, 23.36249351501465, 24.548812866210938, 25.735132217407227, 26.921451568603516, 28.107769012451172, 29.294090270996094, 30.48040771484375, 31.66672706604004, 32.85304641723633, 34.039363861083984, 35.225685119628906, 36.41200256347656, 37.598323822021484, 38.78464126586914, 39.97096252441406]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 10.0, 14.0, 12.0, 14.0, 40.0, 55.0, 85.0, 104.0, 179.0, 306.0, 404.0, 649.0, 1042.0, 1655.0, 2620.0, 4007.0, 6191.0, 9622.0, 14835.0, 22602.0, 33991.0, 49528.0, 69993.0, 96479.0, 126708.0, 152008.0, 129982.0, 98737.0, 72483.0, 51437.0, 35140.0, 23750.0, 15604.0, 10132.0, 6592.0, 4195.0, 2650.0, 1673.0, 1045.0, 693.0, 465.0, 290.0, 221.0, 104.0, 74.0, 43.0, 37.0, 19.0, 17.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-88.8125, -86.083984375, -83.35546875, -80.626953125, -77.8984375, -75.169921875, -72.44140625, -69.712890625, -66.984375, -64.255859375, -61.52734375, -58.798828125, -56.0703125, -53.341796875, -50.61328125, -47.884765625, -45.15625, -42.427734375, -39.69921875, -36.970703125, -34.2421875, -31.513671875, -28.78515625, -26.056640625, -23.328125, -20.599609375, -17.87109375, -15.142578125, -12.4140625, -9.685546875, -6.95703125, -4.228515625, -1.5, 1.228515625, 3.95703125, 6.685546875, 9.4140625, 12.142578125, 14.87109375, 17.599609375, 20.328125, 23.056640625, 25.78515625, 28.513671875, 31.2421875, 33.970703125, 36.69921875, 39.427734375, 42.15625, 44.884765625, 47.61328125, 50.341796875, 53.0703125, 55.798828125, 58.52734375, 61.255859375, 63.984375, 66.712890625, 69.44140625, 72.169921875, 74.8984375, 77.626953125, 80.35546875, 83.083984375, 85.8125]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 4.0, 9.0, 5.0, 11.0, 13.0, 9.0, 11.0, 11.0, 27.0, 18.0, 21.0, 27.0, 24.0, 20.0, 37.0, 32.0, 40.0, 45.0, 44.0, 47.0, 56.0, 62.0, 48.0, 49.0, 38.0, 44.0, 37.0, 24.0, 25.0, 17.0, 27.0, 21.0, 13.0, 16.0, 14.0, 11.0, 12.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-51.5625, -49.97119140625, -48.3798828125, -46.78857421875, -45.197265625, -43.60595703125, -42.0146484375, -40.42333984375, -38.83203125, -37.24072265625, -35.6494140625, -34.05810546875, -32.466796875, -30.87548828125, -29.2841796875, -27.69287109375, -26.1015625, -24.51025390625, -22.9189453125, -21.32763671875, -19.736328125, -18.14501953125, -16.5537109375, -14.96240234375, -13.37109375, -11.77978515625, -10.1884765625, -8.59716796875, -7.005859375, -5.41455078125, -3.8232421875, -2.23193359375, -0.640625, 0.95068359375, 2.5419921875, 4.13330078125, 5.724609375, 7.31591796875, 8.9072265625, 10.49853515625, 12.08984375, 13.68115234375, 15.2724609375, 16.86376953125, 18.455078125, 20.04638671875, 21.6376953125, 23.22900390625, 24.8203125, 26.41162109375, 28.0029296875, 29.59423828125, 31.185546875, 32.77685546875, 34.3681640625, 35.95947265625, 37.55078125, 39.14208984375, 40.7333984375, 42.32470703125, 43.916015625, 45.50732421875, 47.0986328125, 48.68994140625, 50.28125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 5.0, 10.0, 10.0, 12.0, 17.0, 20.0, 22.0, 30.0, 35.0, 36.0, 48.0, 42.0, 41.0, 45.0, 48.0, 52.0, 57.0, 40.0, 41.0, 39.0, 39.0, 28.0, 47.0, 38.0, 27.0, 16.0, 19.0, 27.0, 18.0, 16.0, 10.0, 11.0, 11.0, 4.0, 6.0, 8.0, 7.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-25.643905639648438, -24.86617660522461, -24.08844757080078, -23.31071662902832, -22.532987594604492, -21.755258560180664, -20.977529525756836, -20.199798583984375, -19.422069549560547, -18.64434051513672, -17.86661148071289, -17.08888053894043, -16.3111515045166, -15.533422470092773, -14.755693435668945, -13.9779634475708, -13.200234413146973, -12.422505378723145, -11.644775390625, -10.867046356201172, -10.089316368103027, -9.3115873336792, -8.533857345581055, -7.756128311157227, -6.97839879989624, -6.200669288635254, -5.422939777374268, -4.645210266113281, -3.867480993270874, -3.0897514820098877, -2.3120222091674805, -1.5342926979064941, -0.7565631866455078, 0.02116626501083374, 0.7988957166671753, 1.576625108718872, 2.3543546199798584, 3.1320841312408447, 3.909813404083252, 4.687542915344238, 5.465272426605225, 6.243001937866211, 7.020731449127197, 7.798460960388184, 8.576189994812012, 9.353919982910156, 10.131649017333984, 10.909378051757812, 11.687108039855957, 12.464837074279785, 13.24256706237793, 14.020296096801758, 14.798026084899902, 15.57575511932373, 16.353485107421875, 17.131214141845703, 17.90894317626953, 18.68667221069336, 19.464401245117188, 20.24213218688965, 21.019861221313477, 21.797590255737305, 22.575319290161133, 23.353050231933594, 24.130779266357422]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 5.0, 2.0, 10.0, 8.0, 12.0, 16.0, 17.0, 23.0, 16.0, 25.0, 29.0, 18.0, 35.0, 27.0, 41.0, 56.0, 46.0, 35.0, 36.0, 40.0, 41.0, 36.0, 50.0, 51.0, 47.0, 27.0, 35.0, 23.0, 22.0, 20.0, 28.0, 20.0, 14.0, 15.0, 10.0, 11.0, 8.0, 12.0, 9.0, 3.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-38.28187561035156, -37.19178771972656, -36.10169982910156, -35.01161575317383, -33.92152786254883, -32.83143997192383, -31.741352081298828, -30.65126609802246, -29.561180114746094, -28.471092224121094, -27.381006240844727, -26.290918350219727, -25.20083236694336, -24.11074447631836, -23.02065658569336, -21.930570602416992, -20.840482711791992, -19.750394821166992, -18.660308837890625, -17.570220947265625, -16.480134963989258, -15.390047073364258, -14.299960136413574, -13.20987319946289, -12.119786262512207, -11.029699325561523, -9.93961238861084, -8.849525451660156, -7.7594380378723145, -6.669351100921631, -5.579263687133789, -4.4891767501831055, -3.3990917205810547, -2.309004783630371, -1.2189176082611084, -0.1288304328918457, 0.9612565040588379, 2.0513434410095215, 3.1414308547973633, 4.231517791748047, 5.3216047286987305, 6.411691665649414, 7.501778602600098, 8.591865539550781, 9.681953430175781, 10.772039413452148, 11.862127304077148, 12.952214241027832, 14.042301177978516, 15.1323881149292, 16.222475051879883, 17.312562942504883, 18.40264892578125, 19.49273681640625, 20.58282470703125, 21.672910690307617, 22.762996673583984, 23.853084564208984, 24.94317054748535, 26.03325843811035, 27.12334442138672, 28.21343231201172, 29.30352020263672, 30.393606185913086, 31.483694076538086]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 11.0, 7.0, 8.0, 17.0, 28.0, 46.0, 80.0, 115.0, 229.0, 360.0, 692.0, 1462.0, 2774.0, 5707.0, 11383.0, 23953.0, 50198.0, 105267.0, 214963.0, 408883.0, 664621.0, 835979.0, 766686.0, 522347.0, 292453.0, 148352.0, 71726.0, 34223.0, 16139.0, 7837.0, 3774.0, 1886.0, 978.0, 450.0, 274.0, 134.0, 92.0, 57.0, 29.0, 21.0, 15.0, 8.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.9375, -32.83349609375, -31.7294921875, -30.62548828125, -29.521484375, -28.41748046875, -27.3134765625, -26.20947265625, -25.10546875, -24.00146484375, -22.8974609375, -21.79345703125, -20.689453125, -19.58544921875, -18.4814453125, -17.37744140625, -16.2734375, -15.16943359375, -14.0654296875, -12.96142578125, -11.857421875, -10.75341796875, -9.6494140625, -8.54541015625, -7.44140625, -6.33740234375, -5.2333984375, -4.12939453125, -3.025390625, -1.92138671875, -0.8173828125, 0.28662109375, 1.390625, 2.49462890625, 3.5986328125, 4.70263671875, 5.806640625, 6.91064453125, 8.0146484375, 9.11865234375, 10.22265625, 11.32666015625, 12.4306640625, 13.53466796875, 14.638671875, 15.74267578125, 16.8466796875, 17.95068359375, 19.0546875, 20.15869140625, 21.2626953125, 22.36669921875, 23.470703125, 24.57470703125, 25.6787109375, 26.78271484375, 27.88671875, 28.99072265625, 30.0947265625, 31.19873046875, 32.302734375, 33.40673828125, 34.5107421875, 35.61474609375, 36.71875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 2.0, 10.0, 9.0, 4.0, 14.0, 13.0, 12.0, 23.0, 22.0, 23.0, 14.0, 29.0, 35.0, 33.0, 42.0, 44.0, 37.0, 49.0, 52.0, 37.0, 38.0, 42.0, 56.0, 43.0, 40.0, 30.0, 34.0, 25.0, 23.0, 26.0, 21.0, 18.0, 18.0, 18.0, 15.0, 5.0, 14.0, 7.0, 9.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-34.03125, -33.08251953125, -32.1337890625, -31.18505859375, -30.236328125, -29.28759765625, -28.3388671875, -27.39013671875, -26.44140625, -25.49267578125, -24.5439453125, -23.59521484375, -22.646484375, -21.69775390625, -20.7490234375, -19.80029296875, -18.8515625, -17.90283203125, -16.9541015625, -16.00537109375, -15.056640625, -14.10791015625, -13.1591796875, -12.21044921875, -11.26171875, -10.31298828125, -9.3642578125, -8.41552734375, -7.466796875, -6.51806640625, -5.5693359375, -4.62060546875, -3.671875, -2.72314453125, -1.7744140625, -0.82568359375, 0.123046875, 1.07177734375, 2.0205078125, 2.96923828125, 3.91796875, 4.86669921875, 5.8154296875, 6.76416015625, 7.712890625, 8.66162109375, 9.6103515625, 10.55908203125, 11.5078125, 12.45654296875, 13.4052734375, 14.35400390625, 15.302734375, 16.25146484375, 17.2001953125, 18.14892578125, 19.09765625, 20.04638671875, 20.9951171875, 21.94384765625, 22.892578125, 23.84130859375, 24.7900390625, 25.73876953125, 26.6875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 8.0, 14.0, 13.0, 19.0, 30.0, 42.0, 68.0, 130.0, 177.0, 414.0, 800.0, 1664.0, 3446.0, 7621.0, 17480.0, 40305.0, 94239.0, 207850.0, 409516.0, 669369.0, 844058.0, 786207.0, 548998.0, 304049.0, 144888.0, 64047.0, 27249.0, 11692.0, 5197.0, 2343.0, 1116.0, 562.0, 292.0, 135.0, 94.0, 47.0, 34.0, 19.0, 13.0, 14.0, 5.0, 3.0, 2.0, 5.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.28125, -37.076171875, -35.87109375, -34.666015625, -33.4609375, -32.255859375, -31.05078125, -29.845703125, -28.640625, -27.435546875, -26.23046875, -25.025390625, -23.8203125, -22.615234375, -21.41015625, -20.205078125, -19.0, -17.794921875, -16.58984375, -15.384765625, -14.1796875, -12.974609375, -11.76953125, -10.564453125, -9.359375, -8.154296875, -6.94921875, -5.744140625, -4.5390625, -3.333984375, -2.12890625, -0.923828125, 0.28125, 1.486328125, 2.69140625, 3.896484375, 5.1015625, 6.306640625, 7.51171875, 8.716796875, 9.921875, 11.126953125, 12.33203125, 13.537109375, 14.7421875, 15.947265625, 17.15234375, 18.357421875, 19.5625, 20.767578125, 21.97265625, 23.177734375, 24.3828125, 25.587890625, 26.79296875, 27.998046875, 29.203125, 30.408203125, 31.61328125, 32.818359375, 34.0234375, 35.228515625, 36.43359375, 37.638671875, 38.84375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 4.0, 6.0, 8.0, 9.0, 23.0, 17.0, 34.0, 43.0, 58.0, 55.0, 66.0, 102.0, 125.0, 153.0, 182.0, 190.0, 236.0, 259.0, 233.0, 274.0, 252.0, 228.0, 250.0, 224.0, 184.0, 168.0, 155.0, 122.0, 99.0, 72.0, 67.0, 39.0, 45.0, 29.0, 16.0, 14.0, 8.0, 5.0, 9.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-21.4375, -20.8759765625, -20.314453125, -19.7529296875, -19.19140625, -18.6298828125, -18.068359375, -17.5068359375, -16.9453125, -16.3837890625, -15.822265625, -15.2607421875, -14.69921875, -14.1376953125, -13.576171875, -13.0146484375, -12.453125, -11.8916015625, -11.330078125, -10.7685546875, -10.20703125, -9.6455078125, -9.083984375, -8.5224609375, -7.9609375, -7.3994140625, -6.837890625, -6.2763671875, -5.71484375, -5.1533203125, -4.591796875, -4.0302734375, -3.46875, -2.9072265625, -2.345703125, -1.7841796875, -1.22265625, -0.6611328125, -0.099609375, 0.4619140625, 1.0234375, 1.5849609375, 2.146484375, 2.7080078125, 3.26953125, 3.8310546875, 4.392578125, 4.9541015625, 5.515625, 6.0771484375, 6.638671875, 7.2001953125, 7.76171875, 8.3232421875, 8.884765625, 9.4462890625, 10.0078125, 10.5693359375, 11.130859375, 11.6923828125, 12.25390625, 12.8154296875, 13.376953125, 13.9384765625, 14.5]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 14.0, 4.0, 12.0, 17.0, 14.0, 29.0, 20.0, 29.0, 23.0, 36.0, 38.0, 58.0, 63.0, 57.0, 55.0, 61.0, 49.0, 55.0, 49.0, 41.0, 33.0, 29.0, 34.0, 22.0, 20.0, 17.0, 18.0, 16.0, 13.0, 13.0, 14.0, 8.0, 6.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.28201675415039, -23.386783599853516, -22.491552352905273, -21.5963191986084, -20.701086044311523, -19.80585479736328, -18.910621643066406, -18.01538848876953, -17.12015724182129, -16.224924087524414, -15.329691886901855, -14.434459686279297, -13.539227485656738, -12.64399528503418, -11.748762130737305, -10.853529930114746, -9.958296775817871, -9.063064575195312, -8.167831420898438, -7.272599220275879, -6.37736701965332, -5.4821343421936035, -4.586901664733887, -3.691669464111328, -2.7964367866516113, -1.9012043476104736, -1.0059717893600464, -0.11073923110961914, 0.7844932079315186, 1.6797256469726562, 2.574958324432373, 3.4701905250549316, 4.365423202514648, 5.260655879974365, 6.155888080596924, 7.051120758056641, 7.946352958679199, 8.841585159301758, 9.736818313598633, 10.632050514221191, 11.52728271484375, 12.422514915466309, 13.317748069763184, 14.212980270385742, 15.1082124710083, 16.00344467163086, 16.898677825927734, 17.79391098022461, 18.689144134521484, 19.58437728881836, 20.4796085357666, 21.374841690063477, 22.27007484436035, 23.165306091308594, 24.06053924560547, 24.955772399902344, 25.851003646850586, 26.74623680114746, 27.641468048095703, 28.536701202392578, 29.431934356689453, 30.327165603637695, 31.22239875793457, 32.11763000488281, 33.01286315917969]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 3.0, 4.0, 3.0, 12.0, 7.0, 13.0, 12.0, 17.0, 17.0, 27.0, 12.0, 18.0, 17.0, 24.0, 21.0, 35.0, 35.0, 25.0, 41.0, 26.0, 31.0, 36.0, 41.0, 42.0, 31.0, 43.0, 33.0, 40.0, 32.0, 26.0, 39.0, 28.0, 25.0, 25.0, 20.0, 14.0, 18.0, 17.0, 16.0, 11.0, 12.0, 7.0, 10.0, 4.0, 5.0, 2.0, 3.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-30.78183937072754, -29.761730194091797, -28.741619110107422, -27.72150993347168, -26.701400756835938, -25.681289672851562, -24.66118049621582, -23.641071319580078, -22.620960235595703, -21.60085105895996, -20.580739974975586, -19.560630798339844, -18.5405216217041, -17.52041244506836, -16.500301361083984, -15.480192184448242, -14.4600830078125, -13.439972877502441, -12.4198637008667, -11.39975357055664, -10.379644393920898, -9.35953426361084, -8.339424133300781, -7.319314479827881, -6.2992048263549805, -5.27909517288208, -4.25898551940918, -3.238875389099121, -2.2187657356262207, -1.1986560821533203, -0.17854595184326172, 0.8415637016296387, 1.8616752624511719, 2.8817849159240723, 3.9018948078155518, 4.922004699707031, 5.942114353179932, 6.962224006652832, 7.982334136962891, 9.002443313598633, 10.022553443908691, 11.04266357421875, 12.062772750854492, 13.08288288116455, 14.10299301147461, 15.123102188110352, 16.143211364746094, 17.16332244873047, 18.18343162536621, 19.203540802001953, 20.223651885986328, 21.24376106262207, 22.263870239257812, 23.283981323242188, 24.30409049987793, 25.324199676513672, 26.344310760498047, 27.36441993713379, 28.384531021118164, 29.404640197753906, 30.42474937438965, 31.44485855102539, 32.464969635009766, 33.48508071899414, 34.50518798828125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 4.0, 11.0, 11.0, 18.0, 28.0, 36.0, 36.0, 68.0, 109.0, 154.0, 225.0, 353.0, 555.0, 790.0, 1167.0, 1791.0, 2792.0, 4560.0, 6830.0, 10985.0, 18127.0, 29415.0, 47940.0, 78431.0, 121671.0, 169004.0, 179272.0, 137146.0, 90123.0, 56029.0, 34270.0, 20997.0, 13174.0, 8240.0, 4868.0, 3247.0, 2096.0, 1295.0, 914.0, 540.0, 412.0, 272.0, 175.0, 120.0, 89.0, 57.0, 28.0, 17.0, 20.0, 12.0, 9.0, 9.0, 8.0, 4.0, 2.0, 1.0, 3.0], "bins": [-35.875, -34.79296875, -33.7109375, -32.62890625, -31.546875, -30.46484375, -29.3828125, -28.30078125, -27.21875, -26.13671875, -25.0546875, -23.97265625, -22.890625, -21.80859375, -20.7265625, -19.64453125, -18.5625, -17.48046875, -16.3984375, -15.31640625, -14.234375, -13.15234375, -12.0703125, -10.98828125, -9.90625, -8.82421875, -7.7421875, -6.66015625, -5.578125, -4.49609375, -3.4140625, -2.33203125, -1.25, -0.16796875, 0.9140625, 1.99609375, 3.078125, 4.16015625, 5.2421875, 6.32421875, 7.40625, 8.48828125, 9.5703125, 10.65234375, 11.734375, 12.81640625, 13.8984375, 14.98046875, 16.0625, 17.14453125, 18.2265625, 19.30859375, 20.390625, 21.47265625, 22.5546875, 23.63671875, 24.71875, 25.80078125, 26.8828125, 27.96484375, 29.046875, 30.12890625, 31.2109375, 32.29296875, 33.375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 3.0, 5.0, 10.0, 8.0, 13.0, 10.0, 12.0, 15.0, 21.0, 17.0, 21.0, 22.0, 35.0, 22.0, 33.0, 32.0, 29.0, 33.0, 38.0, 44.0, 41.0, 41.0, 40.0, 44.0, 35.0, 35.0, 41.0, 38.0, 19.0, 29.0, 33.0, 25.0, 21.0, 17.0, 24.0, 9.0, 12.0, 11.0, 10.0, 12.0, 9.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.78125, -30.7353515625, -29.689453125, -28.6435546875, -27.59765625, -26.5517578125, -25.505859375, -24.4599609375, -23.4140625, -22.3681640625, -21.322265625, -20.2763671875, -19.23046875, -18.1845703125, -17.138671875, -16.0927734375, -15.046875, -14.0009765625, -12.955078125, -11.9091796875, -10.86328125, -9.8173828125, -8.771484375, -7.7255859375, -6.6796875, -5.6337890625, -4.587890625, -3.5419921875, -2.49609375, -1.4501953125, -0.404296875, 0.6416015625, 1.6875, 2.7333984375, 3.779296875, 4.8251953125, 5.87109375, 6.9169921875, 7.962890625, 9.0087890625, 10.0546875, 11.1005859375, 12.146484375, 13.1923828125, 14.23828125, 15.2841796875, 16.330078125, 17.3759765625, 18.421875, 19.4677734375, 20.513671875, 21.5595703125, 22.60546875, 23.6513671875, 24.697265625, 25.7431640625, 26.7890625, 27.8349609375, 28.880859375, 29.9267578125, 30.97265625, 32.0185546875, 33.064453125, 34.1103515625, 35.15625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 10.0, 6.0, 9.0, 15.0, 21.0, 23.0, 39.0, 59.0, 63.0, 94.0, 125.0, 143.0, 218.0, 304.0, 407.0, 682.0, 1068.0, 1629.0, 2629.0, 4783.0, 8768.0, 17511.0, 37165.0, 88280.0, 239846.0, 372980.0, 154866.0, 60535.0, 26592.0, 12835.0, 6773.0, 3747.0, 2164.0, 1398.0, 836.0, 575.0, 375.0, 261.0, 186.0, 125.0, 89.0, 89.0, 56.0, 46.0, 30.0, 26.0, 18.0, 9.0, 11.0, 14.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0], "bins": [-63.34375, -61.3818359375, -59.419921875, -57.4580078125, -55.49609375, -53.5341796875, -51.572265625, -49.6103515625, -47.6484375, -45.6865234375, -43.724609375, -41.7626953125, -39.80078125, -37.8388671875, -35.876953125, -33.9150390625, -31.953125, -29.9912109375, -28.029296875, -26.0673828125, -24.10546875, -22.1435546875, -20.181640625, -18.2197265625, -16.2578125, -14.2958984375, -12.333984375, -10.3720703125, -8.41015625, -6.4482421875, -4.486328125, -2.5244140625, -0.5625, 1.3994140625, 3.361328125, 5.3232421875, 7.28515625, 9.2470703125, 11.208984375, 13.1708984375, 15.1328125, 17.0947265625, 19.056640625, 21.0185546875, 22.98046875, 24.9423828125, 26.904296875, 28.8662109375, 30.828125, 32.7900390625, 34.751953125, 36.7138671875, 38.67578125, 40.6376953125, 42.599609375, 44.5615234375, 46.5234375, 48.4853515625, 50.447265625, 52.4091796875, 54.37109375, 56.3330078125, 58.294921875, 60.2568359375, 62.21875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 14.0, 7.0, 14.0, 15.0, 14.0, 19.0, 19.0, 10.0, 29.0, 40.0, 44.0, 34.0, 35.0, 38.0, 45.0, 42.0, 34.0, 43.0, 36.0, 55.0, 52.0, 36.0, 33.0, 41.0, 31.0, 31.0, 24.0, 20.0, 23.0, 18.0, 16.0, 18.0, 16.0, 11.0, 4.0, 7.0, 8.0, 6.0, 8.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.9375, -33.83447265625, -32.7314453125, -31.62841796875, -30.525390625, -29.42236328125, -28.3193359375, -27.21630859375, -26.11328125, -25.01025390625, -23.9072265625, -22.80419921875, -21.701171875, -20.59814453125, -19.4951171875, -18.39208984375, -17.2890625, -16.18603515625, -15.0830078125, -13.97998046875, -12.876953125, -11.77392578125, -10.6708984375, -9.56787109375, -8.46484375, -7.36181640625, -6.2587890625, -5.15576171875, -4.052734375, -2.94970703125, -1.8466796875, -0.74365234375, 0.359375, 1.46240234375, 2.5654296875, 3.66845703125, 4.771484375, 5.87451171875, 6.9775390625, 8.08056640625, 9.18359375, 10.28662109375, 11.3896484375, 12.49267578125, 13.595703125, 14.69873046875, 15.8017578125, 16.90478515625, 18.0078125, 19.11083984375, 20.2138671875, 21.31689453125, 22.419921875, 23.52294921875, 24.6259765625, 25.72900390625, 26.83203125, 27.93505859375, 29.0380859375, 30.14111328125, 31.244140625, 32.34716796875, 33.4501953125, 34.55322265625, 35.65625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 3.0, 6.0, 10.0, 9.0, 17.0, 30.0, 25.0, 42.0, 57.0, 103.0, 116.0, 176.0, 260.0, 412.0, 616.0, 1086.0, 1908.0, 3854.0, 9034.0, 25896.0, 119092.0, 673017.0, 161710.0, 30868.0, 10398.0, 4440.0, 2151.0, 1182.0, 672.0, 426.0, 294.0, 178.0, 126.0, 78.0, 66.0, 33.0, 40.0, 25.0, 17.0, 19.0, 12.0, 8.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-111.1875, -107.666015625, -104.14453125, -100.623046875, -97.1015625, -93.580078125, -90.05859375, -86.537109375, -83.015625, -79.494140625, -75.97265625, -72.451171875, -68.9296875, -65.408203125, -61.88671875, -58.365234375, -54.84375, -51.322265625, -47.80078125, -44.279296875, -40.7578125, -37.236328125, -33.71484375, -30.193359375, -26.671875, -23.150390625, -19.62890625, -16.107421875, -12.5859375, -9.064453125, -5.54296875, -2.021484375, 1.5, 5.021484375, 8.54296875, 12.064453125, 15.5859375, 19.107421875, 22.62890625, 26.150390625, 29.671875, 33.193359375, 36.71484375, 40.236328125, 43.7578125, 47.279296875, 50.80078125, 54.322265625, 57.84375, 61.365234375, 64.88671875, 68.408203125, 71.9296875, 75.451171875, 78.97265625, 82.494140625, 86.015625, 89.537109375, 93.05859375, 96.580078125, 100.1015625, 103.623046875, 107.14453125, 110.666015625, 114.1875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 2.0, 5.0, 5.0, 4.0, 7.0, 14.0, 10.0, 15.0, 15.0, 26.0, 49.0, 90.0, 145.0, 195.0, 181.0, 71.0, 59.0, 25.0, 12.0, 7.0, 16.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00423431396484375, -0.004104018211364746, -0.003973722457885742, -0.0038434267044067383, -0.0037131309509277344, -0.0035828351974487305, -0.0034525394439697266, -0.0033222436904907227, -0.0031919479370117188, -0.003061652183532715, -0.002931356430053711, -0.002801060676574707, -0.002670764923095703, -0.0025404691696166992, -0.0024101734161376953, -0.0022798776626586914, -0.0021495819091796875, -0.0020192861557006836, -0.0018889904022216797, -0.0017586946487426758, -0.0016283988952636719, -0.001498103141784668, -0.001367807388305664, -0.0012375116348266602, -0.0011072158813476562, -0.0009769201278686523, -0.0008466243743896484, -0.0007163286209106445, -0.0005860328674316406, -0.0004557371139526367, -0.0003254413604736328, -0.0001951456069946289, -6.4849853515625e-05, 6.54458999633789e-05, 0.0001957416534423828, 0.0003260374069213867, 0.0004563331604003906, 0.0005866289138793945, 0.0007169246673583984, 0.0008472204208374023, 0.0009775161743164062, 0.0011078119277954102, 0.001238107681274414, 0.001368403434753418, 0.0014986991882324219, 0.0016289949417114258, 0.0017592906951904297, 0.0018895864486694336, 0.0020198822021484375, 0.0021501779556274414, 0.0022804737091064453, 0.0024107694625854492, 0.002541065216064453, 0.002671360969543457, 0.002801656723022461, 0.002931952476501465, 0.0030622482299804688, 0.0031925439834594727, 0.0033228397369384766, 0.0034531354904174805, 0.0035834312438964844, 0.0037137269973754883, 0.003844022750854492, 0.003974318504333496, 0.0041046142578125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 8.0, 13.0, 20.0, 28.0, 39.0, 43.0, 77.0, 98.0, 116.0, 205.0, 239.0, 395.0, 559.0, 894.0, 1377.0, 2166.0, 3297.0, 5507.0, 9681.0, 17506.0, 33149.0, 63878.0, 130621.0, 250503.0, 253931.0, 132532.0, 65159.0, 33438.0, 17797.0, 9968.0, 5690.0, 3351.0, 2127.0, 1394.0, 830.0, 586.0, 376.0, 289.0, 187.0, 118.0, 104.0, 58.0, 65.0, 38.0, 41.0, 16.0, 11.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-48.40625, -46.93994140625, -45.4736328125, -44.00732421875, -42.541015625, -41.07470703125, -39.6083984375, -38.14208984375, -36.67578125, -35.20947265625, -33.7431640625, -32.27685546875, -30.810546875, -29.34423828125, -27.8779296875, -26.41162109375, -24.9453125, -23.47900390625, -22.0126953125, -20.54638671875, -19.080078125, -17.61376953125, -16.1474609375, -14.68115234375, -13.21484375, -11.74853515625, -10.2822265625, -8.81591796875, -7.349609375, -5.88330078125, -4.4169921875, -2.95068359375, -1.484375, -0.01806640625, 1.4482421875, 2.91455078125, 4.380859375, 5.84716796875, 7.3134765625, 8.77978515625, 10.24609375, 11.71240234375, 13.1787109375, 14.64501953125, 16.111328125, 17.57763671875, 19.0439453125, 20.51025390625, 21.9765625, 23.44287109375, 24.9091796875, 26.37548828125, 27.841796875, 29.30810546875, 30.7744140625, 32.24072265625, 33.70703125, 35.17333984375, 36.6396484375, 38.10595703125, 39.572265625, 41.03857421875, 42.5048828125, 43.97119140625, 45.4375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 8.0, 6.0, 12.0, 11.0, 15.0, 19.0, 15.0, 29.0, 37.0, 31.0, 49.0, 46.0, 51.0, 66.0, 80.0, 60.0, 70.0, 61.0, 55.0, 41.0, 42.0, 33.0, 29.0, 27.0, 18.0, 21.0, 15.0, 14.0, 3.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-29.03125, -28.1982421875, -27.365234375, -26.5322265625, -25.69921875, -24.8662109375, -24.033203125, -23.2001953125, -22.3671875, -21.5341796875, -20.701171875, -19.8681640625, -19.03515625, -18.2021484375, -17.369140625, -16.5361328125, -15.703125, -14.8701171875, -14.037109375, -13.2041015625, -12.37109375, -11.5380859375, -10.705078125, -9.8720703125, -9.0390625, -8.2060546875, -7.373046875, -6.5400390625, -5.70703125, -4.8740234375, -4.041015625, -3.2080078125, -2.375, -1.5419921875, -0.708984375, 0.1240234375, 0.95703125, 1.7900390625, 2.623046875, 3.4560546875, 4.2890625, 5.1220703125, 5.955078125, 6.7880859375, 7.62109375, 8.4541015625, 9.287109375, 10.1201171875, 10.953125, 11.7861328125, 12.619140625, 13.4521484375, 14.28515625, 15.1181640625, 15.951171875, 16.7841796875, 17.6171875, 18.4501953125, 19.283203125, 20.1162109375, 20.94921875, 21.7822265625, 22.615234375, 23.4482421875, 24.28125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 9.0, 15.0, 9.0, 8.0, 19.0, 26.0, 36.0, 39.0, 39.0, 42.0, 60.0, 60.0, 64.0, 70.0, 56.0, 51.0, 48.0, 41.0, 48.0, 36.0, 42.0, 28.0, 22.0, 26.0, 20.0, 12.0, 15.0, 10.0, 10.0, 10.0, 8.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.605266571044922, -23.577030181884766, -22.548791885375977, -21.52055549621582, -20.49231719970703, -19.464080810546875, -18.43584442138672, -17.407608032226562, -16.379369735717773, -15.3511323928833, -14.322895050048828, -13.294658660888672, -12.2664213180542, -11.238183975219727, -10.20994758605957, -9.181710243225098, -8.153472900390625, -7.125235557556152, -6.096998691558838, -5.068761825561523, -4.040524482727051, -3.012287139892578, -1.9840502738952637, -0.9558134078979492, 0.07242393493652344, 1.100661039352417, 2.1288981437683105, 3.157135248184204, 4.185372352600098, 5.21360969543457, 6.241846561431885, 7.270083427429199, 8.298324584960938, 9.32656192779541, 10.354799270629883, 11.383035659790039, 12.411273002624512, 13.439510345458984, 14.46774673461914, 15.495984077453613, 16.524221420288086, 17.552457809448242, 18.58069610595703, 19.608932495117188, 20.637168884277344, 21.665407180786133, 22.69364356994629, 23.721881866455078, 24.750118255615234, 25.77835464477539, 26.80659294128418, 27.834829330444336, 28.863067626953125, 29.89130401611328, 30.919540405273438, 31.947776794433594, 32.97601318359375, 34.004249572753906, 35.03248596191406, 36.060726165771484, 37.08896255493164, 38.1171989440918, 39.14543533325195, 40.17367172241211, 41.20191192626953]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 10.0, 9.0, 8.0, 14.0, 18.0, 15.0, 21.0, 31.0, 24.0, 28.0, 29.0, 45.0, 33.0, 37.0, 28.0, 31.0, 39.0, 46.0, 47.0, 36.0, 45.0, 30.0, 42.0, 30.0, 30.0, 32.0, 32.0, 30.0, 28.0, 21.0, 14.0, 15.0, 10.0, 12.0, 16.0, 9.0, 14.0, 5.0, 7.0, 7.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.857177734375, -35.56743240356445, -34.27769088745117, -32.987945556640625, -31.698204040527344, -30.40846061706543, -29.118717193603516, -27.82897186279297, -26.539230346679688, -25.249486923217773, -23.95974349975586, -22.670000076293945, -21.38025665283203, -20.090513229370117, -18.800769805908203, -17.511024475097656, -16.221281051635742, -14.931537628173828, -13.641794204711914, -12.35205078125, -11.062307357788086, -9.772563934326172, -8.482819557189941, -7.193076133728027, -5.903332710266113, -4.613589286804199, -3.323845624923706, -2.034101963043213, -0.7443585395812988, 0.5453848838806152, 1.8351287841796875, 3.1248722076416016, 4.414615631103516, 5.70435905456543, 6.994102478027344, 8.283845901489258, 9.573589324951172, 10.863332748413086, 12.153077125549316, 13.44282054901123, 14.732563972473145, 16.022308349609375, 17.31205177307129, 18.601795196533203, 19.891538619995117, 21.18128204345703, 22.471025466918945, 23.76076889038086, 25.050512313842773, 26.340255737304688, 27.6299991607666, 28.919742584228516, 30.20948600769043, 31.499229431152344, 32.78897476196289, 34.07871627807617, 35.36846160888672, 36.658206939697266, 37.94794845581055, 39.237693786621094, 40.527435302734375, 41.81718063354492, 43.1069221496582, 44.39666748046875, 45.68640899658203]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 7.0, 12.0, 13.0, 37.0, 41.0, 53.0, 102.0, 132.0, 172.0, 329.0, 461.0, 781.0, 1138.0, 1676.0, 2420.0, 3737.0, 5612.0, 8250.0, 12210.0, 17701.0, 25447.0, 35456.0, 48399.0, 63901.0, 80160.0, 93375.0, 103014.0, 104725.0, 98267.0, 85509.0, 69194.0, 54040.0, 39871.0, 28761.0, 20402.0, 13950.0, 9694.0, 6615.0, 4262.0, 2984.0, 1907.0, 1318.0, 863.0, 533.0, 337.0, 258.0, 139.0, 109.0, 76.0, 48.0, 29.0, 14.0, 10.0, 8.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-22.359375, -21.642333984375, -20.92529296875, -20.208251953125, -19.4912109375, -18.774169921875, -18.05712890625, -17.340087890625, -16.623046875, -15.906005859375, -15.18896484375, -14.471923828125, -13.7548828125, -13.037841796875, -12.32080078125, -11.603759765625, -10.88671875, -10.169677734375, -9.45263671875, -8.735595703125, -8.0185546875, -7.301513671875, -6.58447265625, -5.867431640625, -5.150390625, -4.433349609375, -3.71630859375, -2.999267578125, -2.2822265625, -1.565185546875, -0.84814453125, -0.131103515625, 0.5859375, 1.302978515625, 2.02001953125, 2.737060546875, 3.4541015625, 4.171142578125, 4.88818359375, 5.605224609375, 6.322265625, 7.039306640625, 7.75634765625, 8.473388671875, 9.1904296875, 9.907470703125, 10.62451171875, 11.341552734375, 12.05859375, 12.775634765625, 13.49267578125, 14.209716796875, 14.9267578125, 15.643798828125, 16.36083984375, 17.077880859375, 17.794921875, 18.511962890625, 19.22900390625, 19.946044921875, 20.6630859375, 21.380126953125, 22.09716796875, 22.814208984375, 23.53125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 6.0, 9.0, 14.0, 17.0, 14.0, 23.0, 15.0, 28.0, 28.0, 30.0, 46.0, 29.0, 33.0, 40.0, 32.0, 47.0, 40.0, 46.0, 49.0, 29.0, 40.0, 35.0, 38.0, 33.0, 27.0, 33.0, 26.0, 28.0, 25.0, 16.0, 15.0, 14.0, 10.0, 17.0, 11.0, 11.0, 9.0, 5.0, 7.0, 2.0, 9.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.90625, -34.66845703125, -33.4306640625, -32.19287109375, -30.955078125, -29.71728515625, -28.4794921875, -27.24169921875, -26.00390625, -24.76611328125, -23.5283203125, -22.29052734375, -21.052734375, -19.81494140625, -18.5771484375, -17.33935546875, -16.1015625, -14.86376953125, -13.6259765625, -12.38818359375, -11.150390625, -9.91259765625, -8.6748046875, -7.43701171875, -6.19921875, -4.96142578125, -3.7236328125, -2.48583984375, -1.248046875, -0.01025390625, 1.2275390625, 2.46533203125, 3.703125, 4.94091796875, 6.1787109375, 7.41650390625, 8.654296875, 9.89208984375, 11.1298828125, 12.36767578125, 13.60546875, 14.84326171875, 16.0810546875, 17.31884765625, 18.556640625, 19.79443359375, 21.0322265625, 22.27001953125, 23.5078125, 24.74560546875, 25.9833984375, 27.22119140625, 28.458984375, 29.69677734375, 30.9345703125, 32.17236328125, 33.41015625, 34.64794921875, 35.8857421875, 37.12353515625, 38.361328125, 39.59912109375, 40.8369140625, 42.07470703125, 43.3125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 4.0, 3.0, 9.0, 10.0, 20.0, 31.0, 36.0, 54.0, 131.0, 162.0, 259.0, 458.0, 740.0, 1200.0, 2053.0, 3632.0, 6590.0, 11292.0, 20573.0, 38145.0, 70631.0, 125807.0, 190840.0, 210010.0, 157602.0, 93914.0, 51462.0, 27930.0, 14933.0, 8482.0, 4772.0, 2712.0, 1611.0, 985.0, 559.0, 347.0, 212.0, 99.0, 71.0, 66.0, 43.0, 28.0, 15.0, 13.0, 3.0, 10.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-62.8125, -60.9228515625, -59.033203125, -57.1435546875, -55.25390625, -53.3642578125, -51.474609375, -49.5849609375, -47.6953125, -45.8056640625, -43.916015625, -42.0263671875, -40.13671875, -38.2470703125, -36.357421875, -34.4677734375, -32.578125, -30.6884765625, -28.798828125, -26.9091796875, -25.01953125, -23.1298828125, -21.240234375, -19.3505859375, -17.4609375, -15.5712890625, -13.681640625, -11.7919921875, -9.90234375, -8.0126953125, -6.123046875, -4.2333984375, -2.34375, -0.4541015625, 1.435546875, 3.3251953125, 5.21484375, 7.1044921875, 8.994140625, 10.8837890625, 12.7734375, 14.6630859375, 16.552734375, 18.4423828125, 20.33203125, 22.2216796875, 24.111328125, 26.0009765625, 27.890625, 29.7802734375, 31.669921875, 33.5595703125, 35.44921875, 37.3388671875, 39.228515625, 41.1181640625, 43.0078125, 44.8974609375, 46.787109375, 48.6767578125, 50.56640625, 52.4560546875, 54.345703125, 56.2353515625, 58.125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 8.0, 10.0, 8.0, 15.0, 17.0, 18.0, 22.0, 19.0, 38.0, 26.0, 38.0, 41.0, 49.0, 44.0, 53.0, 37.0, 59.0, 55.0, 50.0, 41.0, 52.0, 34.0, 35.0, 28.0, 36.0, 29.0, 33.0, 16.0, 15.0, 14.0, 13.0, 9.0, 5.0, 8.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.34375, -36.990234375, -35.63671875, -34.283203125, -32.9296875, -31.576171875, -30.22265625, -28.869140625, -27.515625, -26.162109375, -24.80859375, -23.455078125, -22.1015625, -20.748046875, -19.39453125, -18.041015625, -16.6875, -15.333984375, -13.98046875, -12.626953125, -11.2734375, -9.919921875, -8.56640625, -7.212890625, -5.859375, -4.505859375, -3.15234375, -1.798828125, -0.4453125, 0.908203125, 2.26171875, 3.615234375, 4.96875, 6.322265625, 7.67578125, 9.029296875, 10.3828125, 11.736328125, 13.08984375, 14.443359375, 15.796875, 17.150390625, 18.50390625, 19.857421875, 21.2109375, 22.564453125, 23.91796875, 25.271484375, 26.625, 27.978515625, 29.33203125, 30.685546875, 32.0390625, 33.392578125, 34.74609375, 36.099609375, 37.453125, 38.806640625, 40.16015625, 41.513671875, 42.8671875, 44.220703125, 45.57421875, 46.927734375, 48.28125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 9.0, 17.0, 24.0, 20.0, 45.0, 68.0, 106.0, 123.0, 212.0, 310.0, 466.0, 658.0, 1064.0, 1554.0, 2255.0, 3410.0, 5151.0, 7991.0, 12945.0, 21972.0, 39840.0, 81728.0, 167550.0, 258755.0, 210442.0, 108613.0, 52338.0, 27414.0, 15768.0, 9597.0, 6233.0, 3863.0, 2636.0, 1757.0, 1176.0, 760.0, 550.0, 376.0, 260.0, 148.0, 101.0, 88.0, 58.0, 34.0, 32.0, 18.0, 13.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.09375, -35.88525390625, -34.6767578125, -33.46826171875, -32.259765625, -31.05126953125, -29.8427734375, -28.63427734375, -27.42578125, -26.21728515625, -25.0087890625, -23.80029296875, -22.591796875, -21.38330078125, -20.1748046875, -18.96630859375, -17.7578125, -16.54931640625, -15.3408203125, -14.13232421875, -12.923828125, -11.71533203125, -10.5068359375, -9.29833984375, -8.08984375, -6.88134765625, -5.6728515625, -4.46435546875, -3.255859375, -2.04736328125, -0.8388671875, 0.36962890625, 1.578125, 2.78662109375, 3.9951171875, 5.20361328125, 6.412109375, 7.62060546875, 8.8291015625, 10.03759765625, 11.24609375, 12.45458984375, 13.6630859375, 14.87158203125, 16.080078125, 17.28857421875, 18.4970703125, 19.70556640625, 20.9140625, 22.12255859375, 23.3310546875, 24.53955078125, 25.748046875, 26.95654296875, 28.1650390625, 29.37353515625, 30.58203125, 31.79052734375, 32.9990234375, 34.20751953125, 35.416015625, 36.62451171875, 37.8330078125, 39.04150390625, 40.25]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 4.0, 10.0, 13.0, 17.0, 27.0, 33.0, 40.0, 45.0, 52.0, 49.0, 90.0, 64.0, 73.0, 70.0, 66.0, 61.0, 44.0, 48.0, 34.0, 32.0, 20.0, 23.0, 16.0, 10.0, 10.0, 4.0, 8.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027675628662109375, -0.002673417329788208, -0.0025792717933654785, -0.002485126256942749, -0.0023909807205200195, -0.00229683518409729, -0.0022026896476745605, -0.002108544111251831, -0.0020143985748291016, -0.001920253038406372, -0.0018261075019836426, -0.001731961965560913, -0.0016378164291381836, -0.001543670892715454, -0.0014495253562927246, -0.0013553798198699951, -0.0012612342834472656, -0.0011670887470245361, -0.0010729432106018066, -0.0009787976741790771, -0.0008846521377563477, -0.0007905066013336182, -0.0006963610649108887, -0.0006022155284881592, -0.0005080699920654297, -0.0004139244556427002, -0.0003197789192199707, -0.0002256333827972412, -0.00013148784637451172, -3.7342309951782227e-05, 5.6803226470947266e-05, 0.00015094876289367676, 0.00024509429931640625, 0.00033923983573913574, 0.00043338537216186523, 0.0005275309085845947, 0.0006216764450073242, 0.0007158219814300537, 0.0008099675178527832, 0.0009041130542755127, 0.0009982585906982422, 0.0010924041271209717, 0.0011865496635437012, 0.0012806951999664307, 0.0013748407363891602, 0.0014689862728118896, 0.0015631318092346191, 0.0016572773456573486, 0.0017514228820800781, 0.0018455684185028076, 0.0019397139549255371, 0.0020338594913482666, 0.002128005027770996, 0.0022221505641937256, 0.002316296100616455, 0.0024104416370391846, 0.002504587173461914, 0.0025987327098846436, 0.002692878246307373, 0.0027870237827301025, 0.002881169319152832, 0.0029753148555755615, 0.003069460391998291, 0.0031636059284210205, 0.00325775146484375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 8.0, 15.0, 18.0, 21.0, 29.0, 64.0, 73.0, 125.0, 193.0, 225.0, 383.0, 478.0, 793.0, 1137.0, 1672.0, 2540.0, 3920.0, 6035.0, 9799.0, 16399.0, 27941.0, 49330.0, 87849.0, 144246.0, 191761.0, 185126.0, 132194.0, 77946.0, 43621.0, 24724.0, 14534.0, 8965.0, 5688.0, 3628.0, 2339.0, 1539.0, 995.0, 689.0, 476.0, 314.0, 235.0, 166.0, 104.0, 74.0, 60.0, 35.0, 20.0, 9.0, 8.0, 9.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.6875, -25.876220703125, -25.06494140625, -24.253662109375, -23.4423828125, -22.631103515625, -21.81982421875, -21.008544921875, -20.197265625, -19.385986328125, -18.57470703125, -17.763427734375, -16.9521484375, -16.140869140625, -15.32958984375, -14.518310546875, -13.70703125, -12.895751953125, -12.08447265625, -11.273193359375, -10.4619140625, -9.650634765625, -8.83935546875, -8.028076171875, -7.216796875, -6.405517578125, -5.59423828125, -4.782958984375, -3.9716796875, -3.160400390625, -2.34912109375, -1.537841796875, -0.7265625, 0.084716796875, 0.89599609375, 1.707275390625, 2.5185546875, 3.329833984375, 4.14111328125, 4.952392578125, 5.763671875, 6.574951171875, 7.38623046875, 8.197509765625, 9.0087890625, 9.820068359375, 10.63134765625, 11.442626953125, 12.25390625, 13.065185546875, 13.87646484375, 14.687744140625, 15.4990234375, 16.310302734375, 17.12158203125, 17.932861328125, 18.744140625, 19.555419921875, 20.36669921875, 21.177978515625, 21.9892578125, 22.800537109375, 23.61181640625, 24.423095703125, 25.234375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 7.0, 3.0, 7.0, 6.0, 6.0, 7.0, 11.0, 18.0, 16.0, 21.0, 27.0, 30.0, 42.0, 38.0, 48.0, 52.0, 70.0, 62.0, 76.0, 59.0, 62.0, 67.0, 54.0, 31.0, 35.0, 22.0, 21.0, 17.0, 16.0, 18.0, 6.0, 10.0, 7.0, 3.0, 7.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.390625, -13.9425048828125, -13.494384765625, -13.0462646484375, -12.59814453125, -12.1500244140625, -11.701904296875, -11.2537841796875, -10.8056640625, -10.3575439453125, -9.909423828125, -9.4613037109375, -9.01318359375, -8.5650634765625, -8.116943359375, -7.6688232421875, -7.220703125, -6.7725830078125, -6.324462890625, -5.8763427734375, -5.42822265625, -4.9801025390625, -4.531982421875, -4.0838623046875, -3.6357421875, -3.1876220703125, -2.739501953125, -2.2913818359375, -1.84326171875, -1.3951416015625, -0.947021484375, -0.4989013671875, -0.05078125, 0.3973388671875, 0.845458984375, 1.2935791015625, 1.74169921875, 2.1898193359375, 2.637939453125, 3.0860595703125, 3.5341796875, 3.9822998046875, 4.430419921875, 4.8785400390625, 5.32666015625, 5.7747802734375, 6.222900390625, 6.6710205078125, 7.119140625, 7.5672607421875, 8.015380859375, 8.4635009765625, 8.91162109375, 9.3597412109375, 9.807861328125, 10.2559814453125, 10.7041015625, 11.1522216796875, 11.600341796875, 12.0484619140625, 12.49658203125, 12.9447021484375, 13.392822265625, 13.8409423828125, 14.2890625]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 8.0, 10.0, 12.0, 23.0, 16.0, 32.0, 35.0, 37.0, 46.0, 43.0, 46.0, 66.0, 61.0, 82.0, 52.0, 53.0, 54.0, 44.0, 44.0, 29.0, 26.0, 33.0, 29.0, 23.0, 13.0, 15.0, 14.0, 10.0, 8.0, 5.0, 9.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.9296875, -33.767860412597656, -32.60603713989258, -31.444211959838867, -30.282386779785156, -29.120559692382812, -27.9587345123291, -26.79690933227539, -25.63508415222168, -24.47325897216797, -23.311433792114258, -22.149608612060547, -20.987781524658203, -19.825958251953125, -18.66413116455078, -17.50230598449707, -16.34048080444336, -15.178655624389648, -14.016830444335938, -12.85500431060791, -11.6931791305542, -10.531353950500488, -9.369527816772461, -8.20770263671875, -7.045877456665039, -5.884052276611328, -4.722226619720459, -3.560401201248169, -2.398575782775879, -1.236750602722168, -0.07492494583129883, 1.0869007110595703, 2.248729705810547, 3.410555124282837, 4.572380542755127, 5.734206199645996, 6.896031379699707, 8.057856559753418, 9.219682693481445, 10.381507873535156, 11.543333053588867, 12.705158233642578, 13.866983413696289, 15.028809547424316, 16.190635681152344, 17.352458953857422, 18.514286041259766, 19.676111221313477, 20.837936401367188, 21.9997615814209, 23.16158676147461, 24.32341194152832, 25.48523712158203, 26.647064208984375, 27.808889389038086, 28.970714569091797, 30.132539749145508, 31.29436492919922, 32.45619201660156, 33.61801528930664, 34.779842376708984, 35.94166564941406, 37.103492736816406, 38.26531982421875, 39.42714309692383]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 8.0, 2.0, 11.0, 11.0, 14.0, 10.0, 25.0, 18.0, 33.0, 19.0, 30.0, 32.0, 46.0, 36.0, 44.0, 44.0, 47.0, 33.0, 44.0, 59.0, 38.0, 56.0, 28.0, 33.0, 45.0, 31.0, 29.0, 30.0, 21.0, 20.0, 19.0, 21.0, 11.0, 10.0, 7.0, 12.0, 10.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.09160614013672, -54.30624771118164, -52.52088928222656, -50.735530853271484, -48.950172424316406, -47.16481399536133, -45.37945556640625, -43.59409713745117, -41.808738708496094, -40.023380279541016, -38.23802185058594, -36.45266342163086, -34.66730499267578, -32.8819465637207, -31.096588134765625, -29.311229705810547, -27.525869369506836, -25.740510940551758, -23.95515251159668, -22.1697940826416, -20.384435653686523, -18.599075317382812, -16.813716888427734, -15.028359413146973, -13.243000984191895, -11.457642555236816, -9.672284126281738, -7.886925220489502, -6.101566791534424, -4.3162078857421875, -2.5308494567871094, -0.7454910278320312, 1.0398674011230469, 2.825225830078125, 4.610584259033203, 6.3959431648254395, 8.18130111694336, 9.966660499572754, 11.752018928527832, 13.53737735748291, 15.322735786437988, 17.108095169067383, 18.89345359802246, 20.67881202697754, 22.464170455932617, 24.249528884887695, 26.034887313842773, 27.82024574279785, 29.60560417175293, 31.390962600708008, 33.17632293701172, 34.9616813659668, 36.747039794921875, 38.53239822387695, 40.31775665283203, 42.10311508178711, 43.88847351074219, 45.673831939697266, 47.459190368652344, 49.24454879760742, 51.0299072265625, 52.81526565551758, 54.600624084472656, 56.385982513427734, 58.17134094238281]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 6.0, 6.0, 3.0, 8.0, 11.0, 17.0, 24.0, 47.0, 78.0, 103.0, 169.0, 278.0, 492.0, 697.0, 1153.0, 1783.0, 2897.0, 4505.0, 7372.0, 11686.0, 18446.0, 29674.0, 46611.0, 72714.0, 111716.0, 167366.0, 242828.0, 335057.0, 427943.0, 498202.0, 513177.0, 466229.0, 377985.0, 283260.0, 198932.0, 134019.0, 87788.0, 56988.0, 35996.0, 22387.0, 13741.0, 8468.0, 5084.0, 3181.0, 2009.0, 1240.0, 726.0, 437.0, 266.0, 187.0, 116.0, 85.0, 44.0, 15.0, 22.0, 8.0, 8.0, 2.0, 1.0, 1.0, 2.0], "bins": [-31.109375, -30.17236328125, -29.2353515625, -28.29833984375, -27.361328125, -26.42431640625, -25.4873046875, -24.55029296875, -23.61328125, -22.67626953125, -21.7392578125, -20.80224609375, -19.865234375, -18.92822265625, -17.9912109375, -17.05419921875, -16.1171875, -15.18017578125, -14.2431640625, -13.30615234375, -12.369140625, -11.43212890625, -10.4951171875, -9.55810546875, -8.62109375, -7.68408203125, -6.7470703125, -5.81005859375, -4.873046875, -3.93603515625, -2.9990234375, -2.06201171875, -1.125, -0.18798828125, 0.7490234375, 1.68603515625, 2.623046875, 3.56005859375, 4.4970703125, 5.43408203125, 6.37109375, 7.30810546875, 8.2451171875, 9.18212890625, 10.119140625, 11.05615234375, 11.9931640625, 12.93017578125, 13.8671875, 14.80419921875, 15.7412109375, 16.67822265625, 17.615234375, 18.55224609375, 19.4892578125, 20.42626953125, 21.36328125, 22.30029296875, 23.2373046875, 24.17431640625, 25.111328125, 26.04833984375, 26.9853515625, 27.92236328125, 28.859375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 6.0, 3.0, 8.0, 7.0, 11.0, 12.0, 16.0, 8.0, 23.0, 25.0, 17.0, 22.0, 35.0, 24.0, 42.0, 36.0, 46.0, 38.0, 34.0, 46.0, 37.0, 42.0, 46.0, 45.0, 41.0, 41.0, 37.0, 28.0, 24.0, 31.0, 24.0, 28.0, 20.0, 13.0, 15.0, 21.0, 9.0, 8.0, 9.0, 12.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.59375, -40.24560546875, -38.8974609375, -37.54931640625, -36.201171875, -34.85302734375, -33.5048828125, -32.15673828125, -30.80859375, -29.46044921875, -28.1123046875, -26.76416015625, -25.416015625, -24.06787109375, -22.7197265625, -21.37158203125, -20.0234375, -18.67529296875, -17.3271484375, -15.97900390625, -14.630859375, -13.28271484375, -11.9345703125, -10.58642578125, -9.23828125, -7.89013671875, -6.5419921875, -5.19384765625, -3.845703125, -2.49755859375, -1.1494140625, 0.19873046875, 1.546875, 2.89501953125, 4.2431640625, 5.59130859375, 6.939453125, 8.28759765625, 9.6357421875, 10.98388671875, 12.33203125, 13.68017578125, 15.0283203125, 16.37646484375, 17.724609375, 19.07275390625, 20.4208984375, 21.76904296875, 23.1171875, 24.46533203125, 25.8134765625, 27.16162109375, 28.509765625, 29.85791015625, 31.2060546875, 32.55419921875, 33.90234375, 35.25048828125, 36.5986328125, 37.94677734375, 39.294921875, 40.64306640625, 41.9912109375, 43.33935546875, 44.6875]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 14.0, 10.0, 20.0, 25.0, 52.0, 62.0, 103.0, 184.0, 326.0, 487.0, 764.0, 1266.0, 2166.0, 3675.0, 6347.0, 10902.0, 19282.0, 33881.0, 59452.0, 102877.0, 170586.0, 268299.0, 387464.0, 502598.0, 575057.0, 567345.0, 485478.0, 366973.0, 249544.0, 157608.0, 94081.0, 54428.0, 30814.0, 17572.0, 10014.0, 5870.0, 3394.0, 2080.0, 1213.0, 756.0, 457.0, 254.0, 192.0, 127.0, 64.0, 53.0, 30.0, 21.0, 7.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.125, -31.0859375, -30.046875, -29.0078125, -27.96875, -26.9296875, -25.890625, -24.8515625, -23.8125, -22.7734375, -21.734375, -20.6953125, -19.65625, -18.6171875, -17.578125, -16.5390625, -15.5, -14.4609375, -13.421875, -12.3828125, -11.34375, -10.3046875, -9.265625, -8.2265625, -7.1875, -6.1484375, -5.109375, -4.0703125, -3.03125, -1.9921875, -0.953125, 0.0859375, 1.125, 2.1640625, 3.203125, 4.2421875, 5.28125, 6.3203125, 7.359375, 8.3984375, 9.4375, 10.4765625, 11.515625, 12.5546875, 13.59375, 14.6328125, 15.671875, 16.7109375, 17.75, 18.7890625, 19.828125, 20.8671875, 21.90625, 22.9453125, 23.984375, 25.0234375, 26.0625, 27.1015625, 28.140625, 29.1796875, 30.21875, 31.2578125, 32.296875, 33.3359375, 34.375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 11.0, 12.0, 13.0, 21.0, 16.0, 24.0, 37.0, 45.0, 57.0, 56.0, 69.0, 93.0, 103.0, 99.0, 127.0, 137.0, 175.0, 166.0, 186.0, 192.0, 218.0, 199.0, 190.0, 189.0, 196.0, 158.0, 163.0, 172.0, 130.0, 129.0, 107.0, 108.0, 77.0, 73.0, 63.0, 42.0, 45.0, 46.0, 21.0, 23.0, 21.0, 15.0, 10.0, 9.0, 9.0, 6.0, 4.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.5, -17.86474609375, -17.2294921875, -16.59423828125, -15.958984375, -15.32373046875, -14.6884765625, -14.05322265625, -13.41796875, -12.78271484375, -12.1474609375, -11.51220703125, -10.876953125, -10.24169921875, -9.6064453125, -8.97119140625, -8.3359375, -7.70068359375, -7.0654296875, -6.43017578125, -5.794921875, -5.15966796875, -4.5244140625, -3.88916015625, -3.25390625, -2.61865234375, -1.9833984375, -1.34814453125, -0.712890625, -0.07763671875, 0.5576171875, 1.19287109375, 1.828125, 2.46337890625, 3.0986328125, 3.73388671875, 4.369140625, 5.00439453125, 5.6396484375, 6.27490234375, 6.91015625, 7.54541015625, 8.1806640625, 8.81591796875, 9.451171875, 10.08642578125, 10.7216796875, 11.35693359375, 11.9921875, 12.62744140625, 13.2626953125, 13.89794921875, 14.533203125, 15.16845703125, 15.8037109375, 16.43896484375, 17.07421875, 17.70947265625, 18.3447265625, 18.97998046875, 19.615234375, 20.25048828125, 20.8857421875, 21.52099609375, 22.15625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 5.0, 11.0, 9.0, 14.0, 15.0, 19.0, 33.0, 36.0, 35.0, 42.0, 61.0, 54.0, 56.0, 62.0, 44.0, 52.0, 59.0, 49.0, 47.0, 34.0, 43.0, 38.0, 32.0, 33.0, 22.0, 13.0, 11.0, 18.0, 8.0, 8.0, 14.0, 2.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-47.6821403503418, -46.37725067138672, -45.072357177734375, -43.7674674987793, -42.46257400512695, -41.157684326171875, -39.85279083251953, -38.54790115356445, -37.243011474609375, -35.9381217956543, -34.63322830200195, -33.328338623046875, -32.02344512939453, -30.718555450439453, -29.413663864135742, -28.10877227783203, -26.803878784179688, -25.498987197875977, -24.194095611572266, -22.889204025268555, -21.584312438964844, -20.279422760009766, -18.974531173706055, -17.669639587402344, -16.364748001098633, -15.059856414794922, -13.754964828491211, -12.450074195861816, -11.145182609558105, -9.840291023254395, -8.535400390625, -7.230508804321289, -5.925621032714844, -4.620729446411133, -3.31583833694458, -2.0109469890594482, -0.7060556411743164, 0.5988359451293945, 1.9037270545959473, 3.2086181640625, 4.513509750366211, 5.818401336669922, 7.123292446136475, 8.428183555603027, 9.733075141906738, 11.03796672821045, 12.342857360839844, 13.647748947143555, 14.952640533447266, 16.257532119750977, 17.562423706054688, 18.8673152923584, 20.17220687866211, 21.477096557617188, 22.7819881439209, 24.08687973022461, 25.39177131652832, 26.69666290283203, 28.001554489135742, 29.306446075439453, 30.61133575439453, 31.916229248046875, 33.22111892700195, 34.52600860595703, 35.830902099609375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 11.0, 12.0, 14.0, 11.0, 10.0, 14.0, 21.0, 19.0, 15.0, 18.0, 32.0, 19.0, 27.0, 41.0, 30.0, 37.0, 43.0, 45.0, 33.0, 45.0, 31.0, 33.0, 49.0, 39.0, 37.0, 26.0, 20.0, 28.0, 34.0, 31.0, 19.0, 22.0, 20.0, 14.0, 13.0, 11.0, 13.0, 16.0, 8.0, 8.0, 13.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.886688232421875, -53.0567626953125, -51.226837158203125, -49.39691162109375, -47.56698226928711, -45.737056732177734, -43.90713119506836, -42.077205657958984, -40.24728012084961, -38.417354583740234, -36.58742904663086, -34.75749969482422, -32.927574157714844, -31.09764862060547, -29.267723083496094, -27.43779754638672, -25.60787010192871, -23.777944564819336, -21.948017120361328, -20.118091583251953, -18.288166046142578, -16.458240509033203, -14.628313064575195, -12.79838752746582, -10.968461036682129, -9.138534545898438, -7.3086090087890625, -5.478682518005371, -3.648756504058838, -1.8188304901123047, 0.011096000671386719, 1.8410215377807617, 3.670948028564453, 5.500874042510986, 7.3308000564575195, 9.160726547241211, 10.990652084350586, 12.820578575134277, 14.650505065917969, 16.480430603027344, 18.31035614013672, 20.140281677246094, 21.9702091217041, 23.800134658813477, 25.63006019592285, 27.45998764038086, 29.289913177490234, 31.11983871459961, 32.94976806640625, 34.779693603515625, 36.609619140625, 38.439544677734375, 40.269474029541016, 42.09939956665039, 43.929325103759766, 45.75925064086914, 47.589176177978516, 49.41910171508789, 51.249027252197266, 53.078956604003906, 54.90888214111328, 56.738807678222656, 58.56873321533203, 60.398658752441406, 62.22858428955078]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 9.0, 12.0, 14.0, 19.0, 19.0, 33.0, 43.0, 75.0, 135.0, 210.0, 285.0, 464.0, 769.0, 1201.0, 2071.0, 3727.0, 6099.0, 10913.0, 19688.0, 36969.0, 70599.0, 141381.0, 254366.0, 236590.0, 125191.0, 63109.0, 33071.0, 17626.0, 9864.0, 5574.0, 3342.0, 1958.0, 1231.0, 686.0, 425.0, 257.0, 182.0, 124.0, 75.0, 48.0, 34.0, 20.0, 11.0, 11.0, 6.0, 8.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-69.5, -67.322265625, -65.14453125, -62.966796875, -60.7890625, -58.611328125, -56.43359375, -54.255859375, -52.078125, -49.900390625, -47.72265625, -45.544921875, -43.3671875, -41.189453125, -39.01171875, -36.833984375, -34.65625, -32.478515625, -30.30078125, -28.123046875, -25.9453125, -23.767578125, -21.58984375, -19.412109375, -17.234375, -15.056640625, -12.87890625, -10.701171875, -8.5234375, -6.345703125, -4.16796875, -1.990234375, 0.1875, 2.365234375, 4.54296875, 6.720703125, 8.8984375, 11.076171875, 13.25390625, 15.431640625, 17.609375, 19.787109375, 21.96484375, 24.142578125, 26.3203125, 28.498046875, 30.67578125, 32.853515625, 35.03125, 37.208984375, 39.38671875, 41.564453125, 43.7421875, 45.919921875, 48.09765625, 50.275390625, 52.453125, 54.630859375, 56.80859375, 58.986328125, 61.1640625, 63.341796875, 65.51953125, 67.697265625, 69.875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 8.0, 12.0, 15.0, 13.0, 12.0, 17.0, 16.0, 27.0, 23.0, 22.0, 23.0, 31.0, 36.0, 33.0, 44.0, 42.0, 32.0, 40.0, 44.0, 39.0, 33.0, 44.0, 43.0, 35.0, 29.0, 20.0, 25.0, 34.0, 24.0, 22.0, 19.0, 20.0, 15.0, 17.0, 15.0, 15.0, 12.0, 7.0, 7.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.25, -56.36865234375, -54.4873046875, -52.60595703125, -50.724609375, -48.84326171875, -46.9619140625, -45.08056640625, -43.19921875, -41.31787109375, -39.4365234375, -37.55517578125, -35.673828125, -33.79248046875, -31.9111328125, -30.02978515625, -28.1484375, -26.26708984375, -24.3857421875, -22.50439453125, -20.623046875, -18.74169921875, -16.8603515625, -14.97900390625, -13.09765625, -11.21630859375, -9.3349609375, -7.45361328125, -5.572265625, -3.69091796875, -1.8095703125, 0.07177734375, 1.953125, 3.83447265625, 5.7158203125, 7.59716796875, 9.478515625, 11.35986328125, 13.2412109375, 15.12255859375, 17.00390625, 18.88525390625, 20.7666015625, 22.64794921875, 24.529296875, 26.41064453125, 28.2919921875, 30.17333984375, 32.0546875, 33.93603515625, 35.8173828125, 37.69873046875, 39.580078125, 41.46142578125, 43.3427734375, 45.22412109375, 47.10546875, 48.98681640625, 50.8681640625, 52.74951171875, 54.630859375, 56.51220703125, 58.3935546875, 60.27490234375, 62.15625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 17.0, 6.0, 10.0, 16.0, 21.0, 30.0, 35.0, 42.0, 66.0, 107.0, 168.0, 218.0, 360.0, 611.0, 1270.0, 2560.0, 5870.0, 15853.0, 53792.0, 271030.0, 543304.0, 109049.0, 27257.0, 9253.0, 3743.0, 1632.0, 808.0, 479.0, 324.0, 192.0, 101.0, 96.0, 49.0, 45.0, 34.0, 28.0, 21.0, 13.0, 8.0, 9.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-156.25, -151.248046875, -146.24609375, -141.244140625, -136.2421875, -131.240234375, -126.23828125, -121.236328125, -116.234375, -111.232421875, -106.23046875, -101.228515625, -96.2265625, -91.224609375, -86.22265625, -81.220703125, -76.21875, -71.216796875, -66.21484375, -61.212890625, -56.2109375, -51.208984375, -46.20703125, -41.205078125, -36.203125, -31.201171875, -26.19921875, -21.197265625, -16.1953125, -11.193359375, -6.19140625, -1.189453125, 3.8125, 8.814453125, 13.81640625, 18.818359375, 23.8203125, 28.822265625, 33.82421875, 38.826171875, 43.828125, 48.830078125, 53.83203125, 58.833984375, 63.8359375, 68.837890625, 73.83984375, 78.841796875, 83.84375, 88.845703125, 93.84765625, 98.849609375, 103.8515625, 108.853515625, 113.85546875, 118.857421875, 123.859375, 128.861328125, 133.86328125, 138.865234375, 143.8671875, 148.869140625, 153.87109375, 158.873046875, 163.875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 14.0, 17.0, 13.0, 12.0, 14.0, 18.0, 25.0, 24.0, 32.0, 41.0, 43.0, 58.0, 45.0, 46.0, 45.0, 45.0, 45.0, 55.0, 55.0, 43.0, 42.0, 47.0, 24.0, 35.0, 28.0, 14.0, 25.0, 13.0, 20.0, 12.0, 7.0, 6.0, 5.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-65.25, -63.41455078125, -61.5791015625, -59.74365234375, -57.908203125, -56.07275390625, -54.2373046875, -52.40185546875, -50.56640625, -48.73095703125, -46.8955078125, -45.06005859375, -43.224609375, -41.38916015625, -39.5537109375, -37.71826171875, -35.8828125, -34.04736328125, -32.2119140625, -30.37646484375, -28.541015625, -26.70556640625, -24.8701171875, -23.03466796875, -21.19921875, -19.36376953125, -17.5283203125, -15.69287109375, -13.857421875, -12.02197265625, -10.1865234375, -8.35107421875, -6.515625, -4.68017578125, -2.8447265625, -1.00927734375, 0.826171875, 2.66162109375, 4.4970703125, 6.33251953125, 8.16796875, 10.00341796875, 11.8388671875, 13.67431640625, 15.509765625, 17.34521484375, 19.1806640625, 21.01611328125, 22.8515625, 24.68701171875, 26.5224609375, 28.35791015625, 30.193359375, 32.02880859375, 33.8642578125, 35.69970703125, 37.53515625, 39.37060546875, 41.2060546875, 43.04150390625, 44.876953125, 46.71240234375, 48.5478515625, 50.38330078125, 52.21875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 5.0, 14.0, 17.0, 19.0, 23.0, 25.0, 49.0, 63.0, 89.0, 135.0, 157.0, 252.0, 381.0, 555.0, 840.0, 1501.0, 2879.0, 5723.0, 13335.0, 40398.0, 185929.0, 610044.0, 131742.0, 31972.0, 11194.0, 4957.0, 2445.0, 1299.0, 765.0, 510.0, 361.0, 242.0, 164.0, 136.0, 90.0, 64.0, 51.0, 33.0, 23.0, 12.0, 14.0, 13.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-117.6875, -114.2666015625, -110.845703125, -107.4248046875, -104.00390625, -100.5830078125, -97.162109375, -93.7412109375, -90.3203125, -86.8994140625, -83.478515625, -80.0576171875, -76.63671875, -73.2158203125, -69.794921875, -66.3740234375, -62.953125, -59.5322265625, -56.111328125, -52.6904296875, -49.26953125, -45.8486328125, -42.427734375, -39.0068359375, -35.5859375, -32.1650390625, -28.744140625, -25.3232421875, -21.90234375, -18.4814453125, -15.060546875, -11.6396484375, -8.21875, -4.7978515625, -1.376953125, 2.0439453125, 5.46484375, 8.8857421875, 12.306640625, 15.7275390625, 19.1484375, 22.5693359375, 25.990234375, 29.4111328125, 32.83203125, 36.2529296875, 39.673828125, 43.0947265625, 46.515625, 49.9365234375, 53.357421875, 56.7783203125, 60.19921875, 63.6201171875, 67.041015625, 70.4619140625, 73.8828125, 77.3037109375, 80.724609375, 84.1455078125, 87.56640625, 90.9873046875, 94.408203125, 97.8291015625, 101.25]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 4.0, 3.0, 5.0, 7.0, 10.0, 17.0, 33.0, 36.0, 37.0, 54.0, 89.0, 110.0, 132.0, 107.0, 97.0, 71.0, 53.0, 29.0, 22.0, 26.0, 10.0, 9.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00237274169921875, -0.002311334013938904, -0.0022499263286590576, -0.0021885186433792114, -0.0021271109580993652, -0.002065703272819519, -0.002004295587539673, -0.0019428879022598267, -0.0018814802169799805, -0.0018200725317001343, -0.001758664846420288, -0.001697257161140442, -0.0016358494758605957, -0.0015744417905807495, -0.0015130341053009033, -0.0014516264200210571, -0.001390218734741211, -0.0013288110494613647, -0.0012674033641815186, -0.0012059956789016724, -0.0011445879936218262, -0.00108318030834198, -0.0010217726230621338, -0.0009603649377822876, -0.0008989572525024414, -0.0008375495672225952, -0.000776141881942749, -0.0007147341966629028, -0.0006533265113830566, -0.0005919188261032104, -0.0005305111408233643, -0.00046910345554351807, -0.0004076957702636719, -0.0003462880849838257, -0.0002848803997039795, -0.0002234727144241333, -0.0001620650291442871, -0.00010065734386444092, -3.9249658584594727e-05, 2.2158026695251465e-05, 8.356571197509766e-05, 0.00014497339725494385, 0.00020638108253479004, 0.00026778876781463623, 0.0003291964530944824, 0.0003906041383743286, 0.0004520118236541748, 0.000513419508934021, 0.0005748271942138672, 0.0006362348794937134, 0.0006976425647735596, 0.0007590502500534058, 0.000820457935333252, 0.0008818656206130981, 0.0009432733058929443, 0.0010046809911727905, 0.0010660886764526367, 0.001127496361732483, 0.001188904047012329, 0.0012503117322921753, 0.0013117194175720215, 0.0013731271028518677, 0.0014345347881317139, 0.00149594247341156, 0.0015573501586914062]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 2.0, 8.0, 6.0, 8.0, 15.0, 25.0, 32.0, 45.0, 68.0, 96.0, 123.0, 195.0, 276.0, 364.0, 519.0, 815.0, 1280.0, 1951.0, 3069.0, 5004.0, 8324.0, 15063.0, 28612.0, 58348.0, 127837.0, 270640.0, 271351.0, 129280.0, 58637.0, 28750.0, 15081.0, 8560.0, 5206.0, 3161.0, 1908.0, 1316.0, 828.0, 553.0, 384.0, 241.0, 175.0, 126.0, 96.0, 54.0, 48.0, 33.0, 15.0, 13.0, 10.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.96875, -50.23681640625, -48.5048828125, -46.77294921875, -45.041015625, -43.30908203125, -41.5771484375, -39.84521484375, -38.11328125, -36.38134765625, -34.6494140625, -32.91748046875, -31.185546875, -29.45361328125, -27.7216796875, -25.98974609375, -24.2578125, -22.52587890625, -20.7939453125, -19.06201171875, -17.330078125, -15.59814453125, -13.8662109375, -12.13427734375, -10.40234375, -8.67041015625, -6.9384765625, -5.20654296875, -3.474609375, -1.74267578125, -0.0107421875, 1.72119140625, 3.453125, 5.18505859375, 6.9169921875, 8.64892578125, 10.380859375, 12.11279296875, 13.8447265625, 15.57666015625, 17.30859375, 19.04052734375, 20.7724609375, 22.50439453125, 24.236328125, 25.96826171875, 27.7001953125, 29.43212890625, 31.1640625, 32.89599609375, 34.6279296875, 36.35986328125, 38.091796875, 39.82373046875, 41.5556640625, 43.28759765625, 45.01953125, 46.75146484375, 48.4833984375, 50.21533203125, 51.947265625, 53.67919921875, 55.4111328125, 57.14306640625, 58.875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 6.0, 5.0, 7.0, 8.0, 7.0, 12.0, 18.0, 24.0, 16.0, 33.0, 47.0, 60.0, 45.0, 63.0, 77.0, 54.0, 55.0, 69.0, 53.0, 50.0, 55.0, 37.0, 31.0, 30.0, 26.0, 14.0, 16.0, 12.0, 10.0, 6.0, 7.0, 10.0, 9.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.25, -34.2421875, -33.234375, -32.2265625, -31.21875, -30.2109375, -29.203125, -28.1953125, -27.1875, -26.1796875, -25.171875, -24.1640625, -23.15625, -22.1484375, -21.140625, -20.1328125, -19.125, -18.1171875, -17.109375, -16.1015625, -15.09375, -14.0859375, -13.078125, -12.0703125, -11.0625, -10.0546875, -9.046875, -8.0390625, -7.03125, -6.0234375, -5.015625, -4.0078125, -3.0, -1.9921875, -0.984375, 0.0234375, 1.03125, 2.0390625, 3.046875, 4.0546875, 5.0625, 6.0703125, 7.078125, 8.0859375, 9.09375, 10.1015625, 11.109375, 12.1171875, 13.125, 14.1328125, 15.140625, 16.1484375, 17.15625, 18.1640625, 19.171875, 20.1796875, 21.1875, 22.1953125, 23.203125, 24.2109375, 25.21875, 26.2265625, 27.234375, 28.2421875, 29.25]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 12.0, 18.0, 28.0, 42.0, 33.0, 42.0, 52.0, 53.0, 50.0, 70.0, 49.0, 67.0, 55.0, 53.0, 53.0, 48.0, 44.0, 31.0, 32.0, 29.0, 24.0, 13.0, 18.0, 17.0, 13.0, 8.0, 10.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.668922424316406, -45.141170501708984, -43.61341857910156, -42.085662841796875, -40.55791091918945, -39.03015899658203, -37.50240707397461, -35.97465515136719, -34.4468994140625, -32.91914749145508, -31.391393661499023, -29.8636417388916, -28.335887908935547, -26.808135986328125, -25.280384063720703, -23.75263023376465, -22.224878311157227, -20.697126388549805, -19.16937255859375, -17.641620635986328, -16.113866806030273, -14.586114883422852, -13.058362007141113, -11.530609130859375, -10.002856254577637, -8.475103378295898, -6.94735050201416, -5.41959810256958, -3.891845226287842, -2.3640923500061035, -0.8363399505615234, 0.6914129257202148, 2.219165802001953, 3.7469186782836914, 5.27467155456543, 6.80242395401001, 8.330177307128906, 9.857929229736328, 11.385682106018066, 12.913434982299805, 14.441187858581543, 15.968940734863281, 17.496692657470703, 19.024446487426758, 20.55219841003418, 22.079952239990234, 23.607704162597656, 25.135456085205078, 26.663209915161133, 28.190961837768555, 29.71871566772461, 31.24646759033203, 32.77421951293945, 34.30197525024414, 35.82972717285156, 37.357479095458984, 38.885231018066406, 40.41298294067383, 41.94073486328125, 43.46849060058594, 44.99624252319336, 46.52399444580078, 48.0517463684082, 49.579498291015625, 51.10725402832031]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 11.0, 13.0, 10.0, 12.0, 8.0, 12.0, 16.0, 17.0, 21.0, 21.0, 32.0, 36.0, 36.0, 33.0, 26.0, 50.0, 35.0, 41.0, 35.0, 48.0, 45.0, 38.0, 31.0, 32.0, 38.0, 41.0, 37.0, 26.0, 22.0, 25.0, 16.0, 21.0, 19.0, 26.0, 16.0, 20.0, 5.0, 9.0, 5.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.77210235595703, -74.27994537353516, -71.78778839111328, -69.29562377929688, -66.803466796875, -64.31130981445312, -61.81915283203125, -59.326995849609375, -56.8348388671875, -54.342681884765625, -51.850521087646484, -49.35836410522461, -46.866207122802734, -44.374046325683594, -41.88188934326172, -39.389732360839844, -36.8975715637207, -34.40541458129883, -31.91325569152832, -29.421096801757812, -26.928939819335938, -24.43678092956543, -21.944622039794922, -19.452465057373047, -16.96030616760254, -14.468148231506348, -11.975990295410156, -9.483831405639648, -6.991673469543457, -4.499515533447266, -2.007356643676758, 0.4848003387451172, 2.976959228515625, 5.469117164611816, 7.961275577545166, 10.453433990478516, 12.945591926574707, 15.437749862670898, 17.929908752441406, 20.42206573486328, 22.91422462463379, 25.406383514404297, 27.898540496826172, 30.39069938659668, 32.88285827636719, 35.37501525878906, 37.86717224121094, 40.35932922363281, 42.85149002075195, 45.34364700317383, 47.83580780029297, 50.327964782714844, 52.82012176513672, 55.312278747558594, 57.804439544677734, 60.29659652709961, 62.78875732421875, 65.28091430664062, 67.7730712890625, 70.26522827148438, 72.75739288330078, 75.24954986572266, 77.74170684814453, 80.2338638305664, 82.72602081298828]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 23.0, 27.0, 37.0, 50.0, 87.0, 149.0, 232.0, 316.0, 489.0, 724.0, 1301.0, 2103.0, 3719.0, 6544.0, 11856.0, 22506.0, 43857.0, 87429.0, 168590.0, 244540.0, 208717.0, 119328.0, 60058.0, 29967.0, 15632.0, 8538.0, 4710.0, 2803.0, 1559.0, 958.0, 565.0, 385.0, 254.0, 169.0, 114.0, 71.0, 47.0, 21.0, 14.0, 11.0, 16.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.34375, -57.34716796875, -55.3505859375, -53.35400390625, -51.357421875, -49.36083984375, -47.3642578125, -45.36767578125, -43.37109375, -41.37451171875, -39.3779296875, -37.38134765625, -35.384765625, -33.38818359375, -31.3916015625, -29.39501953125, -27.3984375, -25.40185546875, -23.4052734375, -21.40869140625, -19.412109375, -17.41552734375, -15.4189453125, -13.42236328125, -11.42578125, -9.42919921875, -7.4326171875, -5.43603515625, -3.439453125, -1.44287109375, 0.5537109375, 2.55029296875, 4.546875, 6.54345703125, 8.5400390625, 10.53662109375, 12.533203125, 14.52978515625, 16.5263671875, 18.52294921875, 20.51953125, 22.51611328125, 24.5126953125, 26.50927734375, 28.505859375, 30.50244140625, 32.4990234375, 34.49560546875, 36.4921875, 38.48876953125, 40.4853515625, 42.48193359375, 44.478515625, 46.47509765625, 48.4716796875, 50.46826171875, 52.46484375, 54.46142578125, 56.4580078125, 58.45458984375, 60.451171875, 62.44775390625, 64.4443359375, 66.44091796875, 68.4375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 14.0, 15.0, 9.0, 9.0, 12.0, 18.0, 20.0, 19.0, 23.0, 24.0, 33.0, 36.0, 41.0, 39.0, 38.0, 46.0, 30.0, 40.0, 51.0, 44.0, 43.0, 25.0, 32.0, 49.0, 37.0, 34.0, 26.0, 25.0, 16.0, 25.0, 18.0, 22.0, 18.0, 13.0, 12.0, 13.0, 7.0, 3.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.125, -70.728515625, -68.33203125, -65.935546875, -63.5390625, -61.142578125, -58.74609375, -56.349609375, -53.953125, -51.556640625, -49.16015625, -46.763671875, -44.3671875, -41.970703125, -39.57421875, -37.177734375, -34.78125, -32.384765625, -29.98828125, -27.591796875, -25.1953125, -22.798828125, -20.40234375, -18.005859375, -15.609375, -13.212890625, -10.81640625, -8.419921875, -6.0234375, -3.626953125, -1.23046875, 1.166015625, 3.5625, 5.958984375, 8.35546875, 10.751953125, 13.1484375, 15.544921875, 17.94140625, 20.337890625, 22.734375, 25.130859375, 27.52734375, 29.923828125, 32.3203125, 34.716796875, 37.11328125, 39.509765625, 41.90625, 44.302734375, 46.69921875, 49.095703125, 51.4921875, 53.888671875, 56.28515625, 58.681640625, 61.078125, 63.474609375, 65.87109375, 68.267578125, 70.6640625, 73.060546875, 75.45703125, 77.853515625, 80.25]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 15.0, 18.0, 23.0, 30.0, 62.0, 90.0, 113.0, 169.0, 254.0, 389.0, 631.0, 920.0, 1340.0, 2029.0, 3126.0, 4679.0, 7730.0, 12073.0, 19666.0, 34555.0, 62888.0, 131513.0, 270615.0, 245658.0, 114003.0, 56183.0, 30727.0, 18043.0, 10999.0, 6999.0, 4438.0, 2900.0, 1920.0, 1255.0, 797.0, 578.0, 382.0, 218.0, 169.0, 118.0, 71.0, 59.0, 37.0, 27.0, 16.0, 11.0, 3.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 3.0], "bins": [-114.25, -110.7783203125, -107.306640625, -103.8349609375, -100.36328125, -96.8916015625, -93.419921875, -89.9482421875, -86.4765625, -83.0048828125, -79.533203125, -76.0615234375, -72.58984375, -69.1181640625, -65.646484375, -62.1748046875, -58.703125, -55.2314453125, -51.759765625, -48.2880859375, -44.81640625, -41.3447265625, -37.873046875, -34.4013671875, -30.9296875, -27.4580078125, -23.986328125, -20.5146484375, -17.04296875, -13.5712890625, -10.099609375, -6.6279296875, -3.15625, 0.3154296875, 3.787109375, 7.2587890625, 10.73046875, 14.2021484375, 17.673828125, 21.1455078125, 24.6171875, 28.0888671875, 31.560546875, 35.0322265625, 38.50390625, 41.9755859375, 45.447265625, 48.9189453125, 52.390625, 55.8623046875, 59.333984375, 62.8056640625, 66.27734375, 69.7490234375, 73.220703125, 76.6923828125, 80.1640625, 83.6357421875, 87.107421875, 90.5791015625, 94.05078125, 97.5224609375, 100.994140625, 104.4658203125, 107.9375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 9.0, 8.0, 10.0, 15.0, 12.0, 11.0, 17.0, 20.0, 23.0, 27.0, 34.0, 28.0, 42.0, 38.0, 48.0, 43.0, 56.0, 45.0, 43.0, 58.0, 41.0, 46.0, 44.0, 31.0, 30.0, 30.0, 33.0, 21.0, 22.0, 8.0, 12.0, 17.0, 11.0, 5.0, 13.0, 10.0, 4.0, 10.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-60.40625, -58.52880859375, -56.6513671875, -54.77392578125, -52.896484375, -51.01904296875, -49.1416015625, -47.26416015625, -45.38671875, -43.50927734375, -41.6318359375, -39.75439453125, -37.876953125, -35.99951171875, -34.1220703125, -32.24462890625, -30.3671875, -28.48974609375, -26.6123046875, -24.73486328125, -22.857421875, -20.97998046875, -19.1025390625, -17.22509765625, -15.34765625, -13.47021484375, -11.5927734375, -9.71533203125, -7.837890625, -5.96044921875, -4.0830078125, -2.20556640625, -0.328125, 1.54931640625, 3.4267578125, 5.30419921875, 7.181640625, 9.05908203125, 10.9365234375, 12.81396484375, 14.69140625, 16.56884765625, 18.4462890625, 20.32373046875, 22.201171875, 24.07861328125, 25.9560546875, 27.83349609375, 29.7109375, 31.58837890625, 33.4658203125, 35.34326171875, 37.220703125, 39.09814453125, 40.9755859375, 42.85302734375, 44.73046875, 46.60791015625, 48.4853515625, 50.36279296875, 52.240234375, 54.11767578125, 55.9951171875, 57.87255859375, 59.75]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 4.0, 9.0, 11.0, 15.0, 31.0, 38.0, 57.0, 85.0, 123.0, 160.0, 243.0, 303.0, 475.0, 653.0, 958.0, 1488.0, 2286.0, 3800.0, 6425.0, 11648.0, 23118.0, 51404.0, 145839.0, 401533.0, 248916.0, 78943.0, 32761.0, 15562.0, 8469.0, 4835.0, 2800.0, 1797.0, 1167.0, 777.0, 541.0, 336.0, 276.0, 224.0, 123.0, 89.0, 72.0, 49.0, 31.0, 19.0, 20.0, 14.0, 10.0, 6.0, 3.0, 4.0, 3.0, 2.0], "bins": [-55.4375, -53.8857421875, -52.333984375, -50.7822265625, -49.23046875, -47.6787109375, -46.126953125, -44.5751953125, -43.0234375, -41.4716796875, -39.919921875, -38.3681640625, -36.81640625, -35.2646484375, -33.712890625, -32.1611328125, -30.609375, -29.0576171875, -27.505859375, -25.9541015625, -24.40234375, -22.8505859375, -21.298828125, -19.7470703125, -18.1953125, -16.6435546875, -15.091796875, -13.5400390625, -11.98828125, -10.4365234375, -8.884765625, -7.3330078125, -5.78125, -4.2294921875, -2.677734375, -1.1259765625, 0.42578125, 1.9775390625, 3.529296875, 5.0810546875, 6.6328125, 8.1845703125, 9.736328125, 11.2880859375, 12.83984375, 14.3916015625, 15.943359375, 17.4951171875, 19.046875, 20.5986328125, 22.150390625, 23.7021484375, 25.25390625, 26.8056640625, 28.357421875, 29.9091796875, 31.4609375, 33.0126953125, 34.564453125, 36.1162109375, 37.66796875, 39.2197265625, 40.771484375, 42.3232421875, 43.875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 3.0, 15.0, 24.0, 17.0, 44.0, 73.0, 74.0, 114.0, 121.0, 111.0, 115.0, 86.0, 57.0, 49.0, 34.0, 21.0, 12.0, 6.0, 12.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0048370361328125, -0.004727572202682495, -0.00461810827255249, -0.004508644342422485, -0.0043991804122924805, -0.004289716482162476, -0.004180252552032471, -0.004070788621902466, -0.003961324691772461, -0.003851860761642456, -0.003742396831512451, -0.0036329329013824463, -0.0035234689712524414, -0.0034140050411224365, -0.0033045411109924316, -0.0031950771808624268, -0.003085613250732422, -0.002976149320602417, -0.002866685390472412, -0.0027572214603424072, -0.0026477575302124023, -0.0025382936000823975, -0.0024288296699523926, -0.0023193657398223877, -0.002209901809692383, -0.002100437879562378, -0.001990973949432373, -0.0018815100193023682, -0.0017720460891723633, -0.0016625821590423584, -0.0015531182289123535, -0.0014436542987823486, -0.0013341903686523438, -0.0012247264385223389, -0.001115262508392334, -0.001005798578262329, -0.0008963346481323242, -0.0007868707180023193, -0.0006774067878723145, -0.0005679428577423096, -0.0004584789276123047, -0.0003490149974822998, -0.00023955106735229492, -0.00013008713722229004, -2.0623207092285156e-05, 8.884072303771973e-05, 0.0001983046531677246, 0.0003077685832977295, 0.0004172325134277344, 0.0005266964435577393, 0.0006361603736877441, 0.000745624303817749, 0.0008550882339477539, 0.0009645521640777588, 0.0010740160942077637, 0.0011834800243377686, 0.0012929439544677734, 0.0014024078845977783, 0.0015118718147277832, 0.001621335744857788, 0.001730799674987793, 0.0018402636051177979, 0.0019497275352478027, 0.0020591914653778076, 0.0021686553955078125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 3.0, 13.0, 11.0, 25.0, 22.0, 36.0, 45.0, 55.0, 91.0, 106.0, 140.0, 204.0, 255.0, 405.0, 547.0, 769.0, 1160.0, 1846.0, 2903.0, 4900.0, 8313.0, 14806.0, 28745.0, 61179.0, 142480.0, 286756.0, 261413.0, 120688.0, 52609.0, 24961.0, 13270.0, 7425.0, 4369.0, 2609.0, 1705.0, 1069.0, 700.0, 542.0, 363.0, 266.0, 192.0, 156.0, 105.0, 82.0, 65.0, 38.0, 32.0, 28.0, 20.0, 8.0, 8.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0], "bins": [-46.71875, -45.25439453125, -43.7900390625, -42.32568359375, -40.861328125, -39.39697265625, -37.9326171875, -36.46826171875, -35.00390625, -33.53955078125, -32.0751953125, -30.61083984375, -29.146484375, -27.68212890625, -26.2177734375, -24.75341796875, -23.2890625, -21.82470703125, -20.3603515625, -18.89599609375, -17.431640625, -15.96728515625, -14.5029296875, -13.03857421875, -11.57421875, -10.10986328125, -8.6455078125, -7.18115234375, -5.716796875, -4.25244140625, -2.7880859375, -1.32373046875, 0.140625, 1.60498046875, 3.0693359375, 4.53369140625, 5.998046875, 7.46240234375, 8.9267578125, 10.39111328125, 11.85546875, 13.31982421875, 14.7841796875, 16.24853515625, 17.712890625, 19.17724609375, 20.6416015625, 22.10595703125, 23.5703125, 25.03466796875, 26.4990234375, 27.96337890625, 29.427734375, 30.89208984375, 32.3564453125, 33.82080078125, 35.28515625, 36.74951171875, 38.2138671875, 39.67822265625, 41.142578125, 42.60693359375, 44.0712890625, 45.53564453125, 47.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 7.0, 8.0, 9.0, 22.0, 19.0, 20.0, 41.0, 40.0, 35.0, 53.0, 63.0, 72.0, 91.0, 104.0, 89.0, 51.0, 60.0, 28.0, 40.0, 28.0, 21.0, 25.0, 19.0, 11.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-27.15625, -26.3310546875, -25.505859375, -24.6806640625, -23.85546875, -23.0302734375, -22.205078125, -21.3798828125, -20.5546875, -19.7294921875, -18.904296875, -18.0791015625, -17.25390625, -16.4287109375, -15.603515625, -14.7783203125, -13.953125, -13.1279296875, -12.302734375, -11.4775390625, -10.65234375, -9.8271484375, -9.001953125, -8.1767578125, -7.3515625, -6.5263671875, -5.701171875, -4.8759765625, -4.05078125, -3.2255859375, -2.400390625, -1.5751953125, -0.75, 0.0751953125, 0.900390625, 1.7255859375, 2.55078125, 3.3759765625, 4.201171875, 5.0263671875, 5.8515625, 6.6767578125, 7.501953125, 8.3271484375, 9.15234375, 9.9775390625, 10.802734375, 11.6279296875, 12.453125, 13.2783203125, 14.103515625, 14.9287109375, 15.75390625, 16.5791015625, 17.404296875, 18.2294921875, 19.0546875, 19.8798828125, 20.705078125, 21.5302734375, 22.35546875, 23.1806640625, 24.005859375, 24.8310546875, 25.65625]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 9.0, 6.0, 8.0, 13.0, 15.0, 15.0, 16.0, 31.0, 31.0, 39.0, 42.0, 48.0, 54.0, 69.0, 66.0, 50.0, 53.0, 54.0, 53.0, 55.0, 45.0, 32.0, 24.0, 23.0, 25.0, 23.0, 17.0, 17.0, 7.0, 8.0, 9.0, 7.0, 7.0, 9.0, 8.0, 1.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.31404113769531, -39.45559310913086, -37.597145080566406, -35.73869705200195, -33.8802490234375, -32.02180099487305, -30.163352966308594, -28.30490493774414, -26.446456909179688, -24.588008880615234, -22.72956085205078, -20.871112823486328, -19.012664794921875, -17.154216766357422, -15.295769691467285, -13.437321662902832, -11.578874588012695, -9.720426559448242, -7.861978530883789, -6.003530979156494, -4.145082950592041, -2.286635398864746, -0.42818737030029297, 1.4302606582641602, 3.2887086868286133, 5.147156715393066, 7.0056047439575195, 8.864051818847656, 10.72249984741211, 12.580947875976562, 14.439395904541016, 16.29784393310547, 18.156291961669922, 20.014739990234375, 21.873188018798828, 23.73163604736328, 25.590084075927734, 27.448532104492188, 29.30698013305664, 31.165428161621094, 33.02387619018555, 34.88232421875, 36.74077224731445, 38.599220275878906, 40.45766830444336, 42.31611633300781, 44.174564361572266, 46.03301239013672, 47.891456604003906, 49.74990463256836, 51.60835266113281, 53.466800689697266, 55.32524871826172, 57.18369674682617, 59.042144775390625, 60.90059280395508, 62.75904083251953, 64.61748504638672, 66.47593688964844, 68.33438110351562, 70.19283294677734, 72.05127716064453, 73.90972900390625, 75.76817321777344, 77.62662506103516]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 4.0, 8.0, 8.0, 11.0, 12.0, 15.0, 16.0, 23.0, 23.0, 24.0, 28.0, 32.0, 33.0, 44.0, 43.0, 48.0, 40.0, 44.0, 50.0, 47.0, 46.0, 42.0, 37.0, 49.0, 27.0, 35.0, 30.0, 27.0, 23.0, 27.0, 22.0, 13.0, 13.0, 9.0, 8.0, 9.0, 9.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-135.17872619628906, -131.38404846191406, -127.58937072753906, -123.79469299316406, -120.00000762939453, -116.20532989501953, -112.41065216064453, -108.61597442626953, -104.82129669189453, -101.02661895751953, -97.23194122314453, -93.437255859375, -89.642578125, -85.847900390625, -82.05322265625, -78.258544921875, -74.4638671875, -70.669189453125, -66.87451171875, -63.079830169677734, -59.285152435302734, -55.49047088623047, -51.69579315185547, -47.90111541748047, -44.10643005371094, -40.31175231933594, -36.51707077026367, -32.72239303588867, -28.927715301513672, -25.13303565979004, -21.338356018066406, -17.543678283691406, -13.749000549316406, -9.95432186126709, -6.159642696380615, -2.3649635314941406, 1.4297151565551758, 5.224393844604492, 9.019073486328125, 12.813751220703125, 16.608430862426758, 20.40311050415039, 24.19778823852539, 27.992467880249023, 31.787147521972656, 35.581825256347656, 39.376502990722656, 43.171180725097656, 46.96586227416992, 50.76054000854492, 54.55522155761719, 58.34989929199219, 62.14457702636719, 65.93925476074219, 69.73393249511719, 73.52861022949219, 77.32329559326172, 81.11797332763672, 84.91265106201172, 88.70733642578125, 92.50201416015625, 96.29669189453125, 100.09136962890625, 103.88604736328125, 107.68072509765625]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 12.0, 18.0, 40.0, 42.0, 66.0, 109.0, 137.0, 190.0, 304.0, 449.0, 617.0, 908.0, 1175.0, 1566.0, 2271.0, 2894.0, 4026.0, 5293.0, 7698.0, 469793.0, 7149.0, 5171.0, 3918.0, 2935.0, 2203.0, 1616.0, 1122.0, 817.0, 572.0, 348.0, 269.0, 184.0, 114.0, 92.0, 53.0, 33.0, 25.0, 12.0, 7.0, 8.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-323.0233459472656, -313.05865478515625, -303.093994140625, -293.12933349609375, -283.1646423339844, -273.199951171875, -263.23529052734375, -253.27061462402344, -243.30593872070312, -233.3412628173828, -223.3765869140625, -213.4119110107422, -203.44723510742188, -193.48255920410156, -183.51788330078125, -173.55320739746094, -163.58853149414062, -153.6238555908203, -143.6591796875, -133.6945037841797, -123.72982788085938, -113.76515197753906, -103.80047607421875, -93.83580017089844, -83.87112426757812, -73.90644836425781, -63.9417724609375, -53.97709655761719, -44.012420654296875, -34.04774475097656, -24.08306884765625, -14.118392944335938, -4.1536865234375, 5.8109893798828125, 15.775665283203125, 25.740341186523438, 35.70501708984375, 45.66969299316406, 55.634368896484375, 65.59904479980469, 75.563720703125, 85.52839660644531, 95.49307250976562, 105.45774841308594, 115.42242431640625, 125.38710021972656, 135.35177612304688, 145.3164520263672, 155.2811279296875, 165.2458038330078, 175.21047973632812, 185.17515563964844, 195.13983154296875, 205.10450744628906, 215.06918334960938, 225.0338592529297, 234.99853515625, 244.9632110595703, 254.92788696289062, 264.892578125, 274.85723876953125, 284.8218994140625, 294.7865905761719, 304.75128173828125, 314.7159423828125]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 4.0, 8.0, 10.0, 8.0, 13.0, 14.0, 19.0, 23.0, 22.0, 25.0, 26.0, 38.0, 27.0, 44.0, 47.0, 50.0, 42.0, 36.0, 1088.0, 39.0, 44.0, 49.0, 38.0, 45.0, 28.0, 37.0, 24.0, 31.0, 24.0, 20.0, 22.0, 13.0, 12.0, 11.0, 11.0, 3.0, 9.0, 1.0, 6.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4216.19384765625, -4097.05224609375, -3977.91064453125, -3858.76904296875, -3739.627197265625, -3620.485595703125, -3501.343994140625, -3382.202392578125, -3263.060546875, -3143.9189453125, -3024.77734375, -2905.6357421875, -2786.493896484375, -2667.352294921875, -2548.210693359375, -2429.069091796875, -2309.927490234375, -2190.785888671875, -2071.644287109375, -1952.5025634765625, -1833.36083984375, -1714.21923828125, -1595.07763671875, -1475.93603515625, -1356.7943115234375, -1237.6527099609375, -1118.510986328125, -999.369384765625, -880.2277221679688, -761.0860595703125, -641.9444580078125, -522.8027954101562, -403.6611328125, -284.51947021484375, -165.37783813476562, -46.2362060546875, 72.90545654296875, 192.047119140625, 311.188720703125, 430.33038330078125, 549.4720458984375, 668.6137084960938, 787.75537109375, 906.89697265625, 1026.03857421875, 1145.1802978515625, 1264.3218994140625, 1383.463623046875, 1502.605224609375, 1621.746826171875, 1740.8885498046875, 1860.0301513671875, 1979.171875, 2098.3134765625, 2217.455078125, 2336.5966796875, 2455.73828125, 2574.8798828125, 2694.021484375, 2813.1630859375, 2932.304931640625, 3051.446533203125, 3170.588134765625, 3289.729736328125, 3408.87158203125]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 43.0, 65.0, 62.0, 65.0, 52.0, 58.0, 57.0, 67.0, 60.0, 98.0, 101.0, 165.0, 253.0, 453.0, 999.0, 3380.0, 19315.0, 104024.0, 31038668.0, 74961.0, 7904.0, 1781.0, 645.0, 293.0, 197.0, 111.0, 87.0, 77.0, 69.0, 44.0, 46.0, 34.0, 36.0, 36.0, 27.0, 31.0, 20.0, 17.0, 9.0, 21.0, 7.0, 9.0, 14.0, 10.0, 3.0, 4.0, 9.0, 4.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-522.0484619140625, -500.6414489746094, -479.23443603515625, -457.82745361328125, -436.4204406738281, -415.013427734375, -393.6064147949219, -372.19940185546875, -350.79241943359375, -329.3854064941406, -307.9783935546875, -286.5714111328125, -265.1643981933594, -243.75738525390625, -222.35037231445312, -200.94337463378906, -179.53634643554688, -158.12933349609375, -136.7223358154297, -115.31532287597656, -93.90831756591797, -72.50131225585938, -51.09429931640625, -29.687301635742188, -8.280288696289062, 13.126718521118164, 34.53372573852539, 55.94073486328125, 77.34774017333984, 98.75474548339844, 120.16175842285156, 141.56875610351562, 162.97576904296875, 184.38278198242188, 205.78977966308594, 227.19679260253906, 248.60379028320312, 270.01080322265625, 291.4178161621094, 312.8248291015625, 334.2318115234375, 355.6388244628906, 377.04583740234375, 398.45281982421875, 419.8598327636719, 441.266845703125, 462.6738586425781, 484.08087158203125, 505.4878845214844, 526.8948974609375, 548.3018798828125, 569.7089233398438, 591.1159057617188, 612.52294921875, 633.929931640625, 655.3369140625, 676.7439575195312, 698.1509399414062, 719.5579833984375, 740.9649658203125, 762.3720092773438, 783.7789916992188, 805.18603515625, 826.593017578125, 848.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 3.0, 3.0, 7.0, 9.0, 7.0, 15.0, 22.0, 41.0, 46.0, 51.0, 92.0, 127.0, 158.0, 238.0, 358.0, 529.0, 803.0, 1149.0, 1723.0, 2571.0, 4035.0, 6291.0, 10569.0, 17298.0, 30183.0, 55657.0, 106789.0, 222712.0, 504162.0, 1301486.0, 2337244.0, 931986.0, 383044.0, 174052.0, 86277.0, 45807.0, 25604.0, 15113.0, 9008.0, 5592.0, 3573.0, 2253.0, 1517.0, 1012.0, 668.0, 465.0, 329.0, 230.0, 163.0, 132.0, 83.0, 51.0, 40.0, 21.0, 18.0, 6.0, 12.0, 5.0, 6.0, 1.0, 1.0], "bins": [-43.84375, -42.52880859375, -41.2138671875, -39.89892578125, -38.583984375, -37.26904296875, -35.9541015625, -34.63916015625, -33.32421875, -32.00927734375, -30.6943359375, -29.37939453125, -28.064453125, -26.74951171875, -25.4345703125, -24.11962890625, -22.8046875, -21.48974609375, -20.1748046875, -18.85986328125, -17.544921875, -16.22998046875, -14.9150390625, -13.60009765625, -12.28515625, -10.97021484375, -9.6552734375, -8.34033203125, -7.025390625, -5.71044921875, -4.3955078125, -3.08056640625, -1.765625, -0.45068359375, 0.8642578125, 2.17919921875, 3.494140625, 4.80908203125, 6.1240234375, 7.43896484375, 8.75390625, 10.06884765625, 11.3837890625, 12.69873046875, 14.013671875, 15.32861328125, 16.6435546875, 17.95849609375, 19.2734375, 20.58837890625, 21.9033203125, 23.21826171875, 24.533203125, 25.84814453125, 27.1630859375, 28.47802734375, 29.79296875, 31.10791015625, 32.4228515625, 33.73779296875, 35.052734375, 36.36767578125, 37.6826171875, 38.99755859375, 40.3125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 9.0, 8.0, 13.0, 17.0, 22.0, 33.0, 31.0, 33.0, 42.0, 45.0, 71.0, 101.0, 128.0, 230.0, 256.0, 231.0, 156.0, 126.0, 99.0, 70.0, 70.0, 51.0, 31.0, 33.0, 34.0, 18.0, 20.0, 15.0, 3.0, 8.0, 7.0, 4.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.75, -44.3623046875, -42.974609375, -41.5869140625, -40.19921875, -38.8115234375, -37.423828125, -36.0361328125, -34.6484375, -33.2607421875, -31.873046875, -30.4853515625, -29.09765625, -27.7099609375, -26.322265625, -24.9345703125, -23.546875, -22.1591796875, -20.771484375, -19.3837890625, -17.99609375, -16.6083984375, -15.220703125, -13.8330078125, -12.4453125, -11.0576171875, -9.669921875, -8.2822265625, -6.89453125, -5.5068359375, -4.119140625, -2.7314453125, -1.34375, 0.0439453125, 1.431640625, 2.8193359375, 4.20703125, 5.5947265625, 6.982421875, 8.3701171875, 9.7578125, 11.1455078125, 12.533203125, 13.9208984375, 15.30859375, 16.6962890625, 18.083984375, 19.4716796875, 20.859375, 22.2470703125, 23.634765625, 25.0224609375, 26.41015625, 27.7978515625, 29.185546875, 30.5732421875, 31.9609375, 33.3486328125, 34.736328125, 36.1240234375, 37.51171875, 38.8994140625, 40.287109375, 41.6748046875, 43.0625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [9.0, 9.0, 3.0, 7.0, 5.0, 6.0, 5.0, 13.0, 21.0, 18.0, 23.0, 31.0, 42.0, 88.0, 101.0, 160.0, 205.0, 285.0, 439.0, 625.0, 1063.0, 1718.0, 3007.0, 5190.0, 10057.0, 20414.0, 45231.0, 106043.0, 273906.0, 818781.0, 3176391.0, 1215033.0, 366506.0, 136773.0, 55913.0, 25596.0, 12432.0, 6374.0, 3444.0, 1926.0, 1193.0, 793.0, 538.0, 328.0, 187.0, 141.0, 112.0, 78.0, 59.0, 44.0, 29.0, 19.0, 9.0, 7.0, 7.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-35.625, -34.46240234375, -33.2998046875, -32.13720703125, -30.974609375, -29.81201171875, -28.6494140625, -27.48681640625, -26.32421875, -25.16162109375, -23.9990234375, -22.83642578125, -21.673828125, -20.51123046875, -19.3486328125, -18.18603515625, -17.0234375, -15.86083984375, -14.6982421875, -13.53564453125, -12.373046875, -11.21044921875, -10.0478515625, -8.88525390625, -7.72265625, -6.56005859375, -5.3974609375, -4.23486328125, -3.072265625, -1.90966796875, -0.7470703125, 0.41552734375, 1.578125, 2.74072265625, 3.9033203125, 5.06591796875, 6.228515625, 7.39111328125, 8.5537109375, 9.71630859375, 10.87890625, 12.04150390625, 13.2041015625, 14.36669921875, 15.529296875, 16.69189453125, 17.8544921875, 19.01708984375, 20.1796875, 21.34228515625, 22.5048828125, 23.66748046875, 24.830078125, 25.99267578125, 27.1552734375, 28.31787109375, 29.48046875, 30.64306640625, 31.8056640625, 32.96826171875, 34.130859375, 35.29345703125, 36.4560546875, 37.61865234375, 38.78125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 8.0, 9.0, 19.0, 15.0, 15.0, 34.0, 35.0, 27.0, 36.0, 55.0, 60.0, 68.0, 118.0, 201.0, 348.0, 257.0, 165.0, 112.0, 88.0, 70.0, 35.0, 46.0, 35.0, 38.0, 24.0, 17.0, 20.0, 6.0, 13.0, 4.0, 8.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-45.8125, -44.28759765625, -42.7626953125, -41.23779296875, -39.712890625, -38.18798828125, -36.6630859375, -35.13818359375, -33.61328125, -32.08837890625, -30.5634765625, -29.03857421875, -27.513671875, -25.98876953125, -24.4638671875, -22.93896484375, -21.4140625, -19.88916015625, -18.3642578125, -16.83935546875, -15.314453125, -13.78955078125, -12.2646484375, -10.73974609375, -9.21484375, -7.68994140625, -6.1650390625, -4.64013671875, -3.115234375, -1.59033203125, -0.0654296875, 1.45947265625, 2.984375, 4.50927734375, 6.0341796875, 7.55908203125, 9.083984375, 10.60888671875, 12.1337890625, 13.65869140625, 15.18359375, 16.70849609375, 18.2333984375, 19.75830078125, 21.283203125, 22.80810546875, 24.3330078125, 25.85791015625, 27.3828125, 28.90771484375, 30.4326171875, 31.95751953125, 33.482421875, 35.00732421875, 36.5322265625, 38.05712890625, 39.58203125, 41.10693359375, 42.6318359375, 44.15673828125, 45.681640625, 47.20654296875, 48.7314453125, 50.25634765625, 51.78125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 7.0, 5.0, 3.0, 11.0, 21.0, 19.0, 28.0, 61.0, 56.0, 90.0, 102.0, 142.0, 187.0, 286.0, 429.0, 608.0, 886.0, 1371.0, 2132.0, 3190.0, 5227.0, 8699.0, 14831.0, 28249.0, 61377.0, 198678.0, 5691731.0, 157272.0, 53335.0, 26035.0, 14001.0, 8324.0, 5062.0, 3109.0, 1969.0, 1185.0, 791.0, 528.0, 391.0, 263.0, 197.0, 150.0, 108.0, 82.0, 50.0, 44.0, 24.0, 28.0, 14.0, 18.0, 5.0, 8.0, 1.0, 5.0, 5.0, 3.0, 4.0, 4.0], "bins": [-91.3125, -88.4970703125, -85.681640625, -82.8662109375, -80.05078125, -77.2353515625, -74.419921875, -71.6044921875, -68.7890625, -65.9736328125, -63.158203125, -60.3427734375, -57.52734375, -54.7119140625, -51.896484375, -49.0810546875, -46.265625, -43.4501953125, -40.634765625, -37.8193359375, -35.00390625, -32.1884765625, -29.373046875, -26.5576171875, -23.7421875, -20.9267578125, -18.111328125, -15.2958984375, -12.48046875, -9.6650390625, -6.849609375, -4.0341796875, -1.21875, 1.5966796875, 4.412109375, 7.2275390625, 10.04296875, 12.8583984375, 15.673828125, 18.4892578125, 21.3046875, 24.1201171875, 26.935546875, 29.7509765625, 32.56640625, 35.3818359375, 38.197265625, 41.0126953125, 43.828125, 46.6435546875, 49.458984375, 52.2744140625, 55.08984375, 57.9052734375, 60.720703125, 63.5361328125, 66.3515625, 69.1669921875, 71.982421875, 74.7978515625, 77.61328125, 80.4287109375, 83.244140625, 86.0595703125, 88.875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 6.0, 3.0, 2.0, 5.0, 3.0, 3.0, 3.0, 7.0, 4.0, 9.0, 5.0, 9.0, 12.0, 21.0, 21.0, 16.0, 22.0, 33.0, 28.0, 38.0, 33.0, 40.0, 58.0, 113.0, 248.0, 414.0, 254.0, 128.0, 84.0, 75.0, 49.0, 42.0, 37.0, 38.0, 29.0, 17.0, 21.0, 16.0, 16.0, 17.0, 8.0, 18.0, 7.0, 6.0, 5.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.6875, -58.666015625, -56.64453125, -54.623046875, -52.6015625, -50.580078125, -48.55859375, -46.537109375, -44.515625, -42.494140625, -40.47265625, -38.451171875, -36.4296875, -34.408203125, -32.38671875, -30.365234375, -28.34375, -26.322265625, -24.30078125, -22.279296875, -20.2578125, -18.236328125, -16.21484375, -14.193359375, -12.171875, -10.150390625, -8.12890625, -6.107421875, -4.0859375, -2.064453125, -0.04296875, 1.978515625, 4.0, 6.021484375, 8.04296875, 10.064453125, 12.0859375, 14.107421875, 16.12890625, 18.150390625, 20.171875, 22.193359375, 24.21484375, 26.236328125, 28.2578125, 30.279296875, 32.30078125, 34.322265625, 36.34375, 38.365234375, 40.38671875, 42.408203125, 44.4296875, 46.451171875, 48.47265625, 50.494140625, 52.515625, 54.537109375, 56.55859375, 58.580078125, 60.6015625, 62.623046875, 64.64453125, 66.666015625, 68.6875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 6.0, 3.0, 8.0, 12.0, 14.0, 37.0, 72.0, 212.0, 451.0, 94.0, 44.0, 16.0, 15.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1816.7227783203125, -1765.09765625, -1713.4725341796875, -1661.847412109375, -1610.22216796875, -1558.59716796875, -1506.971923828125, -1455.3468017578125, -1403.7216796875, -1352.0965576171875, -1300.471435546875, -1248.8463134765625, -1197.22119140625, -1145.595947265625, -1093.9708251953125, -1042.345703125, -990.7205810546875, -939.095458984375, -887.4703369140625, -835.8451538085938, -784.2200317382812, -732.5949096679688, -680.9697265625, -629.3446044921875, -577.719482421875, -526.0943603515625, -474.4692077636719, -422.84405517578125, -371.21893310546875, -319.59381103515625, -267.9686584472656, -216.343505859375, -164.718505859375, -113.09336853027344, -61.468231201171875, -9.843093872070312, 41.78204345703125, 93.40716552734375, 145.03231811523438, 196.657470703125, 248.2825927734375, 299.90771484375, 351.5328674316406, 403.15802001953125, 454.78314208984375, 506.40826416015625, 558.033447265625, 609.6585693359375, 661.28369140625, 712.9088134765625, 764.533935546875, 816.1591186523438, 867.7842407226562, 919.4093627929688, 971.0345458984375, 1022.65966796875, 1074.2847900390625, 1125.909912109375, 1177.5350341796875, 1229.16015625, 1280.785400390625, 1332.410400390625, 1384.03564453125, 1435.6607666015625, 1487.285888671875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 6.0, 3.0, 8.0, 3.0, 4.0, 12.0, 12.0, 18.0, 53.0, 175.0, 406.0, 161.0, 40.0, 26.0, 11.0, 15.0, 12.0, 9.0, 6.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3320.310302734375, -3233.904541015625, -3147.4990234375, -3061.09326171875, -2974.687744140625, -2888.281982421875, -2801.87646484375, -2715.470703125, -2629.06494140625, -2542.6591796875, -2456.253662109375, -2369.847900390625, -2283.4423828125, -2197.03662109375, -2110.630859375, -2024.225341796875, -1937.81982421875, -1851.4141845703125, -1765.008544921875, -1678.602783203125, -1592.197265625, -1505.79150390625, -1419.3858642578125, -1332.980224609375, -1246.5745849609375, -1160.1689453125, -1073.7633056640625, -987.3576049804688, -900.9519653320312, -814.5463256835938, -728.140625, -641.7349853515625, -555.329345703125, -468.9237060546875, -382.5180358886719, -296.11236572265625, -209.70672607421875, -123.30108642578125, -36.8953857421875, 49.51025390625, 135.9158935546875, 222.32154846191406, 308.7272033691406, 395.13287353515625, 481.53851318359375, 567.9441528320312, 654.349853515625, 740.7554931640625, 827.1611328125, 913.5667724609375, 999.972412109375, 1086.378173828125, 1172.78369140625, 1259.189453125, 1345.5950927734375, 1432.000732421875, 1518.4063720703125, 1604.81201171875, 1691.2176513671875, 1777.623291015625, 1864.029052734375, 1950.4345703125, 2036.84033203125, 2123.24609375, 2209.651611328125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 12.0, 8.0, 12.0, 18.0, 27.0, 32.0, 61.0, 69.0, 93.0, 161.0, 244.0, 363.0, 462.0, 724.0, 1150.0, 1864.0, 3038.0, 5397.0, 9725.0, 19862.0, 47779.0, 224791.0, 3667938.0, 132294.0, 39843.0, 16953.0, 8382.0, 4782.0, 2934.0, 1782.0, 1200.0, 723.0, 531.0, 352.0, 205.0, 150.0, 94.0, 89.0, 51.0, 28.0, 22.0, 17.0, 6.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1953125, -11.7325439453125, -11.269775390625, -10.8070068359375, -10.34423828125, -9.8814697265625, -9.418701171875, -8.9559326171875, -8.4931640625, -8.0303955078125, -7.567626953125, -7.1048583984375, -6.64208984375, -6.1793212890625, -5.716552734375, -5.2537841796875, -4.791015625, -4.3282470703125, -3.865478515625, -3.4027099609375, -2.93994140625, -2.4771728515625, -2.014404296875, -1.5516357421875, -1.0888671875, -0.6260986328125, -0.163330078125, 0.2994384765625, 0.76220703125, 1.2249755859375, 1.687744140625, 2.1505126953125, 2.61328125, 3.0760498046875, 3.538818359375, 4.0015869140625, 4.46435546875, 4.9271240234375, 5.389892578125, 5.8526611328125, 6.3154296875, 6.7781982421875, 7.240966796875, 7.7037353515625, 8.16650390625, 8.6292724609375, 9.092041015625, 9.5548095703125, 10.017578125, 10.4803466796875, 10.943115234375, 11.4058837890625, 11.86865234375, 12.3314208984375, 12.794189453125, 13.2569580078125, 13.7197265625, 14.1824951171875, 14.645263671875, 15.1080322265625, 15.57080078125, 16.0335693359375, 16.496337890625, 16.9591064453125, 17.421875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 4.0, 9.0, 6.0, 16.0, 12.0, 16.0, 37.0, 90.0, 388.0, 248.0, 47.0, 19.0, 18.0, 18.0, 10.0, 9.0, 5.0, 7.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6357421875, -1.5843658447265625, -1.532989501953125, -1.4816131591796875, -1.43023681640625, -1.3788604736328125, -1.327484130859375, -1.2761077880859375, -1.2247314453125, -1.1733551025390625, -1.121978759765625, -1.0706024169921875, -1.01922607421875, -0.9678497314453125, -0.916473388671875, -0.8650970458984375, -0.813720703125, -0.7623443603515625, -0.710968017578125, -0.6595916748046875, -0.60821533203125, -0.5568389892578125, -0.505462646484375, -0.4540863037109375, -0.4027099609375, -0.3513336181640625, -0.299957275390625, -0.2485809326171875, -0.19720458984375, -0.1458282470703125, -0.094451904296875, -0.0430755615234375, 0.00830078125, 0.0596771240234375, 0.111053466796875, 0.1624298095703125, 0.21380615234375, 0.2651824951171875, 0.316558837890625, 0.3679351806640625, 0.4193115234375, 0.4706878662109375, 0.522064208984375, 0.5734405517578125, 0.62481689453125, 0.6761932373046875, 0.727569580078125, 0.7789459228515625, 0.830322265625, 0.8816986083984375, 0.933074951171875, 0.9844512939453125, 1.03582763671875, 1.0872039794921875, 1.138580322265625, 1.1899566650390625, 1.2413330078125, 1.2927093505859375, 1.344085693359375, 1.3954620361328125, 1.44683837890625, 1.4982147216796875, 1.549591064453125, 1.6009674072265625, 1.65234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 9.0, 22.0, 17.0, 32.0, 36.0, 52.0, 88.0, 140.0, 175.0, 240.0, 384.0, 569.0, 932.0, 1685.0, 3075.0, 5987.0, 13551.0, 35308.0, 125944.0, 935148.0, 2761315.0, 219647.0, 54073.0, 18800.0, 7894.0, 3811.0, 2059.0, 1185.0, 710.0, 428.0, 264.0, 203.0, 140.0, 82.0, 73.0, 47.0, 36.0, 26.0, 19.0, 18.0, 13.0, 8.0, 5.0, 6.0, 1.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.3671875, -12.924072265625, -12.48095703125, -12.037841796875, -11.5947265625, -11.151611328125, -10.70849609375, -10.265380859375, -9.822265625, -9.379150390625, -8.93603515625, -8.492919921875, -8.0498046875, -7.606689453125, -7.16357421875, -6.720458984375, -6.27734375, -5.834228515625, -5.39111328125, -4.947998046875, -4.5048828125, -4.061767578125, -3.61865234375, -3.175537109375, -2.732421875, -2.289306640625, -1.84619140625, -1.403076171875, -0.9599609375, -0.516845703125, -0.07373046875, 0.369384765625, 0.8125, 1.255615234375, 1.69873046875, 2.141845703125, 2.5849609375, 3.028076171875, 3.47119140625, 3.914306640625, 4.357421875, 4.800537109375, 5.24365234375, 5.686767578125, 6.1298828125, 6.572998046875, 7.01611328125, 7.459228515625, 7.90234375, 8.345458984375, 8.78857421875, 9.231689453125, 9.6748046875, 10.117919921875, 10.56103515625, 11.004150390625, 11.447265625, 11.890380859375, 12.33349609375, 12.776611328125, 13.2197265625, 13.662841796875, 14.10595703125, 14.549072265625, 14.9921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 7.0, 5.0, 5.0, 8.0, 7.0, 9.0, 6.0, 17.0, 15.0, 25.0, 27.0, 43.0, 51.0, 50.0, 70.0, 67.0, 79.0, 101.0, 129.0, 189.0, 219.0, 292.0, 511.0, 505.0, 335.0, 222.0, 197.0, 145.0, 112.0, 111.0, 98.0, 68.0, 59.0, 59.0, 43.0, 34.0, 31.0, 20.0, 25.0, 12.0, 12.0, 10.0, 14.0, 5.0, 3.0, 6.0, 4.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-2.6796875, -2.595855712890625, -2.51202392578125, -2.428192138671875, -2.3443603515625, -2.260528564453125, -2.17669677734375, -2.092864990234375, -2.009033203125, -1.925201416015625, -1.84136962890625, -1.757537841796875, -1.6737060546875, -1.589874267578125, -1.50604248046875, -1.422210693359375, -1.33837890625, -1.254547119140625, -1.17071533203125, -1.086883544921875, -1.0030517578125, -0.919219970703125, -0.83538818359375, -0.751556396484375, -0.667724609375, -0.583892822265625, -0.50006103515625, -0.416229248046875, -0.3323974609375, -0.248565673828125, -0.16473388671875, -0.080902099609375, 0.0029296875, 0.086761474609375, 0.17059326171875, 0.254425048828125, 0.3382568359375, 0.422088623046875, 0.50592041015625, 0.589752197265625, 0.673583984375, 0.757415771484375, 0.84124755859375, 0.925079345703125, 1.0089111328125, 1.092742919921875, 1.17657470703125, 1.260406494140625, 1.34423828125, 1.428070068359375, 1.51190185546875, 1.595733642578125, 1.6795654296875, 1.763397216796875, 1.84722900390625, 1.931060791015625, 2.014892578125, 2.098724365234375, 2.18255615234375, 2.266387939453125, 2.3502197265625, 2.434051513671875, 2.51788330078125, 2.601715087890625, 2.685546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 7.0, 11.0, 11.0, 20.0, 60.0, 130.0, 260.0, 240.0, 98.0, 66.0, 44.0, 15.0, 14.0, 12.0, 10.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.200767517089844, -32.062713623046875, -29.92465591430664, -27.786602020263672, -25.64854621887207, -23.51049041748047, -21.3724365234375, -19.2343807220459, -17.096324920654297, -14.958269119262695, -12.82021427154541, -10.682159423828125, -8.544103622436523, -6.406047821044922, -4.267992973327637, -2.1299381256103516, 0.00811767578125, 2.1461730003356934, 4.284228324890137, 6.42228364944458, 8.560338973999023, 10.698394775390625, 12.83644962310791, 14.974504470825195, 17.112560272216797, 19.2506160736084, 21.388671875, 23.52672576904297, 25.66478157043457, 27.802837371826172, 29.94089126586914, 32.078948974609375, 34.21699523925781, 36.35504913330078, 38.493106842041016, 40.631160736083984, 42.76921844482422, 44.90727233886719, 47.045326232910156, 49.183380126953125, 51.32143783569336, 53.45949172973633, 55.59754943847656, 57.73560333251953, 59.8736572265625, 62.011714935302734, 64.14977264404297, 66.28782653808594, 68.4258804321289, 70.56393432617188, 72.70198822021484, 74.84004974365234, 76.97810363769531, 79.11615753173828, 81.25421142578125, 83.39226531982422, 85.53031921386719, 87.66837310791016, 89.80642700195312, 91.94448852539062, 94.0825424194336, 96.22059631347656, 98.35865020751953, 100.4967041015625, 102.634765625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 9.0, 6.0, 12.0, 18.0, 16.0, 24.0, 32.0, 44.0, 52.0, 47.0, 64.0, 59.0, 60.0, 71.0, 60.0, 60.0, 75.0, 48.0, 49.0, 49.0, 32.0, 31.0, 29.0, 13.0, 14.0, 12.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.93444061279297, -32.90512466430664, -31.875810623168945, -30.846494674682617, -29.817180633544922, -28.787864685058594, -27.758548736572266, -26.729232788085938, -25.699918746948242, -24.670602798461914, -23.64128875732422, -22.61197280883789, -21.582656860351562, -20.553342819213867, -19.52402687072754, -18.494712829589844, -17.465396881103516, -16.436080932617188, -15.406766891479492, -14.377450942993164, -13.348135948181152, -12.31882095336914, -11.289505004882812, -10.2601900100708, -9.230875015258789, -8.201560020446777, -7.172244548797607, -6.1429290771484375, -5.113614082336426, -4.084299087524414, -3.054983615875244, -2.025668144226074, -0.9963512420654297, 0.03296399116516113, 1.062279224395752, 2.0915944576263428, 3.1209096908569336, 4.150224685668945, 5.179540157318115, 6.208855628967285, 7.238170623779297, 8.267485618591309, 9.29680061340332, 10.326116561889648, 11.35543155670166, 12.384746551513672, 13.4140625, 14.443377494812012, 15.472692489624023, 16.50200843811035, 17.531322479248047, 18.560638427734375, 19.589954376220703, 20.6192684173584, 21.648584365844727, 22.677898406982422, 23.70721435546875, 24.736530303955078, 25.765844345092773, 26.7951602935791, 27.824474334716797, 28.853790283203125, 29.883106231689453, 30.91242218017578, 31.941736221313477]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 14.0, 23.0, 22.0, 31.0, 35.0, 51.0, 83.0, 97.0, 180.0, 256.0, 438.0, 655.0, 1090.0, 1907.0, 3866.0, 9089.0, 30905.0, 308164.0, 626346.0, 43643.0, 11583.0, 4628.0, 2183.0, 1223.0, 711.0, 465.0, 265.0, 179.0, 133.0, 84.0, 59.0, 42.0, 28.0, 21.0, 12.0, 15.0, 5.0, 3.0, 3.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0], "bins": [-20.953125, -20.388427734375, -19.82373046875, -19.259033203125, -18.6943359375, -18.129638671875, -17.56494140625, -17.000244140625, -16.435546875, -15.870849609375, -15.30615234375, -14.741455078125, -14.1767578125, -13.612060546875, -13.04736328125, -12.482666015625, -11.91796875, -11.353271484375, -10.78857421875, -10.223876953125, -9.6591796875, -9.094482421875, -8.52978515625, -7.965087890625, -7.400390625, -6.835693359375, -6.27099609375, -5.706298828125, -5.1416015625, -4.576904296875, -4.01220703125, -3.447509765625, -2.8828125, -2.318115234375, -1.75341796875, -1.188720703125, -0.6240234375, -0.059326171875, 0.50537109375, 1.070068359375, 1.634765625, 2.199462890625, 2.76416015625, 3.328857421875, 3.8935546875, 4.458251953125, 5.02294921875, 5.587646484375, 6.15234375, 6.717041015625, 7.28173828125, 7.846435546875, 8.4111328125, 8.975830078125, 9.54052734375, 10.105224609375, 10.669921875, 11.234619140625, 11.79931640625, 12.364013671875, 12.9287109375, 13.493408203125, 14.05810546875, 14.622802734375, 15.1875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 10.0, 17.0, 28.0, 27.0, 59.0, 110.0, 154.0, 189.0, 151.0, 100.0, 42.0, 36.0, 17.0, 10.0, 4.0, 6.0, 6.0, 5.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.625, -1.561187744140625, -1.49737548828125, -1.433563232421875, -1.3697509765625, -1.305938720703125, -1.24212646484375, -1.178314208984375, -1.114501953125, -1.050689697265625, -0.98687744140625, -0.923065185546875, -0.8592529296875, -0.795440673828125, -0.73162841796875, -0.667816162109375, -0.60400390625, -0.540191650390625, -0.47637939453125, -0.412567138671875, -0.3487548828125, -0.284942626953125, -0.22113037109375, -0.157318115234375, -0.093505859375, -0.029693603515625, 0.03411865234375, 0.097930908203125, 0.1617431640625, 0.225555419921875, 0.28936767578125, 0.353179931640625, 0.4169921875, 0.480804443359375, 0.54461669921875, 0.608428955078125, 0.6722412109375, 0.736053466796875, 0.79986572265625, 0.863677978515625, 0.927490234375, 0.991302490234375, 1.05511474609375, 1.118927001953125, 1.1827392578125, 1.246551513671875, 1.31036376953125, 1.374176025390625, 1.43798828125, 1.501800537109375, 1.56561279296875, 1.629425048828125, 1.6932373046875, 1.757049560546875, 1.82086181640625, 1.884674072265625, 1.948486328125, 2.012298583984375, 2.07611083984375, 2.139923095703125, 2.2037353515625, 2.267547607421875, 2.33135986328125, 2.395172119140625, 2.458984375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 14.0, 12.0, 12.0, 16.0, 29.0, 29.0, 65.0, 115.0, 177.0, 334.0, 611.0, 1330.0, 3862.0, 16955.0, 259925.0, 728744.0, 27584.0, 5350.0, 1740.0, 789.0, 347.0, 184.0, 106.0, 62.0, 43.0, 24.0, 23.0, 14.0, 15.0, 7.0, 4.0, 10.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.234375, -28.263916015625, -27.29345703125, -26.322998046875, -25.3525390625, -24.382080078125, -23.41162109375, -22.441162109375, -21.470703125, -20.500244140625, -19.52978515625, -18.559326171875, -17.5888671875, -16.618408203125, -15.64794921875, -14.677490234375, -13.70703125, -12.736572265625, -11.76611328125, -10.795654296875, -9.8251953125, -8.854736328125, -7.88427734375, -6.913818359375, -5.943359375, -4.972900390625, -4.00244140625, -3.031982421875, -2.0615234375, -1.091064453125, -0.12060546875, 0.849853515625, 1.8203125, 2.790771484375, 3.76123046875, 4.731689453125, 5.7021484375, 6.672607421875, 7.64306640625, 8.613525390625, 9.583984375, 10.554443359375, 11.52490234375, 12.495361328125, 13.4658203125, 14.436279296875, 15.40673828125, 16.377197265625, 17.34765625, 18.318115234375, 19.28857421875, 20.259033203125, 21.2294921875, 22.199951171875, 23.17041015625, 24.140869140625, 25.111328125, 26.081787109375, 27.05224609375, 28.022705078125, 28.9931640625, 29.963623046875, 30.93408203125, 31.904541015625, 32.875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 6.0, 15.0, 8.0, 13.0, 11.0, 19.0, 16.0, 24.0, 23.0, 25.0, 27.0, 30.0, 45.0, 35.0, 50.0, 53.0, 57.0, 52.0, 37.0, 41.0, 42.0, 45.0, 29.0, 33.0, 35.0, 41.0, 19.0, 24.0, 32.0, 20.0, 13.0, 13.0, 13.0, 10.0, 8.0, 10.0, 2.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-8.7109375, -8.460205078125, -8.20947265625, -7.958740234375, -7.7080078125, -7.457275390625, -7.20654296875, -6.955810546875, -6.705078125, -6.454345703125, -6.20361328125, -5.952880859375, -5.7021484375, -5.451416015625, -5.20068359375, -4.949951171875, -4.69921875, -4.448486328125, -4.19775390625, -3.947021484375, -3.6962890625, -3.445556640625, -3.19482421875, -2.944091796875, -2.693359375, -2.442626953125, -2.19189453125, -1.941162109375, -1.6904296875, -1.439697265625, -1.18896484375, -0.938232421875, -0.6875, -0.436767578125, -0.18603515625, 0.064697265625, 0.3154296875, 0.566162109375, 0.81689453125, 1.067626953125, 1.318359375, 1.569091796875, 1.81982421875, 2.070556640625, 2.3212890625, 2.572021484375, 2.82275390625, 3.073486328125, 3.32421875, 3.574951171875, 3.82568359375, 4.076416015625, 4.3271484375, 4.577880859375, 4.82861328125, 5.079345703125, 5.330078125, 5.580810546875, 5.83154296875, 6.082275390625, 6.3330078125, 6.583740234375, 6.83447265625, 7.085205078125, 7.3359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 9.0, 11.0, 8.0, 22.0, 37.0, 56.0, 68.0, 132.0, 239.0, 448.0, 873.0, 2005.0, 5437.0, 25589.0, 900975.0, 97157.0, 9815.0, 3060.0, 1264.0, 621.0, 279.0, 163.0, 95.0, 54.0, 45.0, 30.0, 14.0, 18.0, 11.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-48.71875, -47.39208984375, -46.0654296875, -44.73876953125, -43.412109375, -42.08544921875, -40.7587890625, -39.43212890625, -38.10546875, -36.77880859375, -35.4521484375, -34.12548828125, -32.798828125, -31.47216796875, -30.1455078125, -28.81884765625, -27.4921875, -26.16552734375, -24.8388671875, -23.51220703125, -22.185546875, -20.85888671875, -19.5322265625, -18.20556640625, -16.87890625, -15.55224609375, -14.2255859375, -12.89892578125, -11.572265625, -10.24560546875, -8.9189453125, -7.59228515625, -6.265625, -4.93896484375, -3.6123046875, -2.28564453125, -0.958984375, 0.36767578125, 1.6943359375, 3.02099609375, 4.34765625, 5.67431640625, 7.0009765625, 8.32763671875, 9.654296875, 10.98095703125, 12.3076171875, 13.63427734375, 14.9609375, 16.28759765625, 17.6142578125, 18.94091796875, 20.267578125, 21.59423828125, 22.9208984375, 24.24755859375, 25.57421875, 26.90087890625, 28.2275390625, 29.55419921875, 30.880859375, 32.20751953125, 33.5341796875, 34.86083984375, 36.1875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 5.0, 12.0, 20.0, 32.0, 31.0, 71.0, 118.0, 152.0, 170.0, 142.0, 86.0, 56.0, 29.0, 17.0, 16.0, 13.0, 12.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00063323974609375, -0.0006124526262283325, -0.000591665506362915, -0.0005708783864974976, -0.0005500912666320801, -0.0005293041467666626, -0.0005085170269012451, -0.00048772990703582764, -0.00046694278717041016, -0.0004461556673049927, -0.0004253685474395752, -0.0004045814275741577, -0.00038379430770874023, -0.00036300718784332275, -0.0003422200679779053, -0.0003214329481124878, -0.0003006458282470703, -0.00027985870838165283, -0.00025907158851623535, -0.00023828446865081787, -0.0002174973487854004, -0.0001967102289199829, -0.00017592310905456543, -0.00015513598918914795, -0.00013434886932373047, -0.00011356174945831299, -9.277462959289551e-05, -7.198750972747803e-05, -5.120038986206055e-05, -3.0413269996643066e-05, -9.626150131225586e-06, 1.1160969734191895e-05, 3.1948089599609375e-05, 5.2735209465026855e-05, 7.352232933044434e-05, 9.430944919586182e-05, 0.0001150965690612793, 0.00013588368892669678, 0.00015667080879211426, 0.00017745792865753174, 0.00019824504852294922, 0.0002190321683883667, 0.00023981928825378418, 0.00026060640811920166, 0.00028139352798461914, 0.0003021806478500366, 0.0003229677677154541, 0.0003437548875808716, 0.00036454200744628906, 0.00038532912731170654, 0.000406116247177124, 0.0004269033670425415, 0.000447690486907959, 0.00046847760677337646, 0.0004892647266387939, 0.0005100518465042114, 0.0005308389663696289, 0.0005516260862350464, 0.0005724132061004639, 0.0005932003259658813, 0.0006139874458312988, 0.0006347745656967163, 0.0006555616855621338, 0.0006763488054275513, 0.0006971359252929688]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 5.0, 12.0, 8.0, 12.0, 15.0, 38.0, 45.0, 52.0, 99.0, 123.0, 229.0, 360.0, 559.0, 1052.0, 1891.0, 4148.0, 10936.0, 44394.0, 707188.0, 236999.0, 25997.0, 7635.0, 3179.0, 1515.0, 808.0, 473.0, 262.0, 180.0, 106.0, 68.0, 46.0, 46.0, 20.0, 11.0, 15.0, 5.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.25, -29.2998046875, -28.349609375, -27.3994140625, -26.44921875, -25.4990234375, -24.548828125, -23.5986328125, -22.6484375, -21.6982421875, -20.748046875, -19.7978515625, -18.84765625, -17.8974609375, -16.947265625, -15.9970703125, -15.046875, -14.0966796875, -13.146484375, -12.1962890625, -11.24609375, -10.2958984375, -9.345703125, -8.3955078125, -7.4453125, -6.4951171875, -5.544921875, -4.5947265625, -3.64453125, -2.6943359375, -1.744140625, -0.7939453125, 0.15625, 1.1064453125, 2.056640625, 3.0068359375, 3.95703125, 4.9072265625, 5.857421875, 6.8076171875, 7.7578125, 8.7080078125, 9.658203125, 10.6083984375, 11.55859375, 12.5087890625, 13.458984375, 14.4091796875, 15.359375, 16.3095703125, 17.259765625, 18.2099609375, 19.16015625, 20.1103515625, 21.060546875, 22.0107421875, 22.9609375, 23.9111328125, 24.861328125, 25.8115234375, 26.76171875, 27.7119140625, 28.662109375, 29.6123046875, 30.5625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 5.0, 13.0, 25.0, 41.0, 51.0, 74.0, 107.0, 175.0, 158.0, 111.0, 77.0, 59.0, 32.0, 22.0, 17.0, 9.0, 9.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.28125, -20.614501953125, -19.94775390625, -19.281005859375, -18.6142578125, -17.947509765625, -17.28076171875, -16.614013671875, -15.947265625, -15.280517578125, -14.61376953125, -13.947021484375, -13.2802734375, -12.613525390625, -11.94677734375, -11.280029296875, -10.61328125, -9.946533203125, -9.27978515625, -8.613037109375, -7.9462890625, -7.279541015625, -6.61279296875, -5.946044921875, -5.279296875, -4.612548828125, -3.94580078125, -3.279052734375, -2.6123046875, -1.945556640625, -1.27880859375, -0.612060546875, 0.0546875, 0.721435546875, 1.38818359375, 2.054931640625, 2.7216796875, 3.388427734375, 4.05517578125, 4.721923828125, 5.388671875, 6.055419921875, 6.72216796875, 7.388916015625, 8.0556640625, 8.722412109375, 9.38916015625, 10.055908203125, 10.72265625, 11.389404296875, 12.05615234375, 12.722900390625, 13.3896484375, 14.056396484375, 14.72314453125, 15.389892578125, 16.056640625, 16.723388671875, 17.39013671875, 18.056884765625, 18.7236328125, 19.390380859375, 20.05712890625, 20.723876953125, 21.390625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 7.0, 16.0, 27.0, 57.0, 158.0, 385.0, 190.0, 83.0, 31.0, 19.0, 10.0, 9.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-185.3048095703125, -179.0391082763672, -172.77340698242188, -166.50770568847656, -160.24200439453125, -153.97630310058594, -147.71060180664062, -141.44488525390625, -135.17919921875, -128.9134979248047, -122.64779663085938, -116.38209533691406, -110.11639404296875, -103.85069274902344, -97.5849838256836, -91.31928253173828, -85.05357360839844, -78.78787231445312, -72.52217102050781, -66.2564697265625, -59.99076461791992, -53.72506332397461, -47.45935821533203, -41.19365692138672, -34.927955627441406, -28.662254333496094, -22.39655113220215, -16.130847930908203, -9.86514663696289, -3.599445343017578, 2.666259765625, 8.931961059570312, 15.197662353515625, 21.463363647460938, 27.729066848754883, 33.99477005004883, 40.26047134399414, 46.52617263793945, 52.79187774658203, 59.057579040527344, 65.32328033447266, 71.58898162841797, 77.85468292236328, 84.12039184570312, 90.38609313964844, 96.65179443359375, 102.91749572753906, 109.18319702148438, 115.44889831542969, 121.714599609375, 127.98030090332031, 134.24600219726562, 140.51170349121094, 146.77740478515625, 153.04312133789062, 159.30880737304688, 165.57452392578125, 171.84022521972656, 178.10592651367188, 184.3716278076172, 190.6373291015625, 196.9030303955078, 203.16873168945312, 209.4344482421875, 215.70013427734375]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 1.0, 5.0, 1.0, 8.0, 8.0, 15.0, 19.0, 38.0, 40.0, 46.0, 78.0, 110.0, 97.0, 117.0, 106.0, 85.0, 64.0, 39.0, 31.0, 25.0, 15.0, 8.0, 5.0, 7.0, 4.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-128.6031036376953, -124.95463562011719, -121.30615997314453, -117.65768432617188, -114.00921630859375, -110.36074829101562, -106.71227264404297, -103.06379699707031, -99.41532897949219, -95.76686096191406, -92.1183853149414, -88.46990966796875, -84.82144165039062, -81.1729736328125, -77.52449798583984, -73.87602233886719, -70.22755432128906, -66.57908630371094, -62.93061065673828, -59.28213882446289, -55.6336669921875, -51.98519515991211, -48.33672332763672, -44.68825149536133, -41.03977966308594, -37.39130783081055, -33.742835998535156, -30.094364166259766, -26.445892333984375, -22.797420501708984, -19.148948669433594, -15.500476837158203, -11.852012634277344, -8.203540802001953, -4.5550689697265625, -0.9065971374511719, 2.7418746948242188, 6.390346527099609, 10.038818359375, 13.68729019165039, 17.33576202392578, 20.984233856201172, 24.632705688476562, 28.281177520751953, 31.929649353027344, 35.578121185302734, 39.226593017578125, 42.875064849853516, 46.523536682128906, 50.1720085144043, 53.82048034667969, 57.46895217895508, 61.11742401123047, 64.76589965820312, 68.41436767578125, 72.06283569335938, 75.71131134033203, 79.35978698730469, 83.00825500488281, 86.65672302246094, 90.3051986694336, 93.95367431640625, 97.60214233398438, 101.2506103515625, 104.89908599853516]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 6.0, 8.0, 21.0, 28.0, 38.0, 71.0, 100.0, 171.0, 282.0, 561.0, 1161.0, 2792.0, 8445.0, 36829.0, 1264008.0, 2825247.0, 38689.0, 9338.0, 3302.0, 1406.0, 758.0, 383.0, 264.0, 143.0, 79.0, 44.0, 40.0, 19.0, 18.0, 9.0, 11.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.03125, -39.78857421875, -38.5458984375, -37.30322265625, -36.060546875, -34.81787109375, -33.5751953125, -32.33251953125, -31.08984375, -29.84716796875, -28.6044921875, -27.36181640625, -26.119140625, -24.87646484375, -23.6337890625, -22.39111328125, -21.1484375, -19.90576171875, -18.6630859375, -17.42041015625, -16.177734375, -14.93505859375, -13.6923828125, -12.44970703125, -11.20703125, -9.96435546875, -8.7216796875, -7.47900390625, -6.236328125, -4.99365234375, -3.7509765625, -2.50830078125, -1.265625, -0.02294921875, 1.2197265625, 2.46240234375, 3.705078125, 4.94775390625, 6.1904296875, 7.43310546875, 8.67578125, 9.91845703125, 11.1611328125, 12.40380859375, 13.646484375, 14.88916015625, 16.1318359375, 17.37451171875, 18.6171875, 19.85986328125, 21.1025390625, 22.34521484375, 23.587890625, 24.83056640625, 26.0732421875, 27.31591796875, 28.55859375, 29.80126953125, 31.0439453125, 32.28662109375, 33.529296875, 34.77197265625, 36.0146484375, 37.25732421875, 38.5]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 21.0, 21.0, 25.0, 51.0, 51.0, 85.0, 109.0, 111.0, 126.0, 100.0, 85.0, 65.0, 47.0, 22.0, 11.0, 12.0, 12.0, 4.0, 5.0, 3.0, 4.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4296875, -1.382110595703125, -1.33453369140625, -1.286956787109375, -1.2393798828125, -1.191802978515625, -1.14422607421875, -1.096649169921875, -1.049072265625, -1.001495361328125, -0.95391845703125, -0.906341552734375, -0.8587646484375, -0.811187744140625, -0.76361083984375, -0.716033935546875, -0.66845703125, -0.620880126953125, -0.57330322265625, -0.525726318359375, -0.4781494140625, -0.430572509765625, -0.38299560546875, -0.335418701171875, -0.287841796875, -0.240264892578125, -0.19268798828125, -0.145111083984375, -0.0975341796875, -0.049957275390625, -0.00238037109375, 0.045196533203125, 0.0927734375, 0.140350341796875, 0.18792724609375, 0.235504150390625, 0.2830810546875, 0.330657958984375, 0.37823486328125, 0.425811767578125, 0.473388671875, 0.520965576171875, 0.56854248046875, 0.616119384765625, 0.6636962890625, 0.711273193359375, 0.75885009765625, 0.806427001953125, 0.85400390625, 0.901580810546875, 0.94915771484375, 0.996734619140625, 1.0443115234375, 1.091888427734375, 1.13946533203125, 1.187042236328125, 1.234619140625, 1.282196044921875, 1.32977294921875, 1.377349853515625, 1.4249267578125, 1.472503662109375, 1.52008056640625, 1.567657470703125, 1.615234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 2.0, 10.0, 10.0, 7.0, 22.0, 21.0, 40.0, 63.0, 99.0, 139.0, 337.0, 590.0, 1428.0, 3528.0, 12461.0, 76786.0, 3857326.0, 211594.0, 21121.0, 5286.0, 1809.0, 771.0, 330.0, 194.0, 101.0, 48.0, 43.0, 37.0, 15.0, 14.0, 7.0, 12.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5625, -37.2177734375, -35.873046875, -34.5283203125, -33.18359375, -31.8388671875, -30.494140625, -29.1494140625, -27.8046875, -26.4599609375, -25.115234375, -23.7705078125, -22.42578125, -21.0810546875, -19.736328125, -18.3916015625, -17.046875, -15.7021484375, -14.357421875, -13.0126953125, -11.66796875, -10.3232421875, -8.978515625, -7.6337890625, -6.2890625, -4.9443359375, -3.599609375, -2.2548828125, -0.91015625, 0.4345703125, 1.779296875, 3.1240234375, 4.46875, 5.8134765625, 7.158203125, 8.5029296875, 9.84765625, 11.1923828125, 12.537109375, 13.8818359375, 15.2265625, 16.5712890625, 17.916015625, 19.2607421875, 20.60546875, 21.9501953125, 23.294921875, 24.6396484375, 25.984375, 27.3291015625, 28.673828125, 30.0185546875, 31.36328125, 32.7080078125, 34.052734375, 35.3974609375, 36.7421875, 38.0869140625, 39.431640625, 40.7763671875, 42.12109375, 43.4658203125, 44.810546875, 46.1552734375, 47.5]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 10.0, 5.0, 9.0, 13.0, 12.0, 20.0, 22.0, 41.0, 44.0, 64.0, 87.0, 125.0, 264.0, 1963.0, 678.0, 250.0, 131.0, 103.0, 55.0, 42.0, 35.0, 21.0, 12.0, 12.0, 14.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.669921875, -3.575225830078125, -3.48052978515625, -3.385833740234375, -3.2911376953125, -3.196441650390625, -3.10174560546875, -3.007049560546875, -2.912353515625, -2.817657470703125, -2.72296142578125, -2.628265380859375, -2.5335693359375, -2.438873291015625, -2.34417724609375, -2.249481201171875, -2.15478515625, -2.060089111328125, -1.96539306640625, -1.870697021484375, -1.7760009765625, -1.681304931640625, -1.58660888671875, -1.491912841796875, -1.397216796875, -1.302520751953125, -1.20782470703125, -1.113128662109375, -1.0184326171875, -0.923736572265625, -0.82904052734375, -0.734344482421875, -0.6396484375, -0.544952392578125, -0.45025634765625, -0.355560302734375, -0.2608642578125, -0.166168212890625, -0.07147216796875, 0.023223876953125, 0.117919921875, 0.212615966796875, 0.30731201171875, 0.402008056640625, 0.4967041015625, 0.591400146484375, 0.68609619140625, 0.780792236328125, 0.87548828125, 0.970184326171875, 1.06488037109375, 1.159576416015625, 1.2542724609375, 1.348968505859375, 1.44366455078125, 1.538360595703125, 1.633056640625, 1.727752685546875, 1.82244873046875, 1.917144775390625, 2.0118408203125, 2.106536865234375, 2.20123291015625, 2.295928955078125, 2.390625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 11.0, 13.0, 14.0, 24.0, 39.0, 60.0, 98.0, 146.0, 197.0, 153.0, 87.0, 45.0, 30.0, 34.0, 14.0, 4.0, 6.0, 0.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.742218017578125, -27.732643127441406, -26.72307014465332, -25.713497161865234, -24.703922271728516, -23.694347381591797, -22.68477439880371, -21.675201416015625, -20.665626525878906, -19.656051635742188, -18.6464786529541, -17.636905670166016, -16.627330780029297, -15.617756843566895, -14.608182907104492, -13.59860897064209, -12.589035034179688, -11.579461097717285, -10.569887161254883, -9.56031322479248, -8.550739288330078, -7.541165351867676, -6.531591415405273, -5.522017478942871, -4.512443542480469, -3.5028696060180664, -2.493295669555664, -1.4837217330932617, -0.4741477966308594, 0.535426139831543, 1.5450000762939453, 2.5545740127563477, 3.56414794921875, 4.573721885681152, 5.583295822143555, 6.592869758605957, 7.602443695068359, 8.612017631530762, 9.621591567993164, 10.631165504455566, 11.640739440917969, 12.650313377380371, 13.659887313842773, 14.669461250305176, 15.679035186767578, 16.688610076904297, 17.698183059692383, 18.70775604248047, 19.717330932617188, 20.726905822753906, 21.736478805541992, 22.746051788330078, 23.755626678466797, 24.765201568603516, 25.7747745513916, 26.784347534179688, 27.793922424316406, 28.803497314453125, 29.81307029724121, 30.822643280029297, 31.832218170166016, 32.841793060302734, 33.85136413574219, 34.860939025878906, 35.870513916015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 7.0, 5.0, 9.0, 13.0, 25.0, 16.0, 26.0, 30.0, 61.0, 53.0, 60.0, 74.0, 67.0, 67.0, 62.0, 84.0, 58.0, 54.0, 54.0, 37.0, 39.0, 22.0, 16.0, 7.0, 14.0, 10.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.961162567138672, -17.402986526489258, -16.844812393188477, -16.286636352539062, -15.728461265563965, -15.170286178588867, -14.612110137939453, -14.053935050964355, -13.495759963989258, -12.93758487701416, -12.379408836364746, -11.821233749389648, -11.26305866241455, -10.704883575439453, -10.146707534790039, -9.588532447814941, -9.030356407165527, -8.47218132019043, -7.914005756378174, -7.355830192565918, -6.79765510559082, -6.2394795417785645, -5.681303977966309, -5.123128890991211, -4.564953327178955, -4.006777763366699, -3.4486026763916016, -2.8904271125793457, -2.332251787185669, -1.7740764617919922, -1.2159008979797363, -0.6577255725860596, -0.09955024719238281, 0.4586251378059387, 1.0168005228042603, 1.5749759674072266, 2.1331512928009033, 2.69132661819458, 3.249502182006836, 3.8076775074005127, 4.3658528327941895, 4.924028396606445, 5.482203483581543, 6.040379047393799, 6.598554611206055, 7.156729698181152, 7.714905261993408, 8.273080825805664, 8.831255912780762, 9.38943099975586, 9.947607040405273, 10.505782127380371, 11.063957214355469, 11.622133255004883, 12.18030834197998, 12.738483428955078, 13.296659469604492, 13.85483455657959, 14.413010597229004, 14.971185684204102, 15.5293607711792, 16.087535858154297, 16.64571189880371, 17.203887939453125, 17.762062072753906]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 1.0, 10.0, 6.0, 9.0, 13.0, 12.0, 30.0, 53.0, 52.0, 98.0, 175.0, 257.0, 401.0, 789.0, 1498.0, 3100.0, 7621.0, 24071.0, 173822.0, 755664.0, 57719.0, 13514.0, 4934.0, 2076.0, 1143.0, 592.0, 358.0, 198.0, 113.0, 66.0, 58.0, 26.0, 28.0, 19.0, 13.0, 6.0, 4.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.03125, -37.955078125, -36.87890625, -35.802734375, -34.7265625, -33.650390625, -32.57421875, -31.498046875, -30.421875, -29.345703125, -28.26953125, -27.193359375, -26.1171875, -25.041015625, -23.96484375, -22.888671875, -21.8125, -20.736328125, -19.66015625, -18.583984375, -17.5078125, -16.431640625, -15.35546875, -14.279296875, -13.203125, -12.126953125, -11.05078125, -9.974609375, -8.8984375, -7.822265625, -6.74609375, -5.669921875, -4.59375, -3.517578125, -2.44140625, -1.365234375, -0.2890625, 0.787109375, 1.86328125, 2.939453125, 4.015625, 5.091796875, 6.16796875, 7.244140625, 8.3203125, 9.396484375, 10.47265625, 11.548828125, 12.625, 13.701171875, 14.77734375, 15.853515625, 16.9296875, 18.005859375, 19.08203125, 20.158203125, 21.234375, 22.310546875, 23.38671875, 24.462890625, 25.5390625, 26.615234375, 27.69140625, 28.767578125, 29.84375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 10.0, 3.0, 3.0, 8.0, 11.0, 13.0, 20.0, 31.0, 37.0, 41.0, 53.0, 74.0, 87.0, 108.0, 78.0, 80.0, 79.0, 52.0, 45.0, 40.0, 35.0, 26.0, 19.0, 11.0, 9.0, 5.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0662841796875, -1.024169921875, -0.9820556640625, -0.93994140625, -0.8978271484375, -0.855712890625, -0.8135986328125, -0.771484375, -0.7293701171875, -0.687255859375, -0.6451416015625, -0.60302734375, -0.5609130859375, -0.518798828125, -0.4766845703125, -0.4345703125, -0.3924560546875, -0.350341796875, -0.3082275390625, -0.26611328125, -0.2239990234375, -0.181884765625, -0.1397705078125, -0.09765625, -0.0555419921875, -0.013427734375, 0.0286865234375, 0.07080078125, 0.1129150390625, 0.155029296875, 0.1971435546875, 0.2392578125, 0.2813720703125, 0.323486328125, 0.3656005859375, 0.40771484375, 0.4498291015625, 0.491943359375, 0.5340576171875, 0.576171875, 0.6182861328125, 0.660400390625, 0.7025146484375, 0.74462890625, 0.7867431640625, 0.828857421875, 0.8709716796875, 0.9130859375, 0.9552001953125, 0.997314453125, 1.0394287109375, 1.08154296875, 1.1236572265625, 1.165771484375, 1.2078857421875, 1.25, 1.2921142578125, 1.334228515625, 1.3763427734375, 1.41845703125, 1.4605712890625, 1.502685546875, 1.5447998046875, 1.5869140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 11.0, 6.0, 3.0, 10.0, 12.0, 18.0, 17.0, 33.0, 130.0, 1435.0, 795197.0, 250383.0, 1063.0, 103.0, 31.0, 20.0, 11.0, 10.0, 9.0, 6.0, 8.0, 7.0, 3.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.125, -87.8642578125, -84.603515625, -81.3427734375, -78.08203125, -74.8212890625, -71.560546875, -68.2998046875, -65.0390625, -61.7783203125, -58.517578125, -55.2568359375, -51.99609375, -48.7353515625, -45.474609375, -42.2138671875, -38.953125, -35.6923828125, -32.431640625, -29.1708984375, -25.91015625, -22.6494140625, -19.388671875, -16.1279296875, -12.8671875, -9.6064453125, -6.345703125, -3.0849609375, 0.17578125, 3.4365234375, 6.697265625, 9.9580078125, 13.21875, 16.4794921875, 19.740234375, 23.0009765625, 26.26171875, 29.5224609375, 32.783203125, 36.0439453125, 39.3046875, 42.5654296875, 45.826171875, 49.0869140625, 52.34765625, 55.6083984375, 58.869140625, 62.1298828125, 65.390625, 68.6513671875, 71.912109375, 75.1728515625, 78.43359375, 81.6943359375, 84.955078125, 88.2158203125, 91.4765625, 94.7373046875, 97.998046875, 101.2587890625, 104.51953125, 107.7802734375, 111.041015625, 114.3017578125, 117.5625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 5.0, 1.0, 8.0, 15.0, 11.0, 12.0, 20.0, 22.0, 15.0, 23.0, 26.0, 41.0, 49.0, 32.0, 42.0, 39.0, 45.0, 55.0, 46.0, 51.0, 52.0, 49.0, 46.0, 37.0, 34.0, 40.0, 34.0, 28.0, 27.0, 11.0, 12.0, 14.0, 7.0, 10.0, 9.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.5703125, -5.39788818359375, -5.2254638671875, -5.05303955078125, -4.880615234375, -4.70819091796875, -4.5357666015625, -4.36334228515625, -4.19091796875, -4.01849365234375, -3.8460693359375, -3.67364501953125, -3.501220703125, -3.32879638671875, -3.1563720703125, -2.98394775390625, -2.8115234375, -2.63909912109375, -2.4666748046875, -2.29425048828125, -2.121826171875, -1.94940185546875, -1.7769775390625, -1.60455322265625, -1.43212890625, -1.25970458984375, -1.0872802734375, -0.91485595703125, -0.742431640625, -0.57000732421875, -0.3975830078125, -0.22515869140625, -0.052734375, 0.11968994140625, 0.2921142578125, 0.46453857421875, 0.636962890625, 0.80938720703125, 0.9818115234375, 1.15423583984375, 1.32666015625, 1.49908447265625, 1.6715087890625, 1.84393310546875, 2.016357421875, 2.18878173828125, 2.3612060546875, 2.53363037109375, 2.7060546875, 2.87847900390625, 3.0509033203125, 3.22332763671875, 3.395751953125, 3.56817626953125, 3.7406005859375, 3.91302490234375, 4.08544921875, 4.25787353515625, 4.4302978515625, 4.60272216796875, 4.775146484375, 4.94757080078125, 5.1199951171875, 5.29241943359375, 5.46484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 4.0, 6.0, 5.0, 9.0, 7.0, 5.0, 22.0, 15.0, 28.0, 116.0, 568.0, 7905.0, 1030792.0, 8253.0, 545.0, 133.0, 45.0, 22.0, 16.0, 7.0, 7.0, 2.0, 5.0, 5.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.75, -160.31640625, -154.8828125, -149.44921875, -144.015625, -138.58203125, -133.1484375, -127.71484375, -122.28125, -116.84765625, -111.4140625, -105.98046875, -100.546875, -95.11328125, -89.6796875, -84.24609375, -78.8125, -73.37890625, -67.9453125, -62.51171875, -57.078125, -51.64453125, -46.2109375, -40.77734375, -35.34375, -29.91015625, -24.4765625, -19.04296875, -13.609375, -8.17578125, -2.7421875, 2.69140625, 8.125, 13.55859375, 18.9921875, 24.42578125, 29.859375, 35.29296875, 40.7265625, 46.16015625, 51.59375, 57.02734375, 62.4609375, 67.89453125, 73.328125, 78.76171875, 84.1953125, 89.62890625, 95.0625, 100.49609375, 105.9296875, 111.36328125, 116.796875, 122.23046875, 127.6640625, 133.09765625, 138.53125, 143.96484375, 149.3984375, 154.83203125, 160.265625, 165.69921875, 171.1328125, 176.56640625, 182.0]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 10.0, 13.0, 9.0, 17.0, 22.0, 21.0, 54.0, 83.0, 158.0, 174.0, 165.0, 97.0, 55.0, 26.0, 20.0, 10.0, 11.0, 7.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001461029052734375, -0.0014147162437438965, -0.001368403434753418, -0.0013220906257629395, -0.001275777816772461, -0.0012294650077819824, -0.001183152198791504, -0.0011368393898010254, -0.0010905265808105469, -0.0010442137718200684, -0.0009979009628295898, -0.0009515881538391113, -0.0009052753448486328, -0.0008589625358581543, -0.0008126497268676758, -0.0007663369178771973, -0.0007200241088867188, -0.0006737112998962402, -0.0006273984909057617, -0.0005810856819152832, -0.0005347728729248047, -0.0004884600639343262, -0.00044214725494384766, -0.00039583444595336914, -0.0003495216369628906, -0.0003032088279724121, -0.0002568960189819336, -0.00021058320999145508, -0.00016427040100097656, -0.00011795759201049805, -7.164478302001953e-05, -2.5331974029541016e-05, 2.09808349609375e-05, 6.729364395141602e-05, 0.00011360645294189453, 0.00015991926193237305, 0.00020623207092285156, 0.0002525448799133301, 0.0002988576889038086, 0.0003451704978942871, 0.0003914833068847656, 0.00043779611587524414, 0.00048410892486572266, 0.0005304217338562012, 0.0005767345428466797, 0.0006230473518371582, 0.0006693601608276367, 0.0007156729698181152, 0.0007619857788085938, 0.0008082985877990723, 0.0008546113967895508, 0.0009009242057800293, 0.0009472370147705078, 0.0009935498237609863, 0.0010398626327514648, 0.0010861754417419434, 0.0011324882507324219, 0.0011788010597229004, 0.001225113868713379, 0.0012714266777038574, 0.001317739486694336, 0.0013640522956848145, 0.001410365104675293, 0.0014566779136657715, 0.00150299072265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 18.0, 21.0, 29.0, 41.0, 52.0, 83.0, 105.0, 173.0, 286.0, 459.0, 745.0, 1184.0, 2219.0, 4090.0, 9661.0, 31200.0, 458747.0, 487508.0, 32027.0, 10050.0, 4288.0, 2235.0, 1210.0, 734.0, 479.0, 292.0, 179.0, 133.0, 85.0, 66.0, 52.0, 26.0, 22.0, 13.0, 9.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-51.125, -49.66455078125, -48.2041015625, -46.74365234375, -45.283203125, -43.82275390625, -42.3623046875, -40.90185546875, -39.44140625, -37.98095703125, -36.5205078125, -35.06005859375, -33.599609375, -32.13916015625, -30.6787109375, -29.21826171875, -27.7578125, -26.29736328125, -24.8369140625, -23.37646484375, -21.916015625, -20.45556640625, -18.9951171875, -17.53466796875, -16.07421875, -14.61376953125, -13.1533203125, -11.69287109375, -10.232421875, -8.77197265625, -7.3115234375, -5.85107421875, -4.390625, -2.93017578125, -1.4697265625, -0.00927734375, 1.451171875, 2.91162109375, 4.3720703125, 5.83251953125, 7.29296875, 8.75341796875, 10.2138671875, 11.67431640625, 13.134765625, 14.59521484375, 16.0556640625, 17.51611328125, 18.9765625, 20.43701171875, 21.8974609375, 23.35791015625, 24.818359375, 26.27880859375, 27.7392578125, 29.19970703125, 30.66015625, 32.12060546875, 33.5810546875, 35.04150390625, 36.501953125, 37.96240234375, 39.4228515625, 40.88330078125, 42.34375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 6.0, 8.0, 8.0, 13.0, 21.0, 24.0, 38.0, 80.0, 210.0, 265.0, 150.0, 54.0, 32.0, 20.0, 15.0, 12.0, 9.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.71875, -24.84033203125, -23.9619140625, -23.08349609375, -22.205078125, -21.32666015625, -20.4482421875, -19.56982421875, -18.69140625, -17.81298828125, -16.9345703125, -16.05615234375, -15.177734375, -14.29931640625, -13.4208984375, -12.54248046875, -11.6640625, -10.78564453125, -9.9072265625, -9.02880859375, -8.150390625, -7.27197265625, -6.3935546875, -5.51513671875, -4.63671875, -3.75830078125, -2.8798828125, -2.00146484375, -1.123046875, -0.24462890625, 0.6337890625, 1.51220703125, 2.390625, 3.26904296875, 4.1474609375, 5.02587890625, 5.904296875, 6.78271484375, 7.6611328125, 8.53955078125, 9.41796875, 10.29638671875, 11.1748046875, 12.05322265625, 12.931640625, 13.81005859375, 14.6884765625, 15.56689453125, 16.4453125, 17.32373046875, 18.2021484375, 19.08056640625, 19.958984375, 20.83740234375, 21.7158203125, 22.59423828125, 23.47265625, 24.35107421875, 25.2294921875, 26.10791015625, 26.986328125, 27.86474609375, 28.7431640625, 29.62158203125, 30.5]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 15.0, 27.0, 67.0, 133.0, 233.0, 256.0, 166.0, 61.0, 23.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.5373764038086, -71.24346923828125, -65.94956970214844, -60.655662536621094, -55.36176300048828, -50.06785583496094, -44.77395248413086, -39.48004913330078, -34.1861457824707, -28.892242431640625, -23.598339080810547, -18.304433822631836, -13.010530471801758, -7.71662712097168, -2.4227218627929688, 2.8711814880371094, 8.165084838867188, 13.458988189697266, 18.752891540527344, 24.046796798706055, 29.340700149536133, 34.634605407714844, 39.92850875854492, 45.222412109375, 50.51631546020508, 55.810218811035156, 61.104122161865234, 66.39802551269531, 71.69193267822266, 76.98583221435547, 82.27973937988281, 87.57363891601562, 92.86753845214844, 98.16144561767578, 103.4553451538086, 108.74925231933594, 114.04315185546875, 119.3370590209961, 124.63096618652344, 129.92486572265625, 135.21876525878906, 140.51266479492188, 145.80657958984375, 151.10047912597656, 156.39437866210938, 161.6882781982422, 166.98219299316406, 172.27609252929688, 177.57000732421875, 182.86390686035156, 188.15782165527344, 193.45172119140625, 198.74562072753906, 204.03952026367188, 209.33343505859375, 214.62733459472656, 219.92123413085938, 225.2151336669922, 230.50904846191406, 235.80294799804688, 241.0968475341797, 246.3907470703125, 251.68466186523438, 256.97857666015625, 262.2724609375]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 5.0, 4.0, 11.0, 9.0, 8.0, 19.0, 20.0, 19.0, 29.0, 34.0, 51.0, 46.0, 48.0, 73.0, 66.0, 72.0, 79.0, 72.0, 72.0, 53.0, 44.0, 44.0, 35.0, 23.0, 14.0, 14.0, 10.0, 4.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.68582534790039, -58.53425598144531, -56.382686614990234, -54.231117248535156, -52.07954406738281, -49.927974700927734, -47.776405334472656, -45.62483596801758, -43.4732666015625, -41.32169723510742, -39.170127868652344, -37.0185546875, -34.86698532104492, -32.715415954589844, -30.563846588134766, -28.412277221679688, -26.260704040527344, -24.109134674072266, -21.957563400268555, -19.805994033813477, -17.654422760009766, -15.502853393554688, -13.35128402709961, -11.199713706970215, -9.04814338684082, -6.896573066711426, -4.7450032234191895, -2.593433380126953, -0.4418630599975586, 1.709707260131836, 3.861276626586914, 6.012846946716309, 8.164421081542969, 10.315991401672363, 12.467561721801758, 14.619131088256836, 16.770702362060547, 18.922271728515625, 21.073841094970703, 23.22541046142578, 25.376981735229492, 27.52855110168457, 29.68012237548828, 31.83169174194336, 33.98326110839844, 36.13483428955078, 38.286399841308594, 40.43797302246094, 42.589542388916016, 44.741111755371094, 46.89268112182617, 49.04425048828125, 51.195823669433594, 53.34739303588867, 55.49896240234375, 57.65053176879883, 59.802101135253906, 61.953670501708984, 64.10523986816406, 66.2568130493164, 68.40837860107422, 70.55995178222656, 72.71151733398438, 74.86309051513672, 77.01466369628906]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 9.0, 24.0, 49.0, 148.0, 381.0, 1582.0, 8097.0, 100302.0, 4026298.0, 49388.0, 5764.0, 1290.0, 444.0, 179.0, 104.0, 57.0, 31.0, 21.0, 19.0, 17.0, 12.0, 13.0, 14.0, 8.0, 10.0, 6.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.5, -64.9423828125, -62.384765625, -59.8271484375, -57.26953125, -54.7119140625, -52.154296875, -49.5966796875, -47.0390625, -44.4814453125, -41.923828125, -39.3662109375, -36.80859375, -34.2509765625, -31.693359375, -29.1357421875, -26.578125, -24.0205078125, -21.462890625, -18.9052734375, -16.34765625, -13.7900390625, -11.232421875, -8.6748046875, -6.1171875, -3.5595703125, -1.001953125, 1.5556640625, 4.11328125, 6.6708984375, 9.228515625, 11.7861328125, 14.34375, 16.9013671875, 19.458984375, 22.0166015625, 24.57421875, 27.1318359375, 29.689453125, 32.2470703125, 34.8046875, 37.3623046875, 39.919921875, 42.4775390625, 45.03515625, 47.5927734375, 50.150390625, 52.7080078125, 55.265625, 57.8232421875, 60.380859375, 62.9384765625, 65.49609375, 68.0537109375, 70.611328125, 73.1689453125, 75.7265625, 78.2841796875, 80.841796875, 83.3994140625, 85.95703125, 88.5146484375, 91.072265625, 93.6298828125, 96.1875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 10.0, 20.0, 24.0, 32.0, 46.0, 64.0, 86.0, 110.0, 104.0, 101.0, 99.0, 82.0, 60.0, 45.0, 37.0, 31.0, 18.0, 11.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0458984375, -0.9845733642578125, -0.923248291015625, -0.8619232177734375, -0.80059814453125, -0.7392730712890625, -0.677947998046875, -0.6166229248046875, -0.5552978515625, -0.4939727783203125, -0.432647705078125, -0.3713226318359375, -0.30999755859375, -0.2486724853515625, -0.187347412109375, -0.1260223388671875, -0.064697265625, -0.0033721923828125, 0.057952880859375, 0.1192779541015625, 0.18060302734375, 0.2419281005859375, 0.303253173828125, 0.3645782470703125, 0.4259033203125, 0.4872283935546875, 0.548553466796875, 0.6098785400390625, 0.67120361328125, 0.7325286865234375, 0.793853759765625, 0.8551788330078125, 0.91650390625, 0.9778289794921875, 1.039154052734375, 1.1004791259765625, 1.16180419921875, 1.2231292724609375, 1.284454345703125, 1.3457794189453125, 1.4071044921875, 1.4684295654296875, 1.529754638671875, 1.5910797119140625, 1.65240478515625, 1.7137298583984375, 1.775054931640625, 1.8363800048828125, 1.897705078125, 1.9590301513671875, 2.020355224609375, 2.0816802978515625, 2.14300537109375, 2.2043304443359375, 2.265655517578125, 2.3269805908203125, 2.3883056640625, 2.4496307373046875, 2.510955810546875, 2.5722808837890625, 2.63360595703125, 2.6949310302734375, 2.756256103515625, 2.8175811767578125, 2.87890625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 10.0, 16.0, 24.0, 30.0, 48.0, 119.0, 418.0, 3610.0, 286276.0, 3894684.0, 8026.0, 643.0, 144.0, 62.0, 51.0, 27.0, 22.0, 16.0, 17.0, 6.0, 8.0, 8.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.9375, -94.45703125, -90.9765625, -87.49609375, -84.015625, -80.53515625, -77.0546875, -73.57421875, -70.09375, -66.61328125, -63.1328125, -59.65234375, -56.171875, -52.69140625, -49.2109375, -45.73046875, -42.25, -38.76953125, -35.2890625, -31.80859375, -28.328125, -24.84765625, -21.3671875, -17.88671875, -14.40625, -10.92578125, -7.4453125, -3.96484375, -0.484375, 2.99609375, 6.4765625, 9.95703125, 13.4375, 16.91796875, 20.3984375, 23.87890625, 27.359375, 30.83984375, 34.3203125, 37.80078125, 41.28125, 44.76171875, 48.2421875, 51.72265625, 55.203125, 58.68359375, 62.1640625, 65.64453125, 69.125, 72.60546875, 76.0859375, 79.56640625, 83.046875, 86.52734375, 90.0078125, 93.48828125, 96.96875, 100.44921875, 103.9296875, 107.41015625, 110.890625, 114.37109375, 117.8515625, 121.33203125, 124.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 1.0, 6.0, 5.0, 3.0, 4.0, 11.0, 8.0, 13.0, 23.0, 34.0, 29.0, 44.0, 41.0, 57.0, 98.0, 137.0, 239.0, 450.0, 1464.0, 575.0, 257.0, 166.0, 124.0, 67.0, 55.0, 40.0, 33.0, 22.0, 13.0, 9.0, 11.0, 7.0, 5.0, 2.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.71484375, -3.618499755859375, -3.52215576171875, -3.425811767578125, -3.3294677734375, -3.233123779296875, -3.13677978515625, -3.040435791015625, -2.944091796875, -2.847747802734375, -2.75140380859375, -2.655059814453125, -2.5587158203125, -2.462371826171875, -2.36602783203125, -2.269683837890625, -2.17333984375, -2.076995849609375, -1.98065185546875, -1.884307861328125, -1.7879638671875, -1.691619873046875, -1.59527587890625, -1.498931884765625, -1.402587890625, -1.306243896484375, -1.20989990234375, -1.113555908203125, -1.0172119140625, -0.920867919921875, -0.82452392578125, -0.728179931640625, -0.6318359375, -0.535491943359375, -0.43914794921875, -0.342803955078125, -0.2464599609375, -0.150115966796875, -0.05377197265625, 0.042572021484375, 0.138916015625, 0.235260009765625, 0.33160400390625, 0.427947998046875, 0.5242919921875, 0.620635986328125, 0.71697998046875, 0.813323974609375, 0.90966796875, 1.006011962890625, 1.10235595703125, 1.198699951171875, 1.2950439453125, 1.391387939453125, 1.48773193359375, 1.584075927734375, 1.680419921875, 1.776763916015625, 1.87310791015625, 1.969451904296875, 2.0657958984375, 2.162139892578125, 2.25848388671875, 2.354827880859375, 2.451171875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 9.0, 21.0, 45.0, 133.0, 251.0, 263.0, 170.0, 58.0, 29.0, 11.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.42173767089844, -67.59588623046875, -65.77003479003906, -63.944183349609375, -62.11832809448242, -60.292476654052734, -58.46662521362305, -56.64077377319336, -54.814918518066406, -52.98906707763672, -51.16321563720703, -49.337364196777344, -47.51150894165039, -45.6856575012207, -43.859806060791016, -42.03395462036133, -40.20810317993164, -38.38225173950195, -36.556400299072266, -34.73054504394531, -32.904693603515625, -31.078842163085938, -29.25299072265625, -27.427139282226562, -25.601285934448242, -23.775434494018555, -21.949581146240234, -20.123729705810547, -18.29787826538086, -16.47202491760254, -14.646173477172852, -12.820321083068848, -10.99447250366211, -9.168620109558105, -7.34276819229126, -5.516916275024414, -3.69106388092041, -1.8652114868164062, -0.03936004638671875, 1.7864923477172852, 3.612344741821289, 5.438197135925293, 7.264049053192139, 9.089900970458984, 10.915753364562988, 12.741605758666992, 14.56745719909668, 16.393310546875, 18.219161987304688, 20.045013427734375, 21.870866775512695, 23.696718215942383, 25.522571563720703, 27.34842300415039, 29.174274444580078, 31.000125885009766, 32.82598114013672, 34.651832580566406, 36.477684020996094, 38.30353546142578, 40.129390716552734, 41.95524215698242, 43.78109359741211, 45.6069450378418, 47.432796478271484]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 15.0, 20.0, 32.0, 45.0, 39.0, 68.0, 73.0, 72.0, 86.0, 78.0, 89.0, 62.0, 69.0, 63.0, 53.0, 38.0, 29.0, 20.0, 13.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.177270889282227, -30.451385498046875, -29.725500106811523, -28.999614715576172, -28.27372932434082, -27.54784393310547, -26.821956634521484, -26.096071243286133, -25.37018585205078, -24.64430046081543, -23.918415069580078, -23.192529678344727, -22.466644287109375, -21.74075698852539, -21.014873504638672, -20.288986206054688, -19.56310272216797, -18.837217330932617, -18.111331939697266, -17.385446548461914, -16.659561157226562, -15.933674812316895, -15.207789421081543, -14.481903076171875, -13.756017684936523, -13.030132293701172, -12.30424690246582, -11.578361511230469, -10.8524751663208, -10.12658977508545, -9.400704383850098, -8.67481803894043, -7.948931694030762, -7.22304630279541, -6.4971604347229, -5.771275043487549, -5.045389175415039, -4.3195037841796875, -3.593618392944336, -2.867732524871826, -2.1418471336364746, -1.415961503982544, -0.6900759935379028, 0.03580951690673828, 0.761695146560669, 1.4875807762145996, 2.213466167449951, 2.939352035522461, 3.6652374267578125, 4.391122817993164, 5.117008686065674, 5.842894077301025, 6.568779945373535, 7.294665336608887, 8.020550727844238, 8.746437072753906, 9.472322463989258, 10.19820785522461, 10.924093246459961, 11.649978637695312, 12.37586498260498, 13.101750373840332, 13.827635765075684, 14.553522109985352, 15.279406547546387]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 1.0, 4.0, 6.0, 5.0, 6.0, 7.0, 18.0, 11.0, 16.0, 30.0, 20.0, 18.0, 21.0, 37.0, 33.0, 61.0, 87.0, 354.0, 2656.0, 65647.0, 905795.0, 70187.0, 2781.0, 339.0, 102.0, 64.0, 37.0, 36.0, 29.0, 29.0, 23.0, 13.0, 18.0, 15.0, 11.0, 10.0, 6.0, 7.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.75, -41.30126953125, -39.8525390625, -38.40380859375, -36.955078125, -35.50634765625, -34.0576171875, -32.60888671875, -31.16015625, -29.71142578125, -28.2626953125, -26.81396484375, -25.365234375, -23.91650390625, -22.4677734375, -21.01904296875, -19.5703125, -18.12158203125, -16.6728515625, -15.22412109375, -13.775390625, -12.32666015625, -10.8779296875, -9.42919921875, -7.98046875, -6.53173828125, -5.0830078125, -3.63427734375, -2.185546875, -0.73681640625, 0.7119140625, 2.16064453125, 3.609375, 5.05810546875, 6.5068359375, 7.95556640625, 9.404296875, 10.85302734375, 12.3017578125, 13.75048828125, 15.19921875, 16.64794921875, 18.0966796875, 19.54541015625, 20.994140625, 22.44287109375, 23.8916015625, 25.34033203125, 26.7890625, 28.23779296875, 29.6865234375, 31.13525390625, 32.583984375, 34.03271484375, 35.4814453125, 36.93017578125, 38.37890625, 39.82763671875, 41.2763671875, 42.72509765625, 44.173828125, 45.62255859375, 47.0712890625, 48.52001953125, 49.96875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 3.0, 9.0, 17.0, 32.0, 50.0, 73.0, 96.0, 101.0, 110.0, 122.0, 106.0, 88.0, 68.0, 40.0, 31.0, 23.0, 13.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.205078125, -3.132232666015625, -3.05938720703125, -2.986541748046875, -2.9136962890625, -2.840850830078125, -2.76800537109375, -2.695159912109375, -2.622314453125, -2.549468994140625, -2.47662353515625, -2.403778076171875, -2.3309326171875, -2.258087158203125, -2.18524169921875, -2.112396240234375, -2.03955078125, -1.966705322265625, -1.89385986328125, -1.821014404296875, -1.7481689453125, -1.675323486328125, -1.60247802734375, -1.529632568359375, -1.456787109375, -1.383941650390625, -1.31109619140625, -1.238250732421875, -1.1654052734375, -1.092559814453125, -1.01971435546875, -0.946868896484375, -0.8740234375, -0.801177978515625, -0.72833251953125, -0.655487060546875, -0.5826416015625, -0.509796142578125, -0.43695068359375, -0.364105224609375, -0.291259765625, -0.218414306640625, -0.14556884765625, -0.072723388671875, 0.0001220703125, 0.072967529296875, 0.14581298828125, 0.218658447265625, 0.29150390625, 0.364349365234375, 0.43719482421875, 0.510040283203125, 0.5828857421875, 0.655731201171875, 0.72857666015625, 0.801422119140625, 0.874267578125, 0.947113037109375, 1.01995849609375, 1.092803955078125, 1.1656494140625, 1.238494873046875, 1.31134033203125, 1.384185791015625, 1.45703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 4.0, 5.0, 7.0, 18.0, 21.0, 39.0, 40.0, 58.0, 64.0, 110.0, 161.0, 226.0, 319.0, 488.0, 730.0, 1298.0, 2446.0, 4653.0, 10162.0, 23061.0, 57381.0, 148242.0, 322132.0, 280671.0, 116746.0, 44534.0, 18101.0, 7946.0, 3845.0, 1953.0, 1076.0, 631.0, 416.0, 263.0, 213.0, 138.0, 101.0, 66.0, 59.0, 30.0, 36.0, 16.0, 19.0, 12.0, 5.0, 2.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7890625, -11.39453125, -11.0, -10.60546875, -10.2109375, -9.81640625, -9.421875, -9.02734375, -8.6328125, -8.23828125, -7.84375, -7.44921875, -7.0546875, -6.66015625, -6.265625, -5.87109375, -5.4765625, -5.08203125, -4.6875, -4.29296875, -3.8984375, -3.50390625, -3.109375, -2.71484375, -2.3203125, -1.92578125, -1.53125, -1.13671875, -0.7421875, -0.34765625, 0.046875, 0.44140625, 0.8359375, 1.23046875, 1.625, 2.01953125, 2.4140625, 2.80859375, 3.203125, 3.59765625, 3.9921875, 4.38671875, 4.78125, 5.17578125, 5.5703125, 5.96484375, 6.359375, 6.75390625, 7.1484375, 7.54296875, 7.9375, 8.33203125, 8.7265625, 9.12109375, 9.515625, 9.91015625, 10.3046875, 10.69921875, 11.09375, 11.48828125, 11.8828125, 12.27734375, 12.671875, 13.06640625, 13.4609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 7.0, 8.0, 6.0, 10.0, 9.0, 17.0, 14.0, 19.0, 36.0, 27.0, 29.0, 35.0, 37.0, 37.0, 48.0, 45.0, 52.0, 46.0, 50.0, 62.0, 64.0, 43.0, 30.0, 35.0, 32.0, 35.0, 28.0, 22.0, 19.0, 12.0, 19.0, 13.0, 7.0, 9.0, 10.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.18304443359375, -7.9364013671875, -7.68975830078125, -7.443115234375, -7.19647216796875, -6.9498291015625, -6.70318603515625, -6.45654296875, -6.20989990234375, -5.9632568359375, -5.71661376953125, -5.469970703125, -5.22332763671875, -4.9766845703125, -4.73004150390625, -4.4833984375, -4.23675537109375, -3.9901123046875, -3.74346923828125, -3.496826171875, -3.25018310546875, -3.0035400390625, -2.75689697265625, -2.51025390625, -2.26361083984375, -2.0169677734375, -1.77032470703125, -1.523681640625, -1.27703857421875, -1.0303955078125, -0.78375244140625, -0.537109375, -0.29046630859375, -0.0438232421875, 0.20281982421875, 0.449462890625, 0.69610595703125, 0.9427490234375, 1.18939208984375, 1.43603515625, 1.68267822265625, 1.9293212890625, 2.17596435546875, 2.422607421875, 2.66925048828125, 2.9158935546875, 3.16253662109375, 3.4091796875, 3.65582275390625, 3.9024658203125, 4.14910888671875, 4.395751953125, 4.64239501953125, 4.8890380859375, 5.13568115234375, 5.38232421875, 5.62896728515625, 5.8756103515625, 6.12225341796875, 6.368896484375, 6.61553955078125, 6.8621826171875, 7.10882568359375, 7.35546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 6.0, 7.0, 20.0, 13.0, 12.0, 16.0, 34.0, 45.0, 74.0, 80.0, 117.0, 183.0, 229.0, 395.0, 589.0, 963.0, 1647.0, 2814.0, 5267.0, 11908.0, 33121.0, 181716.0, 635532.0, 125541.0, 26735.0, 10043.0, 4803.0, 2608.0, 1396.0, 881.0, 560.0, 395.0, 239.0, 165.0, 95.0, 86.0, 59.0, 36.0, 29.0, 31.0, 16.0, 21.0, 6.0, 4.0, 8.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.796875, -17.247802734375, -16.69873046875, -16.149658203125, -15.6005859375, -15.051513671875, -14.50244140625, -13.953369140625, -13.404296875, -12.855224609375, -12.30615234375, -11.757080078125, -11.2080078125, -10.658935546875, -10.10986328125, -9.560791015625, -9.01171875, -8.462646484375, -7.91357421875, -7.364501953125, -6.8154296875, -6.266357421875, -5.71728515625, -5.168212890625, -4.619140625, -4.070068359375, -3.52099609375, -2.971923828125, -2.4228515625, -1.873779296875, -1.32470703125, -0.775634765625, -0.2265625, 0.322509765625, 0.87158203125, 1.420654296875, 1.9697265625, 2.518798828125, 3.06787109375, 3.616943359375, 4.166015625, 4.715087890625, 5.26416015625, 5.813232421875, 6.3623046875, 6.911376953125, 7.46044921875, 8.009521484375, 8.55859375, 9.107666015625, 9.65673828125, 10.205810546875, 10.7548828125, 11.303955078125, 11.85302734375, 12.402099609375, 12.951171875, 13.500244140625, 14.04931640625, 14.598388671875, 15.1474609375, 15.696533203125, 16.24560546875, 16.794677734375, 17.34375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 7.0, 6.0, 5.0, 3.0, 17.0, 22.0, 27.0, 28.0, 34.0, 51.0, 64.0, 83.0, 92.0, 91.0, 88.0, 83.0, 72.0, 53.0, 30.0, 30.0, 22.0, 23.0, 17.0, 10.0, 7.0, 4.0, 6.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013093948364257812, -0.0012726932764053345, -0.0012359917163848877, -0.001199290156364441, -0.0011625885963439941, -0.0011258870363235474, -0.0010891854763031006, -0.0010524839162826538, -0.001015782356262207, -0.0009790807962417603, -0.0009423792362213135, -0.0009056776762008667, -0.0008689761161804199, -0.0008322745561599731, -0.0007955729961395264, -0.0007588714361190796, -0.0007221698760986328, -0.000685468316078186, -0.0006487667560577393, -0.0006120651960372925, -0.0005753636360168457, -0.0005386620759963989, -0.0005019605159759521, -0.00046525895595550537, -0.0004285573959350586, -0.0003918558359146118, -0.00035515427589416504, -0.00031845271587371826, -0.0002817511558532715, -0.0002450495958328247, -0.00020834803581237793, -0.00017164647579193115, -0.00013494491577148438, -9.82433557510376e-05, -6.154179573059082e-05, -2.4840235710144043e-05, 1.1861324310302734e-05, 4.856288433074951e-05, 8.526444435119629e-05, 0.00012196600437164307, 0.00015866756439208984, 0.00019536912441253662, 0.0002320706844329834, 0.0002687722444534302, 0.00030547380447387695, 0.00034217536449432373, 0.0003788769245147705, 0.0004155784845352173, 0.00045228004455566406, 0.0004889816045761108, 0.0005256831645965576, 0.0005623847246170044, 0.0005990862846374512, 0.000635787844657898, 0.0006724894046783447, 0.0007091909646987915, 0.0007458925247192383, 0.0007825940847396851, 0.0008192956447601318, 0.0008559972047805786, 0.0008926987648010254, 0.0009294003248214722, 0.0009661018848419189, 0.0010028034448623657, 0.0010395050048828125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 9.0, 12.0, 5.0, 8.0, 13.0, 15.0, 32.0, 34.0, 69.0, 98.0, 183.0, 295.0, 445.0, 928.0, 1891.0, 4246.0, 11531.0, 44238.0, 373000.0, 526183.0, 61349.0, 14262.0, 5124.0, 2135.0, 1025.0, 546.0, 318.0, 185.0, 112.0, 87.0, 44.0, 34.0, 29.0, 16.0, 14.0, 8.0, 8.0, 7.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.578125, -19.956298828125, -19.33447265625, -18.712646484375, -18.0908203125, -17.468994140625, -16.84716796875, -16.225341796875, -15.603515625, -14.981689453125, -14.35986328125, -13.738037109375, -13.1162109375, -12.494384765625, -11.87255859375, -11.250732421875, -10.62890625, -10.007080078125, -9.38525390625, -8.763427734375, -8.1416015625, -7.519775390625, -6.89794921875, -6.276123046875, -5.654296875, -5.032470703125, -4.41064453125, -3.788818359375, -3.1669921875, -2.545166015625, -1.92333984375, -1.301513671875, -0.6796875, -0.057861328125, 0.56396484375, 1.185791015625, 1.8076171875, 2.429443359375, 3.05126953125, 3.673095703125, 4.294921875, 4.916748046875, 5.53857421875, 6.160400390625, 6.7822265625, 7.404052734375, 8.02587890625, 8.647705078125, 9.26953125, 9.891357421875, 10.51318359375, 11.135009765625, 11.7568359375, 12.378662109375, 13.00048828125, 13.622314453125, 14.244140625, 14.865966796875, 15.48779296875, 16.109619140625, 16.7314453125, 17.353271484375, 17.97509765625, 18.596923828125, 19.21875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 4.0, 5.0, 6.0, 12.0, 16.0, 34.0, 46.0, 74.0, 135.0, 139.0, 148.0, 127.0, 80.0, 55.0, 44.0, 20.0, 15.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.609375, -12.26123046875, -11.9130859375, -11.56494140625, -11.216796875, -10.86865234375, -10.5205078125, -10.17236328125, -9.82421875, -9.47607421875, -9.1279296875, -8.77978515625, -8.431640625, -8.08349609375, -7.7353515625, -7.38720703125, -7.0390625, -6.69091796875, -6.3427734375, -5.99462890625, -5.646484375, -5.29833984375, -4.9501953125, -4.60205078125, -4.25390625, -3.90576171875, -3.5576171875, -3.20947265625, -2.861328125, -2.51318359375, -2.1650390625, -1.81689453125, -1.46875, -1.12060546875, -0.7724609375, -0.42431640625, -0.076171875, 0.27197265625, 0.6201171875, 0.96826171875, 1.31640625, 1.66455078125, 2.0126953125, 2.36083984375, 2.708984375, 3.05712890625, 3.4052734375, 3.75341796875, 4.1015625, 4.44970703125, 4.7978515625, 5.14599609375, 5.494140625, 5.84228515625, 6.1904296875, 6.53857421875, 6.88671875, 7.23486328125, 7.5830078125, 7.93115234375, 8.279296875, 8.62744140625, 8.9755859375, 9.32373046875, 9.671875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 16.0, 29.0, 33.0, 59.0, 89.0, 168.0, 171.0, 184.0, 108.0, 57.0, 38.0, 19.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.7835235595703, -147.545166015625, -143.3068084716797, -139.06845092773438, -134.83009338378906, -130.59173583984375, -126.35337829589844, -122.11502075195312, -117.87666320800781, -113.6383056640625, -109.39994812011719, -105.16159057617188, -100.92323303222656, -96.68487548828125, -92.44651794433594, -88.20816040039062, -83.96980285644531, -79.7314453125, -75.49308776855469, -71.25473022460938, -67.01637268066406, -62.77801513671875, -58.53965759277344, -54.301300048828125, -50.06294250488281, -45.8245849609375, -41.58622741699219, -37.347869873046875, -33.10951232910156, -28.87115478515625, -24.632797241210938, -20.394439697265625, -16.156082153320312, -11.917724609375, -7.6793670654296875, -3.441009521484375, 0.7973480224609375, 5.03570556640625, 9.274063110351562, 13.512420654296875, 17.750778198242188, 21.9891357421875, 26.227493286132812, 30.465850830078125, 34.70420837402344, 38.94256591796875, 43.18092346191406, 47.419281005859375, 51.65763854980469, 55.89599609375, 60.13435363769531, 64.37271118164062, 68.61106872558594, 72.84942626953125, 77.08778381347656, 81.32614135742188, 85.56449890136719, 89.8028564453125, 94.04121398925781, 98.27957153320312, 102.51792907714844, 106.75628662109375, 110.99464416503906, 115.23300170898438, 119.47135925292969]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 13.0, 16.0, 27.0, 27.0, 32.0, 37.0, 53.0, 64.0, 86.0, 75.0, 91.0, 73.0, 79.0, 63.0, 59.0, 54.0, 46.0, 29.0, 22.0, 13.0, 13.0, 10.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.28970336914062, -119.17134857177734, -116.05298614501953, -112.93463134765625, -109.81626892089844, -106.69791412353516, -103.57955169677734, -100.46119689941406, -97.34283447265625, -94.22447967529297, -91.10611724853516, -87.98776245117188, -84.86940002441406, -81.75104522705078, -78.63268280029297, -75.51432800292969, -72.39596557617188, -69.2776107788086, -66.15924835205078, -63.040889739990234, -59.92253112792969, -56.80417251586914, -53.685813903808594, -50.56745910644531, -47.44910430908203, -44.330745697021484, -41.21238708496094, -38.09402847290039, -34.975669860839844, -31.857311248779297, -28.738954544067383, -25.620595932006836, -22.502235412597656, -19.38387680053711, -16.265518188476562, -13.147160530090332, -10.028801918029785, -6.910443305969238, -3.792085647583008, -0.6737270355224609, 2.444631576538086, 5.562990188598633, 8.68134880065918, 11.79970645904541, 14.918065071105957, 18.036422729492188, 21.154781341552734, 24.27313995361328, 27.391498565673828, 30.509857177734375, 33.62821578979492, 36.74657440185547, 39.864933013916016, 42.98329162597656, 46.101646423339844, 49.220008850097656, 52.33836364746094, 55.456722259521484, 58.57508087158203, 61.69343948364258, 64.81179809570312, 67.9301528930664, 71.04851531982422, 74.1668701171875, 77.28523254394531]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 4.0, 14.0, 15.0, 19.0, 32.0, 65.0, 80.0, 153.0, 336.0, 639.0, 2049.0, 22492.0, 4116611.0, 48872.0, 2181.0, 376.0, 154.0, 80.0, 42.0, 29.0, 12.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0], "bins": [-190.25, -186.41357421875, -182.5771484375, -178.74072265625, -174.904296875, -171.06787109375, -167.2314453125, -163.39501953125, -159.55859375, -155.72216796875, -151.8857421875, -148.04931640625, -144.212890625, -140.37646484375, -136.5400390625, -132.70361328125, -128.8671875, -125.03076171875, -121.1943359375, -117.35791015625, -113.521484375, -109.68505859375, -105.8486328125, -102.01220703125, -98.17578125, -94.33935546875, -90.5029296875, -86.66650390625, -82.830078125, -78.99365234375, -75.1572265625, -71.32080078125, -67.484375, -63.64794921875, -59.8115234375, -55.97509765625, -52.138671875, -48.30224609375, -44.4658203125, -40.62939453125, -36.79296875, -32.95654296875, -29.1201171875, -25.28369140625, -21.447265625, -17.61083984375, -13.7744140625, -9.93798828125, -6.1015625, -2.26513671875, 1.5712890625, 5.40771484375, 9.244140625, 13.08056640625, 16.9169921875, 20.75341796875, 24.58984375, 28.42626953125, 32.2626953125, 36.09912109375, 39.935546875, 43.77197265625, 47.6083984375, 51.44482421875, 55.28125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 12.0, 6.0, 18.0, 27.0, 39.0, 53.0, 54.0, 62.0, 72.0, 91.0, 83.0, 94.0, 78.0, 72.0, 54.0, 52.0, 33.0, 25.0, 27.0, 14.0, 8.0, 5.0, 4.0, 4.0, 5.0, 4.0, 0.0, 2.0], "bins": [-3.732421875, -3.6519775390625, -3.571533203125, -3.4910888671875, -3.41064453125, -3.3302001953125, -3.249755859375, -3.1693115234375, -3.0888671875, -3.0084228515625, -2.927978515625, -2.8475341796875, -2.76708984375, -2.6866455078125, -2.606201171875, -2.5257568359375, -2.4453125, -2.3648681640625, -2.284423828125, -2.2039794921875, -2.12353515625, -2.0430908203125, -1.962646484375, -1.8822021484375, -1.8017578125, -1.7213134765625, -1.640869140625, -1.5604248046875, -1.47998046875, -1.3995361328125, -1.319091796875, -1.2386474609375, -1.158203125, -1.0777587890625, -0.997314453125, -0.9168701171875, -0.83642578125, -0.7559814453125, -0.675537109375, -0.5950927734375, -0.5146484375, -0.4342041015625, -0.353759765625, -0.2733154296875, -0.19287109375, -0.1124267578125, -0.031982421875, 0.0484619140625, 0.12890625, 0.2093505859375, 0.289794921875, 0.3702392578125, 0.45068359375, 0.5311279296875, 0.611572265625, 0.6920166015625, 0.7724609375, 0.8529052734375, 0.933349609375, 1.0137939453125, 1.09423828125, 1.1746826171875, 1.255126953125, 1.3355712890625, 1.416015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 9.0, 9.0, 11.0, 30.0, 27.0, 31.0, 40.0, 61.0, 94.0, 95.0, 141.0, 297.0, 887.0, 3868.0, 41871.0, 3898371.0, 232638.0, 12187.0, 2051.0, 553.0, 283.0, 163.0, 127.0, 106.0, 66.0, 77.0, 44.0, 35.0, 22.0, 23.0, 11.0, 12.0, 10.0, 9.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-76.5, -74.4169921875, -72.333984375, -70.2509765625, -68.16796875, -66.0849609375, -64.001953125, -61.9189453125, -59.8359375, -57.7529296875, -55.669921875, -53.5869140625, -51.50390625, -49.4208984375, -47.337890625, -45.2548828125, -43.171875, -41.0888671875, -39.005859375, -36.9228515625, -34.83984375, -32.7568359375, -30.673828125, -28.5908203125, -26.5078125, -24.4248046875, -22.341796875, -20.2587890625, -18.17578125, -16.0927734375, -14.009765625, -11.9267578125, -9.84375, -7.7607421875, -5.677734375, -3.5947265625, -1.51171875, 0.5712890625, 2.654296875, 4.7373046875, 6.8203125, 8.9033203125, 10.986328125, 13.0693359375, 15.15234375, 17.2353515625, 19.318359375, 21.4013671875, 23.484375, 25.5673828125, 27.650390625, 29.7333984375, 31.81640625, 33.8994140625, 35.982421875, 38.0654296875, 40.1484375, 42.2314453125, 44.314453125, 46.3974609375, 48.48046875, 50.5634765625, 52.646484375, 54.7294921875, 56.8125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [6.0, 1.0, 1.0, 4.0, 7.0, 22.0, 37.0, 70.0, 180.0, 629.0, 2297.0, 478.0, 153.0, 60.0, 49.0, 31.0, 22.0, 19.0, 10.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.416015625, -3.089691162109375, -2.76336669921875, -2.437042236328125, -2.1107177734375, -1.784393310546875, -1.45806884765625, -1.131744384765625, -0.805419921875, -0.479095458984375, -0.15277099609375, 0.173553466796875, 0.4998779296875, 0.826202392578125, 1.15252685546875, 1.478851318359375, 1.80517578125, 2.131500244140625, 2.45782470703125, 2.784149169921875, 3.1104736328125, 3.436798095703125, 3.76312255859375, 4.089447021484375, 4.415771484375, 4.742095947265625, 5.06842041015625, 5.394744873046875, 5.7210693359375, 6.047393798828125, 6.37371826171875, 6.700042724609375, 7.0263671875, 7.352691650390625, 7.67901611328125, 8.005340576171875, 8.3316650390625, 8.657989501953125, 8.98431396484375, 9.310638427734375, 9.636962890625, 9.963287353515625, 10.28961181640625, 10.615936279296875, 10.9422607421875, 11.268585205078125, 11.59490966796875, 11.921234130859375, 12.24755859375, 12.573883056640625, 12.90020751953125, 13.226531982421875, 13.5528564453125, 13.879180908203125, 14.20550537109375, 14.531829833984375, 14.858154296875, 15.184478759765625, 15.51080322265625, 15.837127685546875, 16.1634521484375, 16.489776611328125, 16.81610107421875, 17.142425537109375, 17.46875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 9.0, 14.0, 78.0, 367.0, 412.0, 114.0, 17.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.359474182128906, -43.52962875366211, -38.69978332519531, -33.86993408203125, -29.040090560913086, -24.21024513244629, -19.38039779663086, -14.550552368164062, -9.720706939697266, -4.8908610343933105, -0.06101512908935547, 4.768831253051758, 9.598676681518555, 14.428522109985352, 19.25836944580078, 24.088214874267578, 28.918060302734375, 33.74790573120117, 38.57775115966797, 43.40760040283203, 48.23744201660156, 53.067291259765625, 57.89713668823242, 62.72698211669922, 67.55682373046875, 72.38667297363281, 77.21651458740234, 82.0463638305664, 86.87620544433594, 91.7060546875, 96.53590393066406, 101.3657455444336, 106.19560241699219, 111.02545166015625, 115.85529327392578, 120.68514251708984, 125.51498413085938, 130.34483337402344, 135.1746826171875, 140.0045166015625, 144.83436584472656, 149.66421508789062, 154.4940643310547, 159.3238983154297, 164.15374755859375, 168.9835968017578, 173.81344604492188, 178.64328002929688, 183.47314453125, 188.30299377441406, 193.13284301757812, 197.96267700195312, 202.7925262451172, 207.62237548828125, 212.4522247314453, 217.28207397460938, 222.11190795898438, 226.94175720214844, 231.7716064453125, 236.6014404296875, 241.43128967285156, 246.26113891601562, 251.0909881591797, 255.92083740234375, 260.75067138671875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 8.0, 16.0, 17.0, 39.0, 50.0, 59.0, 93.0, 103.0, 105.0, 96.0, 101.0, 89.0, 71.0, 40.0, 36.0, 30.0, 17.0, 15.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-66.4062271118164, -64.872802734375, -63.33937454223633, -61.80595016479492, -60.272525787353516, -58.73910140991211, -57.20567321777344, -55.67224884033203, -54.138824462890625, -52.60540008544922, -51.07197189331055, -49.53854751586914, -48.005123138427734, -46.47169876098633, -44.938270568847656, -43.40484619140625, -41.871421813964844, -40.33799743652344, -38.804569244384766, -37.27114486694336, -35.73772048950195, -34.20429611206055, -32.670867919921875, -31.13744354248047, -29.604015350341797, -28.070589065551758, -26.53716468811035, -25.003738403320312, -23.470314025878906, -21.936887741088867, -20.403461456298828, -18.870037078857422, -17.336610794067383, -15.80318546295166, -14.269760131835938, -12.736333847045898, -11.202909469604492, -9.669483184814453, -8.13605785369873, -6.602632522583008, -5.069207191467285, -3.5357818603515625, -2.0023562908172607, -0.468930721282959, 1.0644946098327637, 2.5979199409484863, 4.131345748901367, 5.66477108001709, 7.1981964111328125, 8.731621742248535, 10.265047073364258, 11.798473358154297, 13.331897735595703, 14.865324020385742, 16.39875030517578, 17.932174682617188, 19.465599060058594, 20.999025344848633, 22.53244972229004, 24.065876007080078, 25.599300384521484, 27.132726669311523, 28.666152954101562, 30.19957733154297, 31.733003616333008]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 11.0, 9.0, 10.0, 15.0, 23.0, 20.0, 31.0, 36.0, 57.0, 84.0, 114.0, 253.0, 563.0, 1782.0, 7853.0, 84992.0, 718766.0, 214652.0, 14966.0, 2623.0, 781.0, 338.0, 178.0, 109.0, 77.0, 41.0, 39.0, 31.0, 26.0, 14.0, 10.0, 10.0, 8.0, 7.0, 5.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.5, -42.2802734375, -41.060546875, -39.8408203125, -38.62109375, -37.4013671875, -36.181640625, -34.9619140625, -33.7421875, -32.5224609375, -31.302734375, -30.0830078125, -28.86328125, -27.6435546875, -26.423828125, -25.2041015625, -23.984375, -22.7646484375, -21.544921875, -20.3251953125, -19.10546875, -17.8857421875, -16.666015625, -15.4462890625, -14.2265625, -13.0068359375, -11.787109375, -10.5673828125, -9.34765625, -8.1279296875, -6.908203125, -5.6884765625, -4.46875, -3.2490234375, -2.029296875, -0.8095703125, 0.41015625, 1.6298828125, 2.849609375, 4.0693359375, 5.2890625, 6.5087890625, 7.728515625, 8.9482421875, 10.16796875, 11.3876953125, 12.607421875, 13.8271484375, 15.046875, 16.2666015625, 17.486328125, 18.7060546875, 19.92578125, 21.1455078125, 22.365234375, 23.5849609375, 24.8046875, 26.0244140625, 27.244140625, 28.4638671875, 29.68359375, 30.9033203125, 32.123046875, 33.3427734375, 34.5625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 9.0, 12.0, 27.0, 45.0, 58.0, 80.0, 108.0, 120.0, 123.0, 104.0, 91.0, 73.0, 67.0, 28.0, 23.0, 15.0, 10.0, 6.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21484375, -5.091583251953125, -4.96832275390625, -4.845062255859375, -4.7218017578125, -4.598541259765625, -4.47528076171875, -4.352020263671875, -4.228759765625, -4.105499267578125, -3.98223876953125, -3.858978271484375, -3.7357177734375, -3.612457275390625, -3.48919677734375, -3.365936279296875, -3.24267578125, -3.119415283203125, -2.99615478515625, -2.872894287109375, -2.7496337890625, -2.626373291015625, -2.50311279296875, -2.379852294921875, -2.256591796875, -2.133331298828125, -2.01007080078125, -1.886810302734375, -1.7635498046875, -1.640289306640625, -1.51702880859375, -1.393768310546875, -1.2705078125, -1.147247314453125, -1.02398681640625, -0.900726318359375, -0.7774658203125, -0.654205322265625, -0.53094482421875, -0.407684326171875, -0.284423828125, -0.161163330078125, -0.03790283203125, 0.085357666015625, 0.2086181640625, 0.331878662109375, 0.45513916015625, 0.578399658203125, 0.70166015625, 0.824920654296875, 0.94818115234375, 1.071441650390625, 1.1947021484375, 1.317962646484375, 1.44122314453125, 1.564483642578125, 1.687744140625, 1.811004638671875, 1.93426513671875, 2.057525634765625, 2.1807861328125, 2.304046630859375, 2.42730712890625, 2.550567626953125, 2.673828125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 7.0, 17.0, 13.0, 21.0, 23.0, 40.0, 62.0, 77.0, 117.0, 166.0, 244.0, 399.0, 553.0, 976.0, 1732.0, 3175.0, 6444.0, 15016.0, 40057.0, 120684.0, 311268.0, 332702.0, 136751.0, 45866.0, 16859.0, 7086.0, 3477.0, 1848.0, 984.0, 592.0, 404.0, 277.0, 156.0, 134.0, 77.0, 66.0, 48.0, 33.0, 30.0, 18.0, 16.0, 7.0, 8.0, 4.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.640625, -13.201416015625, -12.76220703125, -12.322998046875, -11.8837890625, -11.444580078125, -11.00537109375, -10.566162109375, -10.126953125, -9.687744140625, -9.24853515625, -8.809326171875, -8.3701171875, -7.930908203125, -7.49169921875, -7.052490234375, -6.61328125, -6.174072265625, -5.73486328125, -5.295654296875, -4.8564453125, -4.417236328125, -3.97802734375, -3.538818359375, -3.099609375, -2.660400390625, -2.22119140625, -1.781982421875, -1.3427734375, -0.903564453125, -0.46435546875, -0.025146484375, 0.4140625, 0.853271484375, 1.29248046875, 1.731689453125, 2.1708984375, 2.610107421875, 3.04931640625, 3.488525390625, 3.927734375, 4.366943359375, 4.80615234375, 5.245361328125, 5.6845703125, 6.123779296875, 6.56298828125, 7.002197265625, 7.44140625, 7.880615234375, 8.31982421875, 8.759033203125, 9.1982421875, 9.637451171875, 10.07666015625, 10.515869140625, 10.955078125, 11.394287109375, 11.83349609375, 12.272705078125, 12.7119140625, 13.151123046875, 13.59033203125, 14.029541015625, 14.46875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 2.0, 8.0, 13.0, 5.0, 9.0, 14.0, 13.0, 22.0, 20.0, 28.0, 30.0, 49.0, 43.0, 58.0, 49.0, 43.0, 54.0, 54.0, 56.0, 45.0, 47.0, 50.0, 49.0, 29.0, 33.0, 38.0, 27.0, 21.0, 20.0, 15.0, 8.0, 9.0, 9.0, 4.0, 7.0, 5.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.25, -9.876220703125, -9.50244140625, -9.128662109375, -8.7548828125, -8.381103515625, -8.00732421875, -7.633544921875, -7.259765625, -6.885986328125, -6.51220703125, -6.138427734375, -5.7646484375, -5.390869140625, -5.01708984375, -4.643310546875, -4.26953125, -3.895751953125, -3.52197265625, -3.148193359375, -2.7744140625, -2.400634765625, -2.02685546875, -1.653076171875, -1.279296875, -0.905517578125, -0.53173828125, -0.157958984375, 0.2158203125, 0.589599609375, 0.96337890625, 1.337158203125, 1.7109375, 2.084716796875, 2.45849609375, 2.832275390625, 3.2060546875, 3.579833984375, 3.95361328125, 4.327392578125, 4.701171875, 5.074951171875, 5.44873046875, 5.822509765625, 6.1962890625, 6.570068359375, 6.94384765625, 7.317626953125, 7.69140625, 8.065185546875, 8.43896484375, 8.812744140625, 9.1865234375, 9.560302734375, 9.93408203125, 10.307861328125, 10.681640625, 11.055419921875, 11.42919921875, 11.802978515625, 12.1767578125, 12.550537109375, 12.92431640625, 13.298095703125, 13.671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 8.0, 22.0, 30.0, 26.0, 52.0, 78.0, 153.0, 234.0, 473.0, 975.0, 2025.0, 5046.0, 16740.0, 100152.0, 681810.0, 202857.0, 25852.0, 7006.0, 2520.0, 1154.0, 583.0, 309.0, 169.0, 101.0, 65.0, 39.0, 27.0, 18.0, 9.0, 7.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.63037109375, -17.0732421875, -16.51611328125, -15.958984375, -15.40185546875, -14.8447265625, -14.28759765625, -13.73046875, -13.17333984375, -12.6162109375, -12.05908203125, -11.501953125, -10.94482421875, -10.3876953125, -9.83056640625, -9.2734375, -8.71630859375, -8.1591796875, -7.60205078125, -7.044921875, -6.48779296875, -5.9306640625, -5.37353515625, -4.81640625, -4.25927734375, -3.7021484375, -3.14501953125, -2.587890625, -2.03076171875, -1.4736328125, -0.91650390625, -0.359375, 0.19775390625, 0.7548828125, 1.31201171875, 1.869140625, 2.42626953125, 2.9833984375, 3.54052734375, 4.09765625, 4.65478515625, 5.2119140625, 5.76904296875, 6.326171875, 6.88330078125, 7.4404296875, 7.99755859375, 8.5546875, 9.11181640625, 9.6689453125, 10.22607421875, 10.783203125, 11.34033203125, 11.8974609375, 12.45458984375, 13.01171875, 13.56884765625, 14.1259765625, 14.68310546875, 15.240234375, 15.79736328125, 16.3544921875, 16.91162109375, 17.46875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 13.0, 18.0, 21.0, 19.0, 30.0, 36.0, 56.0, 59.0, 60.0, 81.0, 76.0, 75.0, 96.0, 80.0, 65.0, 52.0, 36.0, 30.0, 24.0, 18.0, 12.0, 13.0, 4.0, 7.0, 2.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0015869140625, -0.0015444010496139526, -0.0015018880367279053, -0.001459375023841858, -0.0014168620109558105, -0.0013743489980697632, -0.0013318359851837158, -0.0012893229722976685, -0.001246809959411621, -0.0012042969465255737, -0.0011617839336395264, -0.001119270920753479, -0.0010767579078674316, -0.0010342448949813843, -0.000991731882095337, -0.0009492188692092896, -0.0009067058563232422, -0.0008641928434371948, -0.0008216798305511475, -0.0007791668176651001, -0.0007366538047790527, -0.0006941407918930054, -0.000651627779006958, -0.0006091147661209106, -0.0005666017532348633, -0.0005240887403488159, -0.00048157572746276855, -0.0004390627145767212, -0.00039654970169067383, -0.00035403668880462646, -0.0003115236759185791, -0.00026901066303253174, -0.00022649765014648438, -0.000183984637260437, -0.00014147162437438965, -9.895861148834229e-05, -5.644559860229492e-05, -1.3932585716247559e-05, 2.8580427169799805e-05, 7.109344005584717e-05, 0.00011360645294189453, 0.0001561194658279419, 0.00019863247871398926, 0.00024114549160003662, 0.000283658504486084, 0.00032617151737213135, 0.0003686845302581787, 0.0004111975431442261, 0.00045371055603027344, 0.0004962235689163208, 0.0005387365818023682, 0.0005812495946884155, 0.0006237626075744629, 0.0006662756204605103, 0.0007087886333465576, 0.000751301646232605, 0.0007938146591186523, 0.0008363276720046997, 0.0008788406848907471, 0.0009213536977767944, 0.0009638667106628418, 0.0010063797235488892, 0.0010488927364349365, 0.0010914057493209839, 0.0011339187622070312]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 12.0, 8.0, 17.0, 22.0, 54.0, 77.0, 133.0, 295.0, 760.0, 2463.0, 13943.0, 250139.0, 738569.0, 35352.0, 4595.0, 1221.0, 471.0, 192.0, 84.0, 59.0, 30.0, 31.0, 7.0, 12.0, 2.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.265625, -22.377685546875, -21.48974609375, -20.601806640625, -19.7138671875, -18.825927734375, -17.93798828125, -17.050048828125, -16.162109375, -15.274169921875, -14.38623046875, -13.498291015625, -12.6103515625, -11.722412109375, -10.83447265625, -9.946533203125, -9.05859375, -8.170654296875, -7.28271484375, -6.394775390625, -5.5068359375, -4.618896484375, -3.73095703125, -2.843017578125, -1.955078125, -1.067138671875, -0.17919921875, 0.708740234375, 1.5966796875, 2.484619140625, 3.37255859375, 4.260498046875, 5.1484375, 6.036376953125, 6.92431640625, 7.812255859375, 8.7001953125, 9.588134765625, 10.47607421875, 11.364013671875, 12.251953125, 13.139892578125, 14.02783203125, 14.915771484375, 15.8037109375, 16.691650390625, 17.57958984375, 18.467529296875, 19.35546875, 20.243408203125, 21.13134765625, 22.019287109375, 22.9072265625, 23.795166015625, 24.68310546875, 25.571044921875, 26.458984375, 27.346923828125, 28.23486328125, 29.122802734375, 30.0107421875, 30.898681640625, 31.78662109375, 32.674560546875, 33.5625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 12.0, 18.0, 22.0, 20.0, 29.0, 42.0, 60.0, 79.0, 89.0, 118.0, 112.0, 102.0, 75.0, 56.0, 40.0, 27.0, 21.0, 20.0, 13.0, 4.0, 7.0, 5.0, 3.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.6500244140625, -7.393798828125, -7.1375732421875, -6.88134765625, -6.6251220703125, -6.368896484375, -6.1126708984375, -5.8564453125, -5.6002197265625, -5.343994140625, -5.0877685546875, -4.83154296875, -4.5753173828125, -4.319091796875, -4.0628662109375, -3.806640625, -3.5504150390625, -3.294189453125, -3.0379638671875, -2.78173828125, -2.5255126953125, -2.269287109375, -2.0130615234375, -1.7568359375, -1.5006103515625, -1.244384765625, -0.9881591796875, -0.73193359375, -0.4757080078125, -0.219482421875, 0.0367431640625, 0.29296875, 0.5491943359375, 0.805419921875, 1.0616455078125, 1.31787109375, 1.5740966796875, 1.830322265625, 2.0865478515625, 2.3427734375, 2.5989990234375, 2.855224609375, 3.1114501953125, 3.36767578125, 3.6239013671875, 3.880126953125, 4.1363525390625, 4.392578125, 4.6488037109375, 4.905029296875, 5.1612548828125, 5.41748046875, 5.6737060546875, 5.929931640625, 6.1861572265625, 6.4423828125, 6.6986083984375, 6.954833984375, 7.2110595703125, 7.46728515625, 7.7235107421875, 7.979736328125, 8.2359619140625, 8.4921875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 8.0, 27.0, 43.0, 123.0, 226.0, 253.0, 170.0, 80.0, 38.0, 18.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-237.17144775390625, -230.8107147216797, -224.4499969482422, -218.08926391601562, -211.72853088378906, -205.3677978515625, -199.007080078125, -192.64634704589844, -186.28561401367188, -179.9248809814453, -173.5641632080078, -167.20343017578125, -160.8426971435547, -154.48196411132812, -148.12124633789062, -141.76051330566406, -135.39979553222656, -129.0390625, -122.67833709716797, -116.31761169433594, -109.95687866210938, -103.59615325927734, -97.23542785644531, -90.87469482421875, -84.51396942138672, -78.15324401855469, -71.79251098632812, -65.4317855834961, -59.0710563659668, -52.7103271484375, -46.34960174560547, -39.98887252807617, -33.62815856933594, -27.26742935180664, -20.906702041625977, -14.545974731445312, -8.185245513916016, -1.8245162963867188, 4.5362091064453125, 10.89693832397461, 17.257667541503906, 23.618396759033203, 29.979124069213867, 36.33985137939453, 42.70058059692383, 49.061309814453125, 55.422035217285156, 61.78276443481445, 68.14349365234375, 74.50421905517578, 80.86495208740234, 87.22567749023438, 93.58641052246094, 99.94713592529297, 106.307861328125, 112.66859436035156, 119.0293197631836, 125.39004516601562, 131.7507781982422, 138.11151123046875, 144.47222900390625, 150.8329620361328, 157.19369506835938, 163.55441284179688, 169.91514587402344]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 5.0, 7.0, 11.0, 3.0, 13.0, 15.0, 19.0, 17.0, 28.0, 33.0, 26.0, 30.0, 33.0, 43.0, 56.0, 57.0, 67.0, 65.0, 55.0, 42.0, 38.0, 56.0, 48.0, 45.0, 25.0, 28.0, 23.0, 17.0, 19.0, 16.0, 9.0, 10.0, 8.0, 6.0, 4.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-91.54129028320312, -88.80770874023438, -86.07413482666016, -83.3405532836914, -80.60697174072266, -77.87339782714844, -75.13981628417969, -72.40623474121094, -69.67265319824219, -66.93907165527344, -64.20549774169922, -61.47191619873047, -58.73833465576172, -56.004756927490234, -53.27117919921875, -50.53759765625, -47.80402374267578, -45.0704460144043, -42.33686447143555, -39.60328674316406, -36.86970520019531, -34.13612747192383, -31.402549743652344, -28.668970108032227, -25.93539047241211, -23.201810836791992, -20.468231201171875, -17.73465347290039, -15.001073837280273, -12.267494201660156, -9.533916473388672, -6.800336837768555, -4.0667572021484375, -1.3331780433654785, 1.4004011154174805, 4.133979797363281, 6.867559432983398, 9.601139068603516, 12.334716796875, 15.068296432495117, 17.801876068115234, 20.53545570373535, 23.26903533935547, 26.002613067626953, 28.73619270324707, 31.469772338867188, 34.20335006713867, 36.936927795410156, 39.670509338378906, 42.40408706665039, 45.13766860961914, 47.871246337890625, 50.604827880859375, 53.33840560913086, 56.071983337402344, 58.805564880371094, 61.53914260864258, 64.27272033691406, 67.00630187988281, 69.73988342285156, 72.47345733642578, 75.20703887939453, 77.94061279296875, 80.6741943359375, 83.40777587890625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 11.0, 22.0, 15.0, 45.0, 31.0, 62.0, 93.0, 141.0, 266.0, 507.0, 1292.0, 4434.0, 25646.0, 3399694.0, 736682.0, 19808.0, 3661.0, 1041.0, 384.0, 190.0, 106.0, 56.0, 39.0, 16.0, 11.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.5, -71.61181640625, -69.7236328125, -67.83544921875, -65.947265625, -64.05908203125, -62.1708984375, -60.28271484375, -58.39453125, -56.50634765625, -54.6181640625, -52.72998046875, -50.841796875, -48.95361328125, -47.0654296875, -45.17724609375, -43.2890625, -41.40087890625, -39.5126953125, -37.62451171875, -35.736328125, -33.84814453125, -31.9599609375, -30.07177734375, -28.18359375, -26.29541015625, -24.4072265625, -22.51904296875, -20.630859375, -18.74267578125, -16.8544921875, -14.96630859375, -13.078125, -11.18994140625, -9.3017578125, -7.41357421875, -5.525390625, -3.63720703125, -1.7490234375, 0.13916015625, 2.02734375, 3.91552734375, 5.8037109375, 7.69189453125, 9.580078125, 11.46826171875, 13.3564453125, 15.24462890625, 17.1328125, 19.02099609375, 20.9091796875, 22.79736328125, 24.685546875, 26.57373046875, 28.4619140625, 30.35009765625, 32.23828125, 34.12646484375, 36.0146484375, 37.90283203125, 39.791015625, 41.67919921875, 43.5673828125, 45.45556640625, 47.34375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 13.0, 5.0, 22.0, 23.0, 29.0, 41.0, 48.0, 71.0, 83.0, 80.0, 84.0, 88.0, 82.0, 59.0, 59.0, 52.0, 40.0, 42.0, 20.0, 16.0, 13.0, 11.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.66015625, -4.545928955078125, -4.43170166015625, -4.317474365234375, -4.2032470703125, -4.089019775390625, -3.97479248046875, -3.860565185546875, -3.746337890625, -3.632110595703125, -3.51788330078125, -3.403656005859375, -3.2894287109375, -3.175201416015625, -3.06097412109375, -2.946746826171875, -2.83251953125, -2.718292236328125, -2.60406494140625, -2.489837646484375, -2.3756103515625, -2.261383056640625, -2.14715576171875, -2.032928466796875, -1.918701171875, -1.804473876953125, -1.69024658203125, -1.576019287109375, -1.4617919921875, -1.347564697265625, -1.23333740234375, -1.119110107421875, -1.0048828125, -0.890655517578125, -0.77642822265625, -0.662200927734375, -0.5479736328125, -0.433746337890625, -0.31951904296875, -0.205291748046875, -0.091064453125, 0.023162841796875, 0.13739013671875, 0.251617431640625, 0.3658447265625, 0.480072021484375, 0.59429931640625, 0.708526611328125, 0.82275390625, 0.936981201171875, 1.05120849609375, 1.165435791015625, 1.2796630859375, 1.393890380859375, 1.50811767578125, 1.622344970703125, 1.736572265625, 1.850799560546875, 1.96502685546875, 2.079254150390625, 2.1934814453125, 2.307708740234375, 2.42193603515625, 2.536163330078125, 2.650390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 7.0, 12.0, 4.0, 12.0, 9.0, 13.0, 19.0, 28.0, 31.0, 32.0, 41.0, 59.0, 74.0, 123.0, 213.0, 478.0, 1832.0, 18006.0, 4037344.0, 130586.0, 3812.0, 769.0, 318.0, 132.0, 85.0, 56.0, 51.0, 29.0, 21.0, 19.0, 13.0, 15.0, 10.0, 9.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.5625, -73.9873046875, -71.412109375, -68.8369140625, -66.26171875, -63.6865234375, -61.111328125, -58.5361328125, -55.9609375, -53.3857421875, -50.810546875, -48.2353515625, -45.66015625, -43.0849609375, -40.509765625, -37.9345703125, -35.359375, -32.7841796875, -30.208984375, -27.6337890625, -25.05859375, -22.4833984375, -19.908203125, -17.3330078125, -14.7578125, -12.1826171875, -9.607421875, -7.0322265625, -4.45703125, -1.8818359375, 0.693359375, 3.2685546875, 5.84375, 8.4189453125, 10.994140625, 13.5693359375, 16.14453125, 18.7197265625, 21.294921875, 23.8701171875, 26.4453125, 29.0205078125, 31.595703125, 34.1708984375, 36.74609375, 39.3212890625, 41.896484375, 44.4716796875, 47.046875, 49.6220703125, 52.197265625, 54.7724609375, 57.34765625, 59.9228515625, 62.498046875, 65.0732421875, 67.6484375, 70.2236328125, 72.798828125, 75.3740234375, 77.94921875, 80.5244140625, 83.099609375, 85.6748046875, 88.25]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 13.0, 15.0, 23.0, 57.0, 342.0, 2703.0, 693.0, 142.0, 51.0, 22.0, 4.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.421875, -24.8770751953125, -24.332275390625, -23.7874755859375, -23.24267578125, -22.6978759765625, -22.153076171875, -21.6082763671875, -21.0634765625, -20.5186767578125, -19.973876953125, -19.4290771484375, -18.88427734375, -18.3394775390625, -17.794677734375, -17.2498779296875, -16.705078125, -16.1602783203125, -15.615478515625, -15.0706787109375, -14.52587890625, -13.9810791015625, -13.436279296875, -12.8914794921875, -12.3466796875, -11.8018798828125, -11.257080078125, -10.7122802734375, -10.16748046875, -9.6226806640625, -9.077880859375, -8.5330810546875, -7.98828125, -7.4434814453125, -6.898681640625, -6.3538818359375, -5.80908203125, -5.2642822265625, -4.719482421875, -4.1746826171875, -3.6298828125, -3.0850830078125, -2.540283203125, -1.9954833984375, -1.45068359375, -0.9058837890625, -0.361083984375, 0.1837158203125, 0.728515625, 1.2733154296875, 1.818115234375, 2.3629150390625, 2.90771484375, 3.4525146484375, 3.997314453125, 4.5421142578125, 5.0869140625, 5.6317138671875, 6.176513671875, 6.7213134765625, 7.26611328125, 7.8109130859375, 8.355712890625, 8.9005126953125, 9.4453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 21.0, 66.0, 173.0, 290.0, 257.0, 121.0, 32.0, 16.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.47831726074219, -89.66240692138672, -86.84649658203125, -84.03059387207031, -81.21468353271484, -78.39877319335938, -75.5828628540039, -72.76695251464844, -69.9510498046875, -67.13513946533203, -64.31922912597656, -61.50332260131836, -58.687416076660156, -55.87150573730469, -53.05559539794922, -50.23968505859375, -47.42377471923828, -44.60786437988281, -41.79195785522461, -38.97604751586914, -36.16014099121094, -33.34423065185547, -30.5283203125, -27.712411880493164, -24.896503448486328, -22.080595016479492, -19.264686584472656, -16.448776245117188, -13.632867813110352, -10.816959381103516, -8.001049041748047, -5.185140609741211, -2.369232177734375, 0.44667673110961914, 3.2625856399536133, 6.078495025634766, 8.894403457641602, 11.710311889648438, 14.526222229003906, 17.342130661010742, 20.158039093017578, 22.973947525024414, 25.78985595703125, 28.60576629638672, 31.421674728393555, 34.23758316040039, 37.05349349975586, 39.86940002441406, 42.68531036376953, 45.501220703125, 48.3171272277832, 51.13303756713867, 53.948944091796875, 56.764854431152344, 59.58076477050781, 62.39667510986328, 65.21258544921875, 68.02849578857422, 70.84440612792969, 73.66030883789062, 76.4762191772461, 79.29212951660156, 82.10803985595703, 84.9239501953125, 87.73985290527344]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 6.0, 9.0, 12.0, 17.0, 18.0, 19.0, 37.0, 35.0, 51.0, 53.0, 58.0, 65.0, 59.0, 71.0, 72.0, 65.0, 49.0, 46.0, 56.0, 48.0, 40.0, 29.0, 23.0, 25.0, 14.0, 12.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.537078857421875, -27.61844825744629, -26.699819564819336, -25.78118896484375, -24.862558364868164, -23.943927764892578, -23.025299072265625, -22.10666847229004, -21.188037872314453, -20.269407272338867, -19.350778579711914, -18.432147979736328, -17.513517379760742, -16.594886779785156, -15.676258087158203, -14.757627487182617, -13.838998794555664, -12.920369148254395, -12.001738548278809, -11.083108901977539, -10.164478302001953, -9.245848655700684, -8.327219009399414, -7.408588886260986, -6.489958763122559, -5.571328639984131, -4.652698516845703, -3.7340688705444336, -2.815438747406006, -1.8968086242675781, -0.9781789779663086, -0.05954885482788086, 0.8590831756591797, 1.7777131795883179, 2.696343183517456, 3.6149730682373047, 4.533603191375732, 5.45223331451416, 6.37086296081543, 7.289493083953857, 8.208123207092285, 9.126752853393555, 10.04538345336914, 10.96401309967041, 11.88264274597168, 12.801273345947266, 13.719902992248535, 14.638532638549805, 15.55716323852539, 16.475793838500977, 17.39442253112793, 18.313053131103516, 19.2316837310791, 20.150314331054688, 21.06894302368164, 21.987573623657227, 22.906204223632812, 23.8248348236084, 24.74346351623535, 25.662094116210938, 26.580724716186523, 27.49935531616211, 28.417984008789062, 29.33661460876465, 30.2552433013916]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 10.0, 17.0, 22.0, 41.0, 51.0, 62.0, 108.0, 184.0, 291.0, 465.0, 858.0, 2067.0, 5362.0, 18324.0, 76799.0, 316666.0, 445101.0, 136958.0, 31083.0, 8394.0, 2898.0, 1215.0, 621.0, 355.0, 194.0, 121.0, 75.0, 56.0, 35.0, 35.0, 15.0, 13.0, 10.0, 8.0, 7.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.953125, -20.34033203125, -19.7275390625, -19.11474609375, -18.501953125, -17.88916015625, -17.2763671875, -16.66357421875, -16.05078125, -15.43798828125, -14.8251953125, -14.21240234375, -13.599609375, -12.98681640625, -12.3740234375, -11.76123046875, -11.1484375, -10.53564453125, -9.9228515625, -9.31005859375, -8.697265625, -8.08447265625, -7.4716796875, -6.85888671875, -6.24609375, -5.63330078125, -5.0205078125, -4.40771484375, -3.794921875, -3.18212890625, -2.5693359375, -1.95654296875, -1.34375, -0.73095703125, -0.1181640625, 0.49462890625, 1.107421875, 1.72021484375, 2.3330078125, 2.94580078125, 3.55859375, 4.17138671875, 4.7841796875, 5.39697265625, 6.009765625, 6.62255859375, 7.2353515625, 7.84814453125, 8.4609375, 9.07373046875, 9.6865234375, 10.29931640625, 10.912109375, 11.52490234375, 12.1376953125, 12.75048828125, 13.36328125, 13.97607421875, 14.5888671875, 15.20166015625, 15.814453125, 16.42724609375, 17.0400390625, 17.65283203125, 18.265625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 14.0, 16.0, 20.0, 19.0, 42.0, 67.0, 74.0, 77.0, 104.0, 104.0, 88.0, 79.0, 81.0, 60.0, 49.0, 39.0, 24.0, 19.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.10546875, -4.969390869140625, -4.83331298828125, -4.697235107421875, -4.5611572265625, -4.425079345703125, -4.28900146484375, -4.152923583984375, -4.016845703125, -3.880767822265625, -3.74468994140625, -3.608612060546875, -3.4725341796875, -3.336456298828125, -3.20037841796875, -3.064300537109375, -2.92822265625, -2.792144775390625, -2.65606689453125, -2.519989013671875, -2.3839111328125, -2.247833251953125, -2.11175537109375, -1.975677490234375, -1.839599609375, -1.703521728515625, -1.56744384765625, -1.431365966796875, -1.2952880859375, -1.159210205078125, -1.02313232421875, -0.887054443359375, -0.7509765625, -0.614898681640625, -0.47882080078125, -0.342742919921875, -0.2066650390625, -0.070587158203125, 0.06549072265625, 0.201568603515625, 0.337646484375, 0.473724365234375, 0.60980224609375, 0.745880126953125, 0.8819580078125, 1.018035888671875, 1.15411376953125, 1.290191650390625, 1.42626953125, 1.562347412109375, 1.69842529296875, 1.834503173828125, 1.9705810546875, 2.106658935546875, 2.24273681640625, 2.378814697265625, 2.514892578125, 2.650970458984375, 2.78704833984375, 2.923126220703125, 3.0592041015625, 3.195281982421875, 3.33135986328125, 3.467437744140625, 3.603515625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 9.0, 8.0, 17.0, 18.0, 32.0, 37.0, 44.0, 73.0, 106.0, 150.0, 258.0, 446.0, 711.0, 1341.0, 3107.0, 7715.0, 22049.0, 70877.0, 240440.0, 423804.0, 192453.0, 55446.0, 17524.0, 6354.0, 2557.0, 1201.0, 627.0, 393.0, 246.0, 169.0, 113.0, 64.0, 48.0, 39.0, 20.0, 23.0, 11.0, 11.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.90625, -15.4300537109375, -14.953857421875, -14.4776611328125, -14.00146484375, -13.5252685546875, -13.049072265625, -12.5728759765625, -12.0966796875, -11.6204833984375, -11.144287109375, -10.6680908203125, -10.19189453125, -9.7156982421875, -9.239501953125, -8.7633056640625, -8.287109375, -7.8109130859375, -7.334716796875, -6.8585205078125, -6.38232421875, -5.9061279296875, -5.429931640625, -4.9537353515625, -4.4775390625, -4.0013427734375, -3.525146484375, -3.0489501953125, -2.57275390625, -2.0965576171875, -1.620361328125, -1.1441650390625, -0.66796875, -0.1917724609375, 0.284423828125, 0.7606201171875, 1.23681640625, 1.7130126953125, 2.189208984375, 2.6654052734375, 3.1416015625, 3.6177978515625, 4.093994140625, 4.5701904296875, 5.04638671875, 5.5225830078125, 5.998779296875, 6.4749755859375, 6.951171875, 7.4273681640625, 7.903564453125, 8.3797607421875, 8.85595703125, 9.3321533203125, 9.808349609375, 10.2845458984375, 10.7607421875, 11.2369384765625, 11.713134765625, 12.1893310546875, 12.66552734375, 13.1417236328125, 13.617919921875, 14.0941162109375, 14.5703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 7.0, 8.0, 10.0, 10.0, 7.0, 15.0, 18.0, 18.0, 18.0, 23.0, 25.0, 20.0, 28.0, 34.0, 31.0, 34.0, 31.0, 36.0, 40.0, 35.0, 37.0, 42.0, 42.0, 45.0, 39.0, 29.0, 30.0, 39.0, 32.0, 28.0, 30.0, 23.0, 19.0, 15.0, 19.0, 12.0, 16.0, 15.0, 9.0, 6.0, 9.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.1953125, -8.875244140625, -8.55517578125, -8.235107421875, -7.9150390625, -7.594970703125, -7.27490234375, -6.954833984375, -6.634765625, -6.314697265625, -5.99462890625, -5.674560546875, -5.3544921875, -5.034423828125, -4.71435546875, -4.394287109375, -4.07421875, -3.754150390625, -3.43408203125, -3.114013671875, -2.7939453125, -2.473876953125, -2.15380859375, -1.833740234375, -1.513671875, -1.193603515625, -0.87353515625, -0.553466796875, -0.2333984375, 0.086669921875, 0.40673828125, 0.726806640625, 1.046875, 1.366943359375, 1.68701171875, 2.007080078125, 2.3271484375, 2.647216796875, 2.96728515625, 3.287353515625, 3.607421875, 3.927490234375, 4.24755859375, 4.567626953125, 4.8876953125, 5.207763671875, 5.52783203125, 5.847900390625, 6.16796875, 6.488037109375, 6.80810546875, 7.128173828125, 7.4482421875, 7.768310546875, 8.08837890625, 8.408447265625, 8.728515625, 9.048583984375, 9.36865234375, 9.688720703125, 10.0087890625, 10.328857421875, 10.64892578125, 10.968994140625, 11.2890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 18.0, 18.0, 43.0, 35.0, 52.0, 109.0, 183.0, 267.0, 517.0, 1211.0, 2802.0, 7643.0, 24027.0, 96599.0, 368972.0, 396165.0, 108966.0, 27069.0, 8340.0, 2895.0, 1263.0, 586.0, 284.0, 173.0, 110.0, 66.0, 37.0, 13.0, 19.0, 15.0, 12.0, 7.0, 6.0, 5.0, 1.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3359375, -7.099609375, -6.86328125, -6.626953125, -6.390625, -6.154296875, -5.91796875, -5.681640625, -5.4453125, -5.208984375, -4.97265625, -4.736328125, -4.5, -4.263671875, -4.02734375, -3.791015625, -3.5546875, -3.318359375, -3.08203125, -2.845703125, -2.609375, -2.373046875, -2.13671875, -1.900390625, -1.6640625, -1.427734375, -1.19140625, -0.955078125, -0.71875, -0.482421875, -0.24609375, -0.009765625, 0.2265625, 0.462890625, 0.69921875, 0.935546875, 1.171875, 1.408203125, 1.64453125, 1.880859375, 2.1171875, 2.353515625, 2.58984375, 2.826171875, 3.0625, 3.298828125, 3.53515625, 3.771484375, 4.0078125, 4.244140625, 4.48046875, 4.716796875, 4.953125, 5.189453125, 5.42578125, 5.662109375, 5.8984375, 6.134765625, 6.37109375, 6.607421875, 6.84375, 7.080078125, 7.31640625, 7.552734375, 7.7890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 12.0, 12.0, 19.0, 24.0, 26.0, 15.0, 38.0, 34.0, 38.0, 60.0, 80.0, 91.0, 85.0, 85.0, 70.0, 66.0, 58.0, 45.0, 29.0, 25.0, 23.0, 18.0, 19.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.001102447509765625, -0.0010731369256973267, -0.0010438263416290283, -0.00101451575756073, -0.0009852051734924316, -0.0009558945894241333, -0.000926584005355835, -0.0008972734212875366, -0.0008679628372192383, -0.0008386522531509399, -0.0008093416690826416, -0.0007800310850143433, -0.0007507205009460449, -0.0007214099168777466, -0.0006920993328094482, -0.0006627887487411499, -0.0006334781646728516, -0.0006041675806045532, -0.0005748569965362549, -0.0005455464124679565, -0.0005162358283996582, -0.00048692524433135986, -0.0004576146602630615, -0.0004283040761947632, -0.00039899349212646484, -0.0003696829080581665, -0.00034037232398986816, -0.0003110617399215698, -0.0002817511558532715, -0.00025244057178497314, -0.0002231299877166748, -0.00019381940364837646, -0.00016450881958007812, -0.00013519823551177979, -0.00010588765144348145, -7.65770673751831e-05, -4.7266483306884766e-05, -1.7955899238586426e-05, 1.1354684829711914e-05, 4.0665268898010254e-05, 6.99758529663086e-05, 9.928643703460693e-05, 0.00012859702110290527, 0.0001579076051712036, 0.00018721818923950195, 0.0002165287733078003, 0.00024583935737609863, 0.00027514994144439697, 0.0003044605255126953, 0.00033377110958099365, 0.000363081693649292, 0.00039239227771759033, 0.00042170286178588867, 0.000451013445854187, 0.00048032402992248535, 0.0005096346139907837, 0.000538945198059082, 0.0005682557821273804, 0.0005975663661956787, 0.000626876950263977, 0.0006561875343322754, 0.0006854981184005737, 0.0007148087024688721, 0.0007441192865371704, 0.0007734298706054688]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 12.0, 8.0, 12.0, 34.0, 41.0, 65.0, 113.0, 176.0, 278.0, 511.0, 980.0, 1971.0, 4827.0, 13200.0, 48263.0, 240955.0, 512355.0, 171614.0, 35425.0, 10110.0, 3835.0, 1702.0, 892.0, 440.0, 263.0, 161.0, 98.0, 67.0, 44.0, 27.0, 18.0, 13.0, 14.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0], "bins": [-10.828125, -10.54608154296875, -10.2640380859375, -9.98199462890625, -9.699951171875, -9.41790771484375, -9.1358642578125, -8.85382080078125, -8.57177734375, -8.28973388671875, -8.0076904296875, -7.72564697265625, -7.443603515625, -7.16156005859375, -6.8795166015625, -6.59747314453125, -6.3154296875, -6.03338623046875, -5.7513427734375, -5.46929931640625, -5.187255859375, -4.90521240234375, -4.6231689453125, -4.34112548828125, -4.05908203125, -3.77703857421875, -3.4949951171875, -3.21295166015625, -2.930908203125, -2.64886474609375, -2.3668212890625, -2.08477783203125, -1.802734375, -1.52069091796875, -1.2386474609375, -0.95660400390625, -0.674560546875, -0.39251708984375, -0.1104736328125, 0.17156982421875, 0.45361328125, 0.73565673828125, 1.0177001953125, 1.29974365234375, 1.581787109375, 1.86383056640625, 2.1458740234375, 2.42791748046875, 2.7099609375, 2.99200439453125, 3.2740478515625, 3.55609130859375, 3.838134765625, 4.12017822265625, 4.4022216796875, 4.68426513671875, 4.96630859375, 5.24835205078125, 5.5303955078125, 5.81243896484375, 6.094482421875, 6.37652587890625, 6.6585693359375, 6.94061279296875, 7.22265625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 2.0, 10.0, 6.0, 13.0, 12.0, 17.0, 42.0, 47.0, 60.0, 87.0, 81.0, 84.0, 98.0, 88.0, 90.0, 70.0, 47.0, 49.0, 27.0, 27.0, 11.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9609375, -4.7279052734375, -4.494873046875, -4.2618408203125, -4.02880859375, -3.7957763671875, -3.562744140625, -3.3297119140625, -3.0966796875, -2.8636474609375, -2.630615234375, -2.3975830078125, -2.16455078125, -1.9315185546875, -1.698486328125, -1.4654541015625, -1.232421875, -0.9993896484375, -0.766357421875, -0.5333251953125, -0.30029296875, -0.0672607421875, 0.165771484375, 0.3988037109375, 0.6318359375, 0.8648681640625, 1.097900390625, 1.3309326171875, 1.56396484375, 1.7969970703125, 2.030029296875, 2.2630615234375, 2.49609375, 2.7291259765625, 2.962158203125, 3.1951904296875, 3.42822265625, 3.6612548828125, 3.894287109375, 4.1273193359375, 4.3603515625, 4.5933837890625, 4.826416015625, 5.0594482421875, 5.29248046875, 5.5255126953125, 5.758544921875, 5.9915771484375, 6.224609375, 6.4576416015625, 6.690673828125, 6.9237060546875, 7.15673828125, 7.3897705078125, 7.622802734375, 7.8558349609375, 8.0888671875, 8.3218994140625, 8.554931640625, 8.7879638671875, 9.02099609375, 9.2540283203125, 9.487060546875, 9.7200927734375, 9.953125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 8.0, 11.0, 31.0, 46.0, 86.0, 181.0, 205.0, 186.0, 134.0, 59.0, 23.0, 13.0, 6.0, 8.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.32009887695312, -99.5240249633789, -94.72795104980469, -89.93187713623047, -85.13580322265625, -80.33972930908203, -75.54365539550781, -70.74758911132812, -65.95150756835938, -61.155433654785156, -56.35935974121094, -51.56328582763672, -46.7672119140625, -41.97113800048828, -37.17506790161133, -32.37899398803711, -27.582923889160156, -22.786849975585938, -17.99077606201172, -13.194704055786133, -8.398630142211914, -3.6025562286376953, 1.1935157775878906, 5.989589691162109, 10.785663604736328, 15.581737518310547, 20.377811431884766, 25.17388343811035, 29.96995735168457, 34.766029357910156, 39.562103271484375, 44.358177185058594, 49.15425109863281, 53.95032501220703, 58.74639892578125, 63.54247283935547, 68.33854675292969, 73.1346206665039, 77.93069458007812, 82.72676086425781, 87.52284240722656, 92.31891632080078, 97.114990234375, 101.91106414794922, 106.70713806152344, 111.50321197509766, 116.29928588867188, 121.09535217285156, 125.89142608642578, 130.6875, 135.4835662841797, 140.27964782714844, 145.07571411132812, 149.87179565429688, 154.66786193847656, 159.4639434814453, 164.260009765625, 169.0560760498047, 173.85215759277344, 178.64822387695312, 183.44430541992188, 188.24037170410156, 193.0364532470703, 197.83251953125, 202.62860107421875]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 8.0, 8.0, 9.0, 11.0, 11.0, 18.0, 27.0, 26.0, 29.0, 40.0, 59.0, 49.0, 54.0, 58.0, 53.0, 65.0, 63.0, 51.0, 48.0, 43.0, 44.0, 41.0, 34.0, 35.0, 18.0, 18.0, 22.0, 15.0, 7.0, 9.0, 4.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-96.15040588378906, -93.51943969726562, -90.88846588134766, -88.25749969482422, -85.62653350830078, -82.99556732177734, -80.36459350585938, -77.73362731933594, -75.1026611328125, -72.47169494628906, -69.8407211303711, -67.20975494384766, -64.57878875732422, -61.947818756103516, -59.31684875488281, -56.685882568359375, -54.05491256713867, -51.42394256591797, -48.79297637939453, -46.16200637817383, -43.53104019165039, -40.90007019042969, -38.26910400390625, -35.63813400268555, -33.007164001464844, -30.376195907592773, -27.745227813720703, -25.1142578125, -22.483291625976562, -19.85232162475586, -17.22135353088379, -14.590385437011719, -11.959419250488281, -9.328451156616211, -6.697482585906982, -4.066514015197754, -1.4355459213256836, 1.1954221725463867, 3.8263912200927734, 6.457359313964844, 9.088327407836914, 11.719295501708984, 14.350263595581055, 16.981231689453125, 19.612201690673828, 22.243167877197266, 24.87413787841797, 27.50510597229004, 30.13607406616211, 32.76704406738281, 35.39801025390625, 38.02898025512695, 40.65994644165039, 43.290916442871094, 45.92188262939453, 48.552852630615234, 51.18382263183594, 53.81479263305664, 56.44575881958008, 59.07672882080078, 61.70769500732422, 64.33866119384766, 66.96963500976562, 69.60060119628906, 72.2315673828125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 12.0, 12.0, 10.0, 14.0, 23.0, 13.0, 30.0, 42.0, 89.0, 109.0, 173.0, 358.0, 603.0, 1410.0, 3250.0, 12519.0, 142223.0, 3934011.0, 84233.0, 9681.0, 2925.0, 1199.0, 599.0, 301.0, 155.0, 91.0, 65.0, 44.0, 26.0, 11.0, 14.0, 11.0, 8.0, 3.0, 3.0, 1.0, 4.0, 3.0], "bins": [-43.75, -42.742431640625, -41.73486328125, -40.727294921875, -39.7197265625, -38.712158203125, -37.70458984375, -36.697021484375, -35.689453125, -34.681884765625, -33.67431640625, -32.666748046875, -31.6591796875, -30.651611328125, -29.64404296875, -28.636474609375, -27.62890625, -26.621337890625, -25.61376953125, -24.606201171875, -23.5986328125, -22.591064453125, -21.58349609375, -20.575927734375, -19.568359375, -18.560791015625, -17.55322265625, -16.545654296875, -15.5380859375, -14.530517578125, -13.52294921875, -12.515380859375, -11.5078125, -10.500244140625, -9.49267578125, -8.485107421875, -7.4775390625, -6.469970703125, -5.46240234375, -4.454833984375, -3.447265625, -2.439697265625, -1.43212890625, -0.424560546875, 0.5830078125, 1.590576171875, 2.59814453125, 3.605712890625, 4.61328125, 5.620849609375, 6.62841796875, 7.635986328125, 8.6435546875, 9.651123046875, 10.65869140625, 11.666259765625, 12.673828125, 13.681396484375, 14.68896484375, 15.696533203125, 16.7041015625, 17.711669921875, 18.71923828125, 19.726806640625, 20.734375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 18.0, 14.0, 33.0, 38.0, 55.0, 84.0, 96.0, 122.0, 103.0, 100.0, 89.0, 71.0, 46.0, 34.0, 41.0, 25.0, 10.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.08203125, -5.91949462890625, -5.7569580078125, -5.59442138671875, -5.431884765625, -5.26934814453125, -5.1068115234375, -4.94427490234375, -4.78173828125, -4.61920166015625, -4.4566650390625, -4.29412841796875, -4.131591796875, -3.96905517578125, -3.8065185546875, -3.64398193359375, -3.4814453125, -3.31890869140625, -3.1563720703125, -2.99383544921875, -2.831298828125, -2.66876220703125, -2.5062255859375, -2.34368896484375, -2.18115234375, -2.01861572265625, -1.8560791015625, -1.69354248046875, -1.531005859375, -1.36846923828125, -1.2059326171875, -1.04339599609375, -0.880859375, -0.71832275390625, -0.5557861328125, -0.39324951171875, -0.230712890625, -0.06817626953125, 0.0943603515625, 0.25689697265625, 0.41943359375, 0.58197021484375, 0.7445068359375, 0.90704345703125, 1.069580078125, 1.23211669921875, 1.3946533203125, 1.55718994140625, 1.7197265625, 1.88226318359375, 2.0447998046875, 2.20733642578125, 2.369873046875, 2.53240966796875, 2.6949462890625, 2.85748291015625, 3.02001953125, 3.18255615234375, 3.3450927734375, 3.50762939453125, 3.670166015625, 3.83270263671875, 3.9952392578125, 4.15777587890625, 4.3203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 11.0, 21.0, 17.0, 24.0, 34.0, 67.0, 88.0, 131.0, 292.0, 703.0, 2607.0, 24020.0, 3994033.0, 164585.0, 5616.0, 1138.0, 376.0, 180.0, 107.0, 79.0, 39.0, 39.0, 16.0, 14.0, 12.0, 6.0, 6.0, 2.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.65625, -35.04345703125, -33.4306640625, -31.81787109375, -30.205078125, -28.59228515625, -26.9794921875, -25.36669921875, -23.75390625, -22.14111328125, -20.5283203125, -18.91552734375, -17.302734375, -15.68994140625, -14.0771484375, -12.46435546875, -10.8515625, -9.23876953125, -7.6259765625, -6.01318359375, -4.400390625, -2.78759765625, -1.1748046875, 0.43798828125, 2.05078125, 3.66357421875, 5.2763671875, 6.88916015625, 8.501953125, 10.11474609375, 11.7275390625, 13.34033203125, 14.953125, 16.56591796875, 18.1787109375, 19.79150390625, 21.404296875, 23.01708984375, 24.6298828125, 26.24267578125, 27.85546875, 29.46826171875, 31.0810546875, 32.69384765625, 34.306640625, 35.91943359375, 37.5322265625, 39.14501953125, 40.7578125, 42.37060546875, 43.9833984375, 45.59619140625, 47.208984375, 48.82177734375, 50.4345703125, 52.04736328125, 53.66015625, 55.27294921875, 56.8857421875, 58.49853515625, 60.111328125, 61.72412109375, 63.3369140625, 64.94970703125, 66.5625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 5.0, 6.0, 10.0, 23.0, 18.0, 30.0, 71.0, 143.0, 384.0, 1346.0, 1317.0, 410.0, 134.0, 65.0, 52.0, 17.0, 15.0, 10.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1171875, -6.9078369140625, -6.698486328125, -6.4891357421875, -6.27978515625, -6.0704345703125, -5.861083984375, -5.6517333984375, -5.4423828125, -5.2330322265625, -5.023681640625, -4.8143310546875, -4.60498046875, -4.3956298828125, -4.186279296875, -3.9769287109375, -3.767578125, -3.5582275390625, -3.348876953125, -3.1395263671875, -2.93017578125, -2.7208251953125, -2.511474609375, -2.3021240234375, -2.0927734375, -1.8834228515625, -1.674072265625, -1.4647216796875, -1.25537109375, -1.0460205078125, -0.836669921875, -0.6273193359375, -0.41796875, -0.2086181640625, 0.000732421875, 0.2100830078125, 0.41943359375, 0.6287841796875, 0.838134765625, 1.0474853515625, 1.2568359375, 1.4661865234375, 1.675537109375, 1.8848876953125, 2.09423828125, 2.3035888671875, 2.512939453125, 2.7222900390625, 2.931640625, 3.1409912109375, 3.350341796875, 3.5596923828125, 3.76904296875, 3.9783935546875, 4.187744140625, 4.3970947265625, 4.6064453125, 4.8157958984375, 5.025146484375, 5.2344970703125, 5.44384765625, 5.6531982421875, 5.862548828125, 6.0718994140625, 6.28125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 52.0, 132.0, 303.0, 308.0, 141.0, 36.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.61771392822266, -108.1576919555664, -105.69766235351562, -103.23764038085938, -100.7776107788086, -98.31758880615234, -95.85755920410156, -93.39753723144531, -90.93751525878906, -88.47749328613281, -86.01746368408203, -83.55744171142578, -81.097412109375, -78.63739013671875, -76.17736053466797, -73.71733856201172, -71.25730895996094, -68.79728698730469, -66.3372573852539, -63.87723159790039, -61.417205810546875, -58.957183837890625, -56.49715805053711, -54.037132263183594, -51.57710647583008, -49.11708068847656, -46.65705490112305, -44.19702911376953, -41.73700714111328, -39.2769775390625, -36.81695556640625, -34.356929779052734, -31.89691162109375, -29.436885833740234, -26.97686004638672, -24.516836166381836, -22.05681037902832, -19.596784591674805, -17.136760711669922, -14.676734924316406, -12.21670913696289, -9.756683349609375, -7.296658515930176, -4.836633205413818, -2.376607894897461, 0.08341789245605469, 2.543442726135254, 5.003467559814453, 7.463493347167969, 9.923519134521484, 12.383543968200684, 14.843568801879883, 17.3035945892334, 19.763620376586914, 22.223644256591797, 24.683670043945312, 27.143695831298828, 29.603721618652344, 32.06374740600586, 34.523773193359375, 36.983795166015625, 39.443824768066406, 41.903846740722656, 44.36387252807617, 46.82389831542969]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 9.0, 10.0, 21.0, 23.0, 21.0, 33.0, 36.0, 51.0, 60.0, 62.0, 80.0, 64.0, 67.0, 86.0, 56.0, 77.0, 59.0, 48.0, 41.0, 20.0, 24.0, 13.0, 12.0, 10.0, 2.0, 8.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.828554153442383, -20.068880081176758, -19.309206008911133, -18.549531936645508, -17.789857864379883, -17.030183792114258, -16.270509719848633, -15.510835647583008, -14.751161575317383, -13.991487503051758, -13.231813430786133, -12.472139358520508, -11.712465286254883, -10.952791213989258, -10.193117141723633, -9.433443069458008, -8.673768997192383, -7.914094924926758, -7.154420852661133, -6.394746780395508, -5.635072708129883, -4.875398635864258, -4.115724563598633, -3.356050491333008, -2.596376419067383, -1.8367023468017578, -1.0770282745361328, -0.3173542022705078, 0.4423198699951172, 1.2019939422607422, 1.9616680145263672, 2.721342086791992, 3.48101806640625, 4.240692138671875, 5.0003662109375, 5.760040283203125, 6.51971435546875, 7.279388427734375, 8.0390625, 8.798736572265625, 9.55841064453125, 10.318084716796875, 11.0777587890625, 11.837432861328125, 12.59710693359375, 13.356781005859375, 14.116455078125, 14.876129150390625, 15.63580322265625, 16.395477294921875, 17.1551513671875, 17.914825439453125, 18.67449951171875, 19.434173583984375, 20.19384765625, 20.953521728515625, 21.71319580078125, 22.472869873046875, 23.2325439453125, 23.992218017578125, 24.75189208984375, 25.511566162109375, 26.271240234375, 27.030914306640625, 27.79058837890625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 7.0, 3.0, 6.0, 11.0, 12.0, 10.0, 23.0, 25.0, 31.0, 55.0, 57.0, 104.0, 145.0, 283.0, 426.0, 740.0, 1487.0, 3325.0, 10069.0, 37796.0, 168328.0, 464099.0, 272277.0, 64552.0, 15599.0, 4794.0, 1969.0, 926.0, 501.0, 297.0, 182.0, 120.0, 74.0, 68.0, 49.0, 34.0, 16.0, 16.0, 12.0, 5.0, 8.0, 10.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5859375, -14.0589599609375, -13.531982421875, -13.0050048828125, -12.47802734375, -11.9510498046875, -11.424072265625, -10.8970947265625, -10.3701171875, -9.8431396484375, -9.316162109375, -8.7891845703125, -8.26220703125, -7.7352294921875, -7.208251953125, -6.6812744140625, -6.154296875, -5.6273193359375, -5.100341796875, -4.5733642578125, -4.04638671875, -3.5194091796875, -2.992431640625, -2.4654541015625, -1.9384765625, -1.4114990234375, -0.884521484375, -0.3575439453125, 0.16943359375, 0.6964111328125, 1.223388671875, 1.7503662109375, 2.27734375, 2.8043212890625, 3.331298828125, 3.8582763671875, 4.38525390625, 4.9122314453125, 5.439208984375, 5.9661865234375, 6.4931640625, 7.0201416015625, 7.547119140625, 8.0740966796875, 8.60107421875, 9.1280517578125, 9.655029296875, 10.1820068359375, 10.708984375, 11.2359619140625, 11.762939453125, 12.2899169921875, 12.81689453125, 13.3438720703125, 13.870849609375, 14.3978271484375, 14.9248046875, 15.4517822265625, 15.978759765625, 16.5057373046875, 17.03271484375, 17.5596923828125, 18.086669921875, 18.6136474609375, 19.140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 11.0, 22.0, 28.0, 34.0, 82.0, 91.0, 105.0, 123.0, 120.0, 100.0, 74.0, 73.0, 46.0, 37.0, 19.0, 16.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.6484375, -6.47320556640625, -6.2979736328125, -6.12274169921875, -5.947509765625, -5.77227783203125, -5.5970458984375, -5.42181396484375, -5.24658203125, -5.07135009765625, -4.8961181640625, -4.72088623046875, -4.545654296875, -4.37042236328125, -4.1951904296875, -4.01995849609375, -3.8447265625, -3.66949462890625, -3.4942626953125, -3.31903076171875, -3.143798828125, -2.96856689453125, -2.7933349609375, -2.61810302734375, -2.44287109375, -2.26763916015625, -2.0924072265625, -1.91717529296875, -1.741943359375, -1.56671142578125, -1.3914794921875, -1.21624755859375, -1.041015625, -0.86578369140625, -0.6905517578125, -0.51531982421875, -0.340087890625, -0.16485595703125, 0.0103759765625, 0.18560791015625, 0.36083984375, 0.53607177734375, 0.7113037109375, 0.88653564453125, 1.061767578125, 1.23699951171875, 1.4122314453125, 1.58746337890625, 1.7626953125, 1.93792724609375, 2.1131591796875, 2.28839111328125, 2.463623046875, 2.63885498046875, 2.8140869140625, 2.98931884765625, 3.16455078125, 3.33978271484375, 3.5150146484375, 3.69024658203125, 3.865478515625, 4.04071044921875, 4.2159423828125, 4.39117431640625, 4.56640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 17.0, 19.0, 25.0, 30.0, 49.0, 64.0, 98.0, 141.0, 189.0, 291.0, 477.0, 781.0, 1163.0, 2298.0, 4710.0, 10853.0, 28287.0, 82059.0, 233443.0, 371901.0, 200222.0, 68658.0, 24177.0, 9285.0, 4041.0, 2097.0, 1101.0, 690.0, 436.0, 312.0, 189.0, 126.0, 83.0, 56.0, 44.0, 35.0, 19.0, 26.0, 17.0, 10.0, 9.0, 5.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8828125, -10.5250244140625, -10.167236328125, -9.8094482421875, -9.45166015625, -9.0938720703125, -8.736083984375, -8.3782958984375, -8.0205078125, -7.6627197265625, -7.304931640625, -6.9471435546875, -6.58935546875, -6.2315673828125, -5.873779296875, -5.5159912109375, -5.158203125, -4.8004150390625, -4.442626953125, -4.0848388671875, -3.72705078125, -3.3692626953125, -3.011474609375, -2.6536865234375, -2.2958984375, -1.9381103515625, -1.580322265625, -1.2225341796875, -0.86474609375, -0.5069580078125, -0.149169921875, 0.2086181640625, 0.56640625, 0.9241943359375, 1.281982421875, 1.6397705078125, 1.99755859375, 2.3553466796875, 2.713134765625, 3.0709228515625, 3.4287109375, 3.7864990234375, 4.144287109375, 4.5020751953125, 4.85986328125, 5.2176513671875, 5.575439453125, 5.9332275390625, 6.291015625, 6.6488037109375, 7.006591796875, 7.3643798828125, 7.72216796875, 8.0799560546875, 8.437744140625, 8.7955322265625, 9.1533203125, 9.5111083984375, 9.868896484375, 10.2266845703125, 10.58447265625, 10.9422607421875, 11.300048828125, 11.6578369140625, 12.015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 6.0, 5.0, 7.0, 11.0, 11.0, 15.0, 17.0, 20.0, 17.0, 28.0, 32.0, 34.0, 32.0, 43.0, 44.0, 40.0, 40.0, 47.0, 67.0, 46.0, 56.0, 35.0, 30.0, 48.0, 42.0, 39.0, 33.0, 26.0, 16.0, 23.0, 15.0, 19.0, 15.0, 10.0, 7.0, 8.0, 8.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0], "bins": [-15.03125, -14.63818359375, -14.2451171875, -13.85205078125, -13.458984375, -13.06591796875, -12.6728515625, -12.27978515625, -11.88671875, -11.49365234375, -11.1005859375, -10.70751953125, -10.314453125, -9.92138671875, -9.5283203125, -9.13525390625, -8.7421875, -8.34912109375, -7.9560546875, -7.56298828125, -7.169921875, -6.77685546875, -6.3837890625, -5.99072265625, -5.59765625, -5.20458984375, -4.8115234375, -4.41845703125, -4.025390625, -3.63232421875, -3.2392578125, -2.84619140625, -2.453125, -2.06005859375, -1.6669921875, -1.27392578125, -0.880859375, -0.48779296875, -0.0947265625, 0.29833984375, 0.69140625, 1.08447265625, 1.4775390625, 1.87060546875, 2.263671875, 2.65673828125, 3.0498046875, 3.44287109375, 3.8359375, 4.22900390625, 4.6220703125, 5.01513671875, 5.408203125, 5.80126953125, 6.1943359375, 6.58740234375, 6.98046875, 7.37353515625, 7.7666015625, 8.15966796875, 8.552734375, 8.94580078125, 9.3388671875, 9.73193359375, 10.125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 8.0, 3.0, 9.0, 20.0, 16.0, 37.0, 47.0, 86.0, 218.0, 443.0, 1093.0, 3711.0, 16504.0, 143202.0, 713524.0, 147014.0, 16933.0, 3654.0, 1159.0, 422.0, 210.0, 89.0, 46.0, 27.0, 23.0, 22.0, 10.0, 6.0, 5.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.25, -9.86328125, -9.4765625, -9.08984375, -8.703125, -8.31640625, -7.9296875, -7.54296875, -7.15625, -6.76953125, -6.3828125, -5.99609375, -5.609375, -5.22265625, -4.8359375, -4.44921875, -4.0625, -3.67578125, -3.2890625, -2.90234375, -2.515625, -2.12890625, -1.7421875, -1.35546875, -0.96875, -0.58203125, -0.1953125, 0.19140625, 0.578125, 0.96484375, 1.3515625, 1.73828125, 2.125, 2.51171875, 2.8984375, 3.28515625, 3.671875, 4.05859375, 4.4453125, 4.83203125, 5.21875, 5.60546875, 5.9921875, 6.37890625, 6.765625, 7.15234375, 7.5390625, 7.92578125, 8.3125, 8.69921875, 9.0859375, 9.47265625, 9.859375, 10.24609375, 10.6328125, 11.01953125, 11.40625, 11.79296875, 12.1796875, 12.56640625, 12.953125, 13.33984375, 13.7265625, 14.11328125, 14.5]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 8.0, 11.0, 18.0, 29.0, 29.0, 40.0, 46.0, 58.0, 74.0, 83.0, 121.0, 91.0, 68.0, 49.0, 59.0, 43.0, 35.0, 27.0, 23.0, 15.0, 15.0, 11.0, 6.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009284019470214844, -0.0008950904011726379, -0.0008617788553237915, -0.0008284673094749451, -0.0007951557636260986, -0.0007618442177772522, -0.0007285326719284058, -0.0006952211260795593, -0.0006619095802307129, -0.0006285980343818665, -0.00059528648853302, -0.0005619749426841736, -0.0005286633968353271, -0.0004953518509864807, -0.0004620403051376343, -0.00042872875928878784, -0.0003954172134399414, -0.00036210566759109497, -0.00032879412174224854, -0.0002954825758934021, -0.00026217103004455566, -0.00022885948419570923, -0.0001955479383468628, -0.00016223639249801636, -0.00012892484664916992, -9.561330080032349e-05, -6.230175495147705e-05, -2.8990209102630615e-05, 4.32133674621582e-06, 3.7632882595062256e-05, 7.094442844390869e-05, 0.00010425597429275513, 0.00013756752014160156, 0.000170879065990448, 0.00020419061183929443, 0.00023750215768814087, 0.0002708137035369873, 0.00030412524938583374, 0.0003374367952346802, 0.0003707483410835266, 0.00040405988693237305, 0.0004373714327812195, 0.0004706829786300659, 0.0005039945244789124, 0.0005373060703277588, 0.0005706176161766052, 0.0006039291620254517, 0.0006372407078742981, 0.0006705522537231445, 0.000703863799571991, 0.0007371753454208374, 0.0007704868912696838, 0.0008037984371185303, 0.0008371099829673767, 0.0008704215288162231, 0.0009037330746650696, 0.000937044620513916, 0.0009703561663627625, 0.0010036677122116089, 0.0010369792580604553, 0.0010702908039093018, 0.0011036023497581482, 0.0011369138956069946, 0.001170225441455841, 0.0012035369873046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 18.0, 22.0, 32.0, 42.0, 91.0, 153.0, 265.0, 488.0, 1142.0, 3395.0, 13838.0, 140868.0, 791824.0, 81498.0, 10178.0, 2691.0, 1003.0, 444.0, 225.0, 116.0, 82.0, 36.0, 20.0, 25.0, 14.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.8125, -16.293701171875, -15.77490234375, -15.256103515625, -14.7373046875, -14.218505859375, -13.69970703125, -13.180908203125, -12.662109375, -12.143310546875, -11.62451171875, -11.105712890625, -10.5869140625, -10.068115234375, -9.54931640625, -9.030517578125, -8.51171875, -7.992919921875, -7.47412109375, -6.955322265625, -6.4365234375, -5.917724609375, -5.39892578125, -4.880126953125, -4.361328125, -3.842529296875, -3.32373046875, -2.804931640625, -2.2861328125, -1.767333984375, -1.24853515625, -0.729736328125, -0.2109375, 0.307861328125, 0.82666015625, 1.345458984375, 1.8642578125, 2.383056640625, 2.90185546875, 3.420654296875, 3.939453125, 4.458251953125, 4.97705078125, 5.495849609375, 6.0146484375, 6.533447265625, 7.05224609375, 7.571044921875, 8.08984375, 8.608642578125, 9.12744140625, 9.646240234375, 10.1650390625, 10.683837890625, 11.20263671875, 11.721435546875, 12.240234375, 12.759033203125, 13.27783203125, 13.796630859375, 14.3154296875, 14.834228515625, 15.35302734375, 15.871826171875, 16.390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 12.0, 20.0, 32.0, 40.0, 83.0, 88.0, 148.0, 173.0, 115.0, 97.0, 68.0, 44.0, 18.0, 20.0, 10.0, 8.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7890625, -11.4737548828125, -11.158447265625, -10.8431396484375, -10.52783203125, -10.2125244140625, -9.897216796875, -9.5819091796875, -9.2666015625, -8.9512939453125, -8.635986328125, -8.3206787109375, -8.00537109375, -7.6900634765625, -7.374755859375, -7.0594482421875, -6.744140625, -6.4288330078125, -6.113525390625, -5.7982177734375, -5.48291015625, -5.1676025390625, -4.852294921875, -4.5369873046875, -4.2216796875, -3.9063720703125, -3.591064453125, -3.2757568359375, -2.96044921875, -2.6451416015625, -2.329833984375, -2.0145263671875, -1.69921875, -1.3839111328125, -1.068603515625, -0.7532958984375, -0.43798828125, -0.1226806640625, 0.192626953125, 0.5079345703125, 0.8232421875, 1.1385498046875, 1.453857421875, 1.7691650390625, 2.08447265625, 2.3997802734375, 2.715087890625, 3.0303955078125, 3.345703125, 3.6610107421875, 3.976318359375, 4.2916259765625, 4.60693359375, 4.9222412109375, 5.237548828125, 5.5528564453125, 5.8681640625, 6.1834716796875, 6.498779296875, 6.8140869140625, 7.12939453125, 7.4447021484375, 7.760009765625, 8.0753173828125, 8.390625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 13.0, 32.0, 67.0, 132.0, 222.0, 217.0, 165.0, 78.0, 38.0, 17.0, 9.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.25121307373047, -106.89424133300781, -101.53726959228516, -96.1802978515625, -90.82333374023438, -85.46635437011719, -80.10939025878906, -74.7524185180664, -69.39544677734375, -64.0384750366211, -58.68150329589844, -53.32453536987305, -47.96756362915039, -42.610591888427734, -37.253623962402344, -31.896652221679688, -26.53968048095703, -21.182708740234375, -15.825738906860352, -10.468769073486328, -5.111797332763672, 0.24517440795898438, 5.602142333984375, 10.959114074707031, 16.316085815429688, 21.673057556152344, 27.030027389526367, 32.38699722290039, 37.74396896362305, 43.1009407043457, 48.457908630371094, 53.81488037109375, 59.17185974121094, 64.5288314819336, 69.88580322265625, 75.24276733398438, 80.59974670410156, 85.95671081542969, 91.31368255615234, 96.670654296875, 102.02762603759766, 107.38459777832031, 112.74156951904297, 118.09854125976562, 123.45550537109375, 128.81248474121094, 134.16944885253906, 139.52642822265625, 144.88339233398438, 150.2403564453125, 155.5973358154297, 160.9542999267578, 166.311279296875, 171.66824340820312, 177.02520751953125, 182.38218688964844, 187.73916625976562, 193.09613037109375, 198.45310974121094, 203.81007385253906, 209.16705322265625, 214.52401733398438, 219.8809814453125, 225.2379608154297, 230.5949249267578]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 5.0, 9.0, 21.0, 12.0, 15.0, 18.0, 31.0, 35.0, 33.0, 33.0, 44.0, 57.0, 55.0, 63.0, 57.0, 58.0, 48.0, 61.0, 49.0, 57.0, 39.0, 47.0, 33.0, 21.0, 23.0, 10.0, 13.0, 8.0, 11.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-108.58840942382812, -105.73151397705078, -102.87461853027344, -100.01771545410156, -97.16082000732422, -94.30392456054688, -91.44702911376953, -88.59013366699219, -85.73323059082031, -82.87633514404297, -80.01943969726562, -77.16253662109375, -74.3056411743164, -71.44874572753906, -68.59185028076172, -65.73495483398438, -62.87805938720703, -60.02116394042969, -57.16426467895508, -54.307369232177734, -51.450469970703125, -48.59357452392578, -45.73667907714844, -42.879783630371094, -40.022884368896484, -37.16598892211914, -34.30908966064453, -31.452194213867188, -28.59529685974121, -25.738399505615234, -22.88150405883789, -20.024606704711914, -17.167709350585938, -14.310811996459961, -11.4539155960083, -8.59701919555664, -5.740121841430664, -2.8832244873046875, -0.02632904052734375, 2.830568313598633, 5.687465667724609, 8.544363021850586, 11.401259422302246, 14.258155822753906, 17.115053176879883, 19.97195053100586, 22.828845977783203, 25.68574333190918, 28.542640686035156, 31.399538040161133, 34.25643539428711, 37.11333084106445, 39.97023010253906, 42.827125549316406, 45.68402099609375, 48.540916442871094, 51.3978157043457, 54.25471115112305, 57.111610412597656, 59.968505859375, 62.825401306152344, 65.68229675292969, 68.53919982910156, 71.3960952758789, 74.25299072265625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 6.0, 7.0, 15.0, 22.0, 33.0, 36.0, 73.0, 82.0, 136.0, 228.0, 416.0, 971.0, 2437.0, 8847.0, 53099.0, 3653320.0, 442511.0, 23777.0, 5298.0, 1690.0, 644.0, 277.0, 139.0, 76.0, 49.0, 32.0, 19.0, 9.0, 8.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.15625, -46.0283203125, -44.900390625, -43.7724609375, -42.64453125, -41.5166015625, -40.388671875, -39.2607421875, -38.1328125, -37.0048828125, -35.876953125, -34.7490234375, -33.62109375, -32.4931640625, -31.365234375, -30.2373046875, -29.109375, -27.9814453125, -26.853515625, -25.7255859375, -24.59765625, -23.4697265625, -22.341796875, -21.2138671875, -20.0859375, -18.9580078125, -17.830078125, -16.7021484375, -15.57421875, -14.4462890625, -13.318359375, -12.1904296875, -11.0625, -9.9345703125, -8.806640625, -7.6787109375, -6.55078125, -5.4228515625, -4.294921875, -3.1669921875, -2.0390625, -0.9111328125, 0.216796875, 1.3447265625, 2.47265625, 3.6005859375, 4.728515625, 5.8564453125, 6.984375, 8.1123046875, 9.240234375, 10.3681640625, 11.49609375, 12.6240234375, 13.751953125, 14.8798828125, 16.0078125, 17.1357421875, 18.263671875, 19.3916015625, 20.51953125, 21.6474609375, 22.775390625, 23.9033203125, 25.03125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 18.0, 19.0, 35.0, 57.0, 89.0, 121.0, 108.0, 132.0, 118.0, 91.0, 66.0, 66.0, 32.0, 20.0, 15.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.03125, -7.83209228515625, -7.6329345703125, -7.43377685546875, -7.234619140625, -7.03546142578125, -6.8363037109375, -6.63714599609375, -6.43798828125, -6.23883056640625, -6.0396728515625, -5.84051513671875, -5.641357421875, -5.44219970703125, -5.2430419921875, -5.04388427734375, -4.8447265625, -4.64556884765625, -4.4464111328125, -4.24725341796875, -4.048095703125, -3.84893798828125, -3.6497802734375, -3.45062255859375, -3.25146484375, -3.05230712890625, -2.8531494140625, -2.65399169921875, -2.454833984375, -2.25567626953125, -2.0565185546875, -1.85736083984375, -1.658203125, -1.45904541015625, -1.2598876953125, -1.06072998046875, -0.861572265625, -0.66241455078125, -0.4632568359375, -0.26409912109375, -0.06494140625, 0.13421630859375, 0.3333740234375, 0.53253173828125, 0.731689453125, 0.93084716796875, 1.1300048828125, 1.32916259765625, 1.5283203125, 1.72747802734375, 1.9266357421875, 2.12579345703125, 2.324951171875, 2.52410888671875, 2.7232666015625, 2.92242431640625, 3.12158203125, 3.32073974609375, 3.5198974609375, 3.71905517578125, 3.918212890625, 4.11737060546875, 4.3165283203125, 4.51568603515625, 4.71484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 5.0, 9.0, 14.0, 18.0, 28.0, 39.0, 43.0, 54.0, 89.0, 131.0, 189.0, 295.0, 402.0, 697.0, 1320.0, 2322.0, 4426.0, 10379.0, 42860.0, 1188380.0, 2864170.0, 57320.0, 11411.0, 4398.0, 2170.0, 1186.0, 678.0, 426.0, 215.0, 150.0, 113.0, 91.0, 70.0, 51.0, 25.0, 24.0, 14.0, 12.0, 14.0, 6.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.515625, -24.694580078125, -23.87353515625, -23.052490234375, -22.2314453125, -21.410400390625, -20.58935546875, -19.768310546875, -18.947265625, -18.126220703125, -17.30517578125, -16.484130859375, -15.6630859375, -14.842041015625, -14.02099609375, -13.199951171875, -12.37890625, -11.557861328125, -10.73681640625, -9.915771484375, -9.0947265625, -8.273681640625, -7.45263671875, -6.631591796875, -5.810546875, -4.989501953125, -4.16845703125, -3.347412109375, -2.5263671875, -1.705322265625, -0.88427734375, -0.063232421875, 0.7578125, 1.578857421875, 2.39990234375, 3.220947265625, 4.0419921875, 4.863037109375, 5.68408203125, 6.505126953125, 7.326171875, 8.147216796875, 8.96826171875, 9.789306640625, 10.6103515625, 11.431396484375, 12.25244140625, 13.073486328125, 13.89453125, 14.715576171875, 15.53662109375, 16.357666015625, 17.1787109375, 17.999755859375, 18.82080078125, 19.641845703125, 20.462890625, 21.283935546875, 22.10498046875, 22.926025390625, 23.7470703125, 24.568115234375, 25.38916015625, 26.210205078125, 27.03125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 4.0, 12.0, 9.0, 10.0, 20.0, 24.0, 46.0, 90.0, 154.0, 362.0, 1071.0, 1351.0, 471.0, 189.0, 103.0, 54.0, 24.0, 16.0, 11.0, 11.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.3914794921875, -10.111083984375, -9.8306884765625, -9.55029296875, -9.2698974609375, -8.989501953125, -8.7091064453125, -8.4287109375, -8.1483154296875, -7.867919921875, -7.5875244140625, -7.30712890625, -7.0267333984375, -6.746337890625, -6.4659423828125, -6.185546875, -5.9051513671875, -5.624755859375, -5.3443603515625, -5.06396484375, -4.7835693359375, -4.503173828125, -4.2227783203125, -3.9423828125, -3.6619873046875, -3.381591796875, -3.1011962890625, -2.82080078125, -2.5404052734375, -2.260009765625, -1.9796142578125, -1.69921875, -1.4188232421875, -1.138427734375, -0.8580322265625, -0.57763671875, -0.2972412109375, -0.016845703125, 0.2635498046875, 0.5439453125, 0.8243408203125, 1.104736328125, 1.3851318359375, 1.66552734375, 1.9459228515625, 2.226318359375, 2.5067138671875, 2.787109375, 3.0675048828125, 3.347900390625, 3.6282958984375, 3.90869140625, 4.1890869140625, 4.469482421875, 4.7498779296875, 5.0302734375, 5.3106689453125, 5.591064453125, 5.8714599609375, 6.15185546875, 6.4322509765625, 6.712646484375, 6.9930419921875, 7.2734375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 3.0, 11.0, 27.0, 43.0, 76.0, 130.0, 172.0, 176.0, 146.0, 88.0, 58.0, 28.0, 13.0, 4.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-69.06864166259766, -66.82907104492188, -64.58950805664062, -62.349937438964844, -60.11037063598633, -57.87080383300781, -55.6312370300293, -53.39167022705078, -51.152099609375, -48.912532806396484, -46.67296600341797, -44.43339538574219, -42.19382858276367, -39.954261779785156, -37.71469497680664, -35.475128173828125, -33.23556137084961, -30.995994567871094, -28.756425857543945, -26.51685905456543, -24.27729034423828, -22.037723541259766, -19.79815673828125, -17.558589935302734, -15.319021224975586, -13.079453468322754, -10.839885711669922, -8.600318908691406, -6.360751152038574, -4.121183395385742, -1.8816165924072266, 0.35795116424560547, 2.5975189208984375, 4.8370866775512695, 7.076653957366943, 9.316221237182617, 11.55578899383545, 13.795356750488281, 16.034923553466797, 18.274490356445312, 20.51405906677246, 22.753625869750977, 24.993194580078125, 27.23276138305664, 29.472328186035156, 31.711896896362305, 33.95146179199219, 36.19103240966797, 38.430599212646484, 40.670166015625, 42.909732818603516, 45.14929962158203, 47.38887023925781, 49.62843704223633, 51.868003845214844, 54.10757064819336, 56.347137451171875, 58.58670425415039, 60.826271057128906, 63.06584167480469, 65.30540466308594, 67.54497528076172, 69.7845458984375, 72.02410888671875, 74.26367950439453]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 11.0, 23.0, 16.0, 20.0, 31.0, 46.0, 41.0, 67.0, 64.0, 73.0, 66.0, 98.0, 94.0, 73.0, 78.0, 49.0, 41.0, 33.0, 27.0, 12.0, 9.0, 10.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.14438247680664, -42.574703216552734, -41.00502395629883, -39.43534469604492, -37.865665435791016, -36.29598617553711, -34.7263069152832, -33.1566276550293, -31.58694839477539, -30.017269134521484, -28.447589874267578, -26.877910614013672, -25.308231353759766, -23.73855209350586, -22.168872833251953, -20.599193572998047, -19.02951431274414, -17.459835052490234, -15.890155792236328, -14.320476531982422, -12.750797271728516, -11.18111801147461, -9.611438751220703, -8.041759490966797, -6.472080230712891, -4.902400970458984, -3.332721710205078, -1.7630424499511719, -0.19336318969726562, 1.3763160705566406, 2.945995330810547, 4.515674591064453, 6.085350036621094, 7.655029296875, 9.224708557128906, 10.794387817382812, 12.364067077636719, 13.933746337890625, 15.503425598144531, 17.073104858398438, 18.642784118652344, 20.21246337890625, 21.782142639160156, 23.351821899414062, 24.92150115966797, 26.491180419921875, 28.06085968017578, 29.630538940429688, 31.200218200683594, 32.7698974609375, 34.339576721191406, 35.90925598144531, 37.47893524169922, 39.048614501953125, 40.61829376220703, 42.18797302246094, 43.757652282714844, 45.32733154296875, 46.897010803222656, 48.46669006347656, 50.03636932373047, 51.606048583984375, 53.17572784423828, 54.74540710449219, 56.315086364746094]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 11.0, 10.0, 15.0, 13.0, 20.0, 33.0, 50.0, 75.0, 116.0, 163.0, 254.0, 420.0, 729.0, 1359.0, 3006.0, 8548.0, 32615.0, 156084.0, 535333.0, 241065.0, 48947.0, 11900.0, 3967.0, 1620.0, 804.0, 509.0, 304.0, 174.0, 119.0, 86.0, 58.0, 44.0, 23.0, 25.0, 16.0, 14.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.75, -19.060302734375, -18.37060546875, -17.680908203125, -16.9912109375, -16.301513671875, -15.61181640625, -14.922119140625, -14.232421875, -13.542724609375, -12.85302734375, -12.163330078125, -11.4736328125, -10.783935546875, -10.09423828125, -9.404541015625, -8.71484375, -8.025146484375, -7.33544921875, -6.645751953125, -5.9560546875, -5.266357421875, -4.57666015625, -3.886962890625, -3.197265625, -2.507568359375, -1.81787109375, -1.128173828125, -0.4384765625, 0.251220703125, 0.94091796875, 1.630615234375, 2.3203125, 3.010009765625, 3.69970703125, 4.389404296875, 5.0791015625, 5.768798828125, 6.45849609375, 7.148193359375, 7.837890625, 8.527587890625, 9.21728515625, 9.906982421875, 10.5966796875, 11.286376953125, 11.97607421875, 12.665771484375, 13.35546875, 14.045166015625, 14.73486328125, 15.424560546875, 16.1142578125, 16.803955078125, 17.49365234375, 18.183349609375, 18.873046875, 19.562744140625, 20.25244140625, 20.942138671875, 21.6318359375, 22.321533203125, 23.01123046875, 23.700927734375, 24.390625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 19.0, 31.0, 53.0, 80.0, 121.0, 149.0, 149.0, 129.0, 97.0, 77.0, 49.0, 26.0, 8.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.17242431640625, -8.9385986328125, -8.70477294921875, -8.470947265625, -8.23712158203125, -8.0032958984375, -7.76947021484375, -7.53564453125, -7.30181884765625, -7.0679931640625, -6.83416748046875, -6.600341796875, -6.36651611328125, -6.1326904296875, -5.89886474609375, -5.6650390625, -5.43121337890625, -5.1973876953125, -4.96356201171875, -4.729736328125, -4.49591064453125, -4.2620849609375, -4.02825927734375, -3.79443359375, -3.56060791015625, -3.3267822265625, -3.09295654296875, -2.859130859375, -2.62530517578125, -2.3914794921875, -2.15765380859375, -1.923828125, -1.69000244140625, -1.4561767578125, -1.22235107421875, -0.988525390625, -0.75469970703125, -0.5208740234375, -0.28704833984375, -0.05322265625, 0.18060302734375, 0.4144287109375, 0.64825439453125, 0.882080078125, 1.11590576171875, 1.3497314453125, 1.58355712890625, 1.8173828125, 2.05120849609375, 2.2850341796875, 2.51885986328125, 2.752685546875, 2.98651123046875, 3.2203369140625, 3.45416259765625, 3.68798828125, 3.92181396484375, 4.1556396484375, 4.38946533203125, 4.623291015625, 4.85711669921875, 5.0909423828125, 5.32476806640625, 5.55859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 9.0, 4.0, 14.0, 13.0, 28.0, 33.0, 42.0, 69.0, 86.0, 140.0, 200.0, 231.0, 319.0, 527.0, 881.0, 1485.0, 2790.0, 5470.0, 11487.0, 25108.0, 56992.0, 128784.0, 256135.0, 280411.0, 151979.0, 67829.0, 29727.0, 13609.0, 6399.0, 3178.0, 1675.0, 1035.0, 591.0, 395.0, 254.0, 165.0, 127.0, 97.0, 56.0, 53.0, 42.0, 23.0, 20.0, 11.0, 11.0, 7.0, 7.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.1796875, -7.9249267578125, -7.670166015625, -7.4154052734375, -7.16064453125, -6.9058837890625, -6.651123046875, -6.3963623046875, -6.1416015625, -5.8868408203125, -5.632080078125, -5.3773193359375, -5.12255859375, -4.8677978515625, -4.613037109375, -4.3582763671875, -4.103515625, -3.8487548828125, -3.593994140625, -3.3392333984375, -3.08447265625, -2.8297119140625, -2.574951171875, -2.3201904296875, -2.0654296875, -1.8106689453125, -1.555908203125, -1.3011474609375, -1.04638671875, -0.7916259765625, -0.536865234375, -0.2821044921875, -0.02734375, 0.2274169921875, 0.482177734375, 0.7369384765625, 0.99169921875, 1.2464599609375, 1.501220703125, 1.7559814453125, 2.0107421875, 2.2655029296875, 2.520263671875, 2.7750244140625, 3.02978515625, 3.2845458984375, 3.539306640625, 3.7940673828125, 4.048828125, 4.3035888671875, 4.558349609375, 4.8131103515625, 5.06787109375, 5.3226318359375, 5.577392578125, 5.8321533203125, 6.0869140625, 6.3416748046875, 6.596435546875, 6.8511962890625, 7.10595703125, 7.3607177734375, 7.615478515625, 7.8702392578125, 8.125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 9.0, 10.0, 15.0, 15.0, 15.0, 22.0, 20.0, 28.0, 29.0, 30.0, 24.0, 53.0, 34.0, 38.0, 45.0, 48.0, 36.0, 52.0, 40.0, 50.0, 39.0, 43.0, 29.0, 38.0, 42.0, 28.0, 32.0, 21.0, 15.0, 17.0, 14.0, 9.0, 12.0, 12.0, 7.0, 1.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.4056396484375, -9.069091796875, -8.7325439453125, -8.39599609375, -8.0594482421875, -7.722900390625, -7.3863525390625, -7.0498046875, -6.7132568359375, -6.376708984375, -6.0401611328125, -5.70361328125, -5.3670654296875, -5.030517578125, -4.6939697265625, -4.357421875, -4.0208740234375, -3.684326171875, -3.3477783203125, -3.01123046875, -2.6746826171875, -2.338134765625, -2.0015869140625, -1.6650390625, -1.3284912109375, -0.991943359375, -0.6553955078125, -0.31884765625, 0.0177001953125, 0.354248046875, 0.6907958984375, 1.02734375, 1.3638916015625, 1.700439453125, 2.0369873046875, 2.37353515625, 2.7100830078125, 3.046630859375, 3.3831787109375, 3.7197265625, 4.0562744140625, 4.392822265625, 4.7293701171875, 5.06591796875, 5.4024658203125, 5.739013671875, 6.0755615234375, 6.412109375, 6.7486572265625, 7.085205078125, 7.4217529296875, 7.75830078125, 8.0948486328125, 8.431396484375, 8.7679443359375, 9.1044921875, 9.4410400390625, 9.777587890625, 10.1141357421875, 10.45068359375, 10.7872314453125, 11.123779296875, 11.4603271484375, 11.796875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 6.0, 10.0, 8.0, 17.0, 20.0, 40.0, 46.0, 81.0, 185.0, 386.0, 964.0, 2911.0, 11630.0, 200159.0, 788751.0, 35351.0, 5197.0, 1598.0, 595.0, 257.0, 132.0, 65.0, 33.0, 21.0, 17.0, 13.0, 12.0, 11.0, 9.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.765869140625, -16.17236328125, -15.578857421875, -14.9853515625, -14.391845703125, -13.79833984375, -13.204833984375, -12.611328125, -12.017822265625, -11.42431640625, -10.830810546875, -10.2373046875, -9.643798828125, -9.05029296875, -8.456787109375, -7.86328125, -7.269775390625, -6.67626953125, -6.082763671875, -5.4892578125, -4.895751953125, -4.30224609375, -3.708740234375, -3.115234375, -2.521728515625, -1.92822265625, -1.334716796875, -0.7412109375, -0.147705078125, 0.44580078125, 1.039306640625, 1.6328125, 2.226318359375, 2.81982421875, 3.413330078125, 4.0068359375, 4.600341796875, 5.19384765625, 5.787353515625, 6.380859375, 6.974365234375, 7.56787109375, 8.161376953125, 8.7548828125, 9.348388671875, 9.94189453125, 10.535400390625, 11.12890625, 11.722412109375, 12.31591796875, 12.909423828125, 13.5029296875, 14.096435546875, 14.68994140625, 15.283447265625, 15.876953125, 16.470458984375, 17.06396484375, 17.657470703125, 18.2509765625, 18.844482421875, 19.43798828125, 20.031494140625, 20.625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 10.0, 4.0, 6.0, 9.0, 9.0, 10.0, 20.0, 16.0, 15.0, 21.0, 29.0, 30.0, 51.0, 45.0, 63.0, 76.0, 74.0, 86.0, 72.0, 65.0, 51.0, 36.0, 34.0, 28.0, 18.0, 22.0, 20.0, 20.0, 10.0, 6.0, 7.0, 7.0, 6.0, 10.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007061958312988281, -0.0006860792636871338, -0.0006659626960754395, -0.0006458461284637451, -0.0006257295608520508, -0.0006056129932403564, -0.0005854964256286621, -0.0005653798580169678, -0.0005452632904052734, -0.0005251467227935791, -0.0005050301551818848, -0.00048491358757019043, -0.0004647970199584961, -0.00044468045234680176, -0.0004245638847351074, -0.0004044473171234131, -0.00038433074951171875, -0.0003642141819000244, -0.0003440976142883301, -0.00032398104667663574, -0.0003038644790649414, -0.00028374791145324707, -0.00026363134384155273, -0.0002435147762298584, -0.00022339820861816406, -0.00020328164100646973, -0.0001831650733947754, -0.00016304850578308105, -0.00014293193817138672, -0.00012281537055969238, -0.00010269880294799805, -8.258223533630371e-05, -6.246566772460938e-05, -4.234910011291504e-05, -2.2232532501220703e-05, -2.115964889526367e-06, 1.800060272216797e-05, 3.8117170333862305e-05, 5.823373794555664e-05, 7.835030555725098e-05, 9.846687316894531e-05, 0.00011858344078063965, 0.00013870000839233398, 0.00015881657600402832, 0.00017893314361572266, 0.000199049711227417, 0.00021916627883911133, 0.00023928284645080566, 0.0002593994140625, 0.00027951598167419434, 0.00029963254928588867, 0.000319749116897583, 0.00033986568450927734, 0.0003599822521209717, 0.000380098819732666, 0.00040021538734436035, 0.0004203319549560547, 0.000440448522567749, 0.00046056509017944336, 0.0004806816577911377, 0.000500798225402832, 0.0005209147930145264, 0.0005410313606262207, 0.000561147928237915, 0.0005812644958496094]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 7.0, 2.0, 8.0, 3.0, 5.0, 8.0, 19.0, 23.0, 28.0, 65.0, 100.0, 175.0, 261.0, 530.0, 1124.0, 2493.0, 7040.0, 58177.0, 888090.0, 77634.0, 7789.0, 2542.0, 1151.0, 590.0, 295.0, 160.0, 83.0, 65.0, 36.0, 19.0, 14.0, 3.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.265625, -22.592041015625, -21.91845703125, -21.244873046875, -20.5712890625, -19.897705078125, -19.22412109375, -18.550537109375, -17.876953125, -17.203369140625, -16.52978515625, -15.856201171875, -15.1826171875, -14.509033203125, -13.83544921875, -13.161865234375, -12.48828125, -11.814697265625, -11.14111328125, -10.467529296875, -9.7939453125, -9.120361328125, -8.44677734375, -7.773193359375, -7.099609375, -6.426025390625, -5.75244140625, -5.078857421875, -4.4052734375, -3.731689453125, -3.05810546875, -2.384521484375, -1.7109375, -1.037353515625, -0.36376953125, 0.309814453125, 0.9833984375, 1.656982421875, 2.33056640625, 3.004150390625, 3.677734375, 4.351318359375, 5.02490234375, 5.698486328125, 6.3720703125, 7.045654296875, 7.71923828125, 8.392822265625, 9.06640625, 9.739990234375, 10.41357421875, 11.087158203125, 11.7607421875, 12.434326171875, 13.10791015625, 13.781494140625, 14.455078125, 15.128662109375, 15.80224609375, 16.475830078125, 17.1494140625, 17.822998046875, 18.49658203125, 19.170166015625, 19.84375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 7.0, 5.0, 16.0, 27.0, 30.0, 52.0, 76.0, 122.0, 131.0, 153.0, 109.0, 87.0, 52.0, 37.0, 22.0, 22.0, 9.0, 7.0, 8.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.49346923828125, -6.2330322265625, -5.97259521484375, -5.712158203125, -5.45172119140625, -5.1912841796875, -4.93084716796875, -4.67041015625, -4.40997314453125, -4.1495361328125, -3.88909912109375, -3.628662109375, -3.36822509765625, -3.1077880859375, -2.84735107421875, -2.5869140625, -2.32647705078125, -2.0660400390625, -1.80560302734375, -1.545166015625, -1.28472900390625, -1.0242919921875, -0.76385498046875, -0.50341796875, -0.24298095703125, 0.0174560546875, 0.27789306640625, 0.538330078125, 0.79876708984375, 1.0592041015625, 1.31964111328125, 1.580078125, 1.84051513671875, 2.1009521484375, 2.36138916015625, 2.621826171875, 2.88226318359375, 3.1427001953125, 3.40313720703125, 3.66357421875, 3.92401123046875, 4.1844482421875, 4.44488525390625, 4.705322265625, 4.96575927734375, 5.2261962890625, 5.48663330078125, 5.7470703125, 6.00750732421875, 6.2679443359375, 6.52838134765625, 6.788818359375, 7.04925537109375, 7.3096923828125, 7.57012939453125, 7.83056640625, 8.09100341796875, 8.3514404296875, 8.61187744140625, 8.872314453125, 9.13275146484375, 9.3931884765625, 9.65362548828125, 9.9140625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 29.0, 49.0, 126.0, 171.0, 203.0, 158.0, 111.0, 63.0, 37.0, 16.0, 11.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.88243103027344, -152.56039428710938, -148.2383575439453, -143.91632080078125, -139.5942840576172, -135.27224731445312, -130.95021057128906, -126.628173828125, -122.30613708496094, -117.98410034179688, -113.66206359863281, -109.34002685546875, -105.01799011230469, -100.69595336914062, -96.37391662597656, -92.0518798828125, -87.7298355102539, -83.40779876708984, -79.08576202392578, -74.76372528076172, -70.44168853759766, -66.1196517944336, -61.797611236572266, -57.4755744934082, -53.15353775024414, -48.83150100708008, -44.509464263916016, -40.18742370605469, -35.865386962890625, -31.543352127075195, -27.2213134765625, -22.899276733398438, -18.577239990234375, -14.255203247070312, -9.933165550231934, -5.611127853393555, -1.2890911102294922, 3.0329456329345703, 7.354984283447266, 11.677021026611328, 15.99905776977539, 20.321094512939453, 24.643131256103516, 28.96516990661621, 33.287208557128906, 37.60924530029297, 41.93128204345703, 46.253318786621094, 50.575355529785156, 54.89739227294922, 59.21942901611328, 63.541465759277344, 67.8635025024414, 72.18553924560547, 76.50758361816406, 80.82962036132812, 85.15165710449219, 89.47369384765625, 93.79573059082031, 98.11776733398438, 102.43980407714844, 106.7618408203125, 111.08387756347656, 115.40591430664062, 119.72795104980469]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 13.0, 18.0, 12.0, 16.0, 25.0, 19.0, 39.0, 36.0, 38.0, 41.0, 52.0, 44.0, 57.0, 41.0, 62.0, 53.0, 53.0, 43.0, 46.0, 42.0, 44.0, 37.0, 38.0, 12.0, 18.0, 18.0, 17.0, 16.0, 3.0, 10.0, 6.0, 3.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-82.38967895507812, -80.09929656982422, -77.80890655517578, -75.51852416992188, -73.22814178466797, -70.93775939941406, -68.64736938476562, -66.35698699951172, -64.06660461425781, -61.77621841430664, -59.485836029052734, -57.19544982910156, -54.905067443847656, -52.614681243896484, -50.32429504394531, -48.033912658691406, -45.743526458740234, -43.45314025878906, -41.162757873535156, -38.872371673583984, -36.58198928833008, -34.291603088378906, -32.001220703125, -29.710834503173828, -27.42045021057129, -25.13006591796875, -22.83968162536621, -20.549297332763672, -18.2589111328125, -15.968527793884277, -13.678142547607422, -11.387758255004883, -9.097373962402344, -6.806989669799805, -4.516604900360107, -2.22622013092041, 0.0641641616821289, 2.354548454284668, 4.644933700561523, 6.9353179931640625, 9.225702285766602, 11.51608657836914, 13.80647087097168, 16.09685516357422, 18.38724136352539, 20.677623748779297, 22.96800994873047, 25.258394241333008, 27.548778533935547, 29.839162826538086, 32.129547119140625, 34.4199333190918, 36.7103157043457, 39.000701904296875, 41.29108428955078, 43.58147048950195, 45.871856689453125, 48.1622428894043, 50.4526252746582, 52.743011474609375, 55.03339385986328, 57.32378005981445, 59.614166259765625, 61.90454864501953, 64.19493103027344]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 6.0, 7.0, 9.0, 10.0, 14.0, 20.0, 38.0, 57.0, 85.0, 129.0, 228.0, 420.0, 817.0, 1695.0, 4498.0, 21084.0, 729873.0, 3396686.0, 29679.0, 5280.0, 1842.0, 798.0, 423.0, 225.0, 130.0, 70.0, 32.0, 42.0, 14.0, 12.0, 12.0, 8.0, 9.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-36.71875, -35.672119140625, -34.62548828125, -33.578857421875, -32.5322265625, -31.485595703125, -30.43896484375, -29.392333984375, -28.345703125, -27.299072265625, -26.25244140625, -25.205810546875, -24.1591796875, -23.112548828125, -22.06591796875, -21.019287109375, -19.97265625, -18.926025390625, -17.87939453125, -16.832763671875, -15.7861328125, -14.739501953125, -13.69287109375, -12.646240234375, -11.599609375, -10.552978515625, -9.50634765625, -8.459716796875, -7.4130859375, -6.366455078125, -5.31982421875, -4.273193359375, -3.2265625, -2.179931640625, -1.13330078125, -0.086669921875, 0.9599609375, 2.006591796875, 3.05322265625, 4.099853515625, 5.146484375, 6.193115234375, 7.23974609375, 8.286376953125, 9.3330078125, 10.379638671875, 11.42626953125, 12.472900390625, 13.51953125, 14.566162109375, 15.61279296875, 16.659423828125, 17.7060546875, 18.752685546875, 19.79931640625, 20.845947265625, 21.892578125, 22.939208984375, 23.98583984375, 25.032470703125, 26.0791015625, 27.125732421875, 28.17236328125, 29.218994140625, 30.265625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 9.0, 19.0, 31.0, 57.0, 86.0, 125.0, 119.0, 156.0, 126.0, 101.0, 87.0, 45.0, 23.0, 10.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.99847412109375, -8.7625732421875, -8.52667236328125, -8.290771484375, -8.05487060546875, -7.8189697265625, -7.58306884765625, -7.34716796875, -7.11126708984375, -6.8753662109375, -6.63946533203125, -6.403564453125, -6.16766357421875, -5.9317626953125, -5.69586181640625, -5.4599609375, -5.22406005859375, -4.9881591796875, -4.75225830078125, -4.516357421875, -4.28045654296875, -4.0445556640625, -3.80865478515625, -3.57275390625, -3.33685302734375, -3.1009521484375, -2.86505126953125, -2.629150390625, -2.39324951171875, -2.1573486328125, -1.92144775390625, -1.685546875, -1.44964599609375, -1.2137451171875, -0.97784423828125, -0.741943359375, -0.50604248046875, -0.2701416015625, -0.03424072265625, 0.20166015625, 0.43756103515625, 0.6734619140625, 0.90936279296875, 1.145263671875, 1.38116455078125, 1.6170654296875, 1.85296630859375, 2.0888671875, 2.32476806640625, 2.5606689453125, 2.79656982421875, 3.032470703125, 3.26837158203125, 3.5042724609375, 3.74017333984375, 3.97607421875, 4.21197509765625, 4.4478759765625, 4.68377685546875, 4.919677734375, 5.15557861328125, 5.3914794921875, 5.62738037109375, 5.86328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 7.0, 11.0, 19.0, 31.0, 34.0, 41.0, 32.0, 52.0, 49.0, 84.0, 89.0, 125.0, 256.0, 511.0, 1563.0, 6987.0, 64176.0, 3794713.0, 306076.0, 14865.0, 2782.0, 820.0, 336.0, 180.0, 106.0, 79.0, 63.0, 38.0, 39.0, 35.0, 18.0, 15.0, 10.0, 9.0, 8.0, 4.0, 8.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.8125, -25.992919921875, -25.17333984375, -24.353759765625, -23.5341796875, -22.714599609375, -21.89501953125, -21.075439453125, -20.255859375, -19.436279296875, -18.61669921875, -17.797119140625, -16.9775390625, -16.157958984375, -15.33837890625, -14.518798828125, -13.69921875, -12.879638671875, -12.06005859375, -11.240478515625, -10.4208984375, -9.601318359375, -8.78173828125, -7.962158203125, -7.142578125, -6.322998046875, -5.50341796875, -4.683837890625, -3.8642578125, -3.044677734375, -2.22509765625, -1.405517578125, -0.5859375, 0.233642578125, 1.05322265625, 1.872802734375, 2.6923828125, 3.511962890625, 4.33154296875, 5.151123046875, 5.970703125, 6.790283203125, 7.60986328125, 8.429443359375, 9.2490234375, 10.068603515625, 10.88818359375, 11.707763671875, 12.52734375, 13.346923828125, 14.16650390625, 14.986083984375, 15.8056640625, 16.625244140625, 17.44482421875, 18.264404296875, 19.083984375, 19.903564453125, 20.72314453125, 21.542724609375, 22.3623046875, 23.181884765625, 24.00146484375, 24.821044921875, 25.640625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 9.0, 9.0, 21.0, 35.0, 95.0, 263.0, 1418.0, 1832.0, 260.0, 80.0, 29.0, 14.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.418701171875, -17.04052734375, -16.662353515625, -16.2841796875, -15.906005859375, -15.52783203125, -15.149658203125, -14.771484375, -14.393310546875, -14.01513671875, -13.636962890625, -13.2587890625, -12.880615234375, -12.50244140625, -12.124267578125, -11.74609375, -11.367919921875, -10.98974609375, -10.611572265625, -10.2333984375, -9.855224609375, -9.47705078125, -9.098876953125, -8.720703125, -8.342529296875, -7.96435546875, -7.586181640625, -7.2080078125, -6.829833984375, -6.45166015625, -6.073486328125, -5.6953125, -5.317138671875, -4.93896484375, -4.560791015625, -4.1826171875, -3.804443359375, -3.42626953125, -3.048095703125, -2.669921875, -2.291748046875, -1.91357421875, -1.535400390625, -1.1572265625, -0.779052734375, -0.40087890625, -0.022705078125, 0.35546875, 0.733642578125, 1.11181640625, 1.489990234375, 1.8681640625, 2.246337890625, 2.62451171875, 3.002685546875, 3.380859375, 3.759033203125, 4.13720703125, 4.515380859375, 4.8935546875, 5.271728515625, 5.64990234375, 6.028076171875, 6.40625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 11.0, 23.0, 50.0, 221.0, 399.0, 221.0, 57.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.26002502441406, -138.16558837890625, -135.07115173339844, -131.97669982910156, -128.88226318359375, -125.78782653808594, -122.69338989257812, -119.59895324707031, -116.50450897216797, -113.41007232666016, -110.31562805175781, -107.22119140625, -104.12675476074219, -101.03231048583984, -97.93787384033203, -94.84342956542969, -91.74899291992188, -88.65455627441406, -85.56011199951172, -82.4656753540039, -79.37123107910156, -76.27679443359375, -73.18235778808594, -70.08792114257812, -66.99347686767578, -63.8990364074707, -60.804595947265625, -57.71015930175781, -54.615718841552734, -51.521278381347656, -48.426841735839844, -45.332401275634766, -42.23796081542969, -39.14352035522461, -36.04907989501953, -32.95464324951172, -29.86020278930664, -26.765762329101562, -23.671323776245117, -20.576885223388672, -17.482444763183594, -14.388005256652832, -11.29356575012207, -8.199126243591309, -5.104686737060547, -2.010247230529785, 1.0841922760009766, 4.178630828857422, 7.2730712890625, 10.367510795593262, 13.461950302124023, 16.55638885498047, 19.650829315185547, 22.745269775390625, 25.83970832824707, 28.934146881103516, 32.028587341308594, 35.12302780151367, 38.21746826171875, 41.31190490722656, 44.40634536743164, 47.50078582763672, 50.59522247314453, 53.68966293334961, 56.78410339355469]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 9.0, 21.0, 26.0, 46.0, 45.0, 58.0, 74.0, 90.0, 91.0, 103.0, 78.0, 80.0, 79.0, 45.0, 46.0, 41.0, 20.0, 18.0, 11.0, 7.0, 7.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.023406982421875, -38.695579528808594, -37.36774826049805, -36.039920806884766, -34.71208953857422, -33.38426208496094, -32.056434631347656, -30.728605270385742, -29.400775909423828, -28.072946548461914, -26.7451171875, -25.41728973388672, -24.089460372924805, -22.76163101196289, -21.43380355834961, -20.105974197387695, -18.77814483642578, -17.450315475463867, -16.122486114501953, -14.794658660888672, -13.466829299926758, -12.138999938964844, -10.811171531677246, -9.483343124389648, -8.155513763427734, -6.8276848793029785, -5.499855995178223, -4.172027111053467, -2.844198226928711, -1.516369342803955, -0.18854045867919922, 1.1392879486083984, 2.467121124267578, 3.794950008392334, 5.12277889251709, 6.450607776641846, 7.778436660766602, 9.106266021728516, 10.434094429016113, 11.761922836303711, 13.089752197265625, 14.417581558227539, 15.745409965515137, 17.073238372802734, 18.40106773376465, 19.728897094726562, 21.056724548339844, 22.384553909301758, 23.712383270263672, 25.040212631225586, 26.3680419921875, 27.69586944580078, 29.023698806762695, 30.35152816772461, 31.67935562133789, 33.00718688964844, 34.33501434326172, 35.662841796875, 36.99067306518555, 38.31850051879883, 39.646331787109375, 40.974159240722656, 42.30198669433594, 43.62981414794922, 44.957645416259766]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 10.0, 5.0, 12.0, 20.0, 19.0, 30.0, 26.0, 51.0, 80.0, 93.0, 146.0, 252.0, 378.0, 664.0, 1151.0, 2397.0, 5433.0, 16441.0, 59502.0, 231491.0, 468448.0, 190483.0, 47916.0, 13786.0, 4790.0, 2195.0, 1072.0, 558.0, 383.0, 209.0, 136.0, 117.0, 61.0, 49.0, 41.0, 28.0, 22.0, 15.0, 12.0, 11.0, 7.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.171875, -18.561767578125, -17.95166015625, -17.341552734375, -16.7314453125, -16.121337890625, -15.51123046875, -14.901123046875, -14.291015625, -13.680908203125, -13.07080078125, -12.460693359375, -11.8505859375, -11.240478515625, -10.63037109375, -10.020263671875, -9.41015625, -8.800048828125, -8.18994140625, -7.579833984375, -6.9697265625, -6.359619140625, -5.74951171875, -5.139404296875, -4.529296875, -3.919189453125, -3.30908203125, -2.698974609375, -2.0888671875, -1.478759765625, -0.86865234375, -0.258544921875, 0.3515625, 0.961669921875, 1.57177734375, 2.181884765625, 2.7919921875, 3.402099609375, 4.01220703125, 4.622314453125, 5.232421875, 5.842529296875, 6.45263671875, 7.062744140625, 7.6728515625, 8.282958984375, 8.89306640625, 9.503173828125, 10.11328125, 10.723388671875, 11.33349609375, 11.943603515625, 12.5537109375, 13.163818359375, 13.77392578125, 14.384033203125, 14.994140625, 15.604248046875, 16.21435546875, 16.824462890625, 17.4345703125, 18.044677734375, 18.65478515625, 19.264892578125, 19.875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 8.0, 12.0, 19.0, 39.0, 70.0, 100.0, 125.0, 137.0, 131.0, 118.0, 93.0, 69.0, 42.0, 28.0, 8.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2734375, -9.034912109375, -8.79638671875, -8.557861328125, -8.3193359375, -8.080810546875, -7.84228515625, -7.603759765625, -7.365234375, -7.126708984375, -6.88818359375, -6.649658203125, -6.4111328125, -6.172607421875, -5.93408203125, -5.695556640625, -5.45703125, -5.218505859375, -4.97998046875, -4.741455078125, -4.5029296875, -4.264404296875, -4.02587890625, -3.787353515625, -3.548828125, -3.310302734375, -3.07177734375, -2.833251953125, -2.5947265625, -2.356201171875, -2.11767578125, -1.879150390625, -1.640625, -1.402099609375, -1.16357421875, -0.925048828125, -0.6865234375, -0.447998046875, -0.20947265625, 0.029052734375, 0.267578125, 0.506103515625, 0.74462890625, 0.983154296875, 1.2216796875, 1.460205078125, 1.69873046875, 1.937255859375, 2.17578125, 2.414306640625, 2.65283203125, 2.891357421875, 3.1298828125, 3.368408203125, 3.60693359375, 3.845458984375, 4.083984375, 4.322509765625, 4.56103515625, 4.799560546875, 5.0380859375, 5.276611328125, 5.51513671875, 5.753662109375, 5.9921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 7.0, 11.0, 16.0, 18.0, 19.0, 32.0, 41.0, 66.0, 96.0, 99.0, 137.0, 196.0, 275.0, 426.0, 612.0, 1041.0, 2130.0, 4335.0, 10515.0, 28888.0, 86611.0, 245397.0, 378374.0, 187926.0, 63759.0, 21496.0, 8005.0, 3459.0, 1699.0, 930.0, 563.0, 363.0, 251.0, 205.0, 159.0, 92.0, 73.0, 53.0, 41.0, 30.0, 31.0, 16.0, 18.0, 9.0, 6.0, 5.0, 6.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.953125, -9.6141357421875, -9.275146484375, -8.9361572265625, -8.59716796875, -8.2581787109375, -7.919189453125, -7.5802001953125, -7.2412109375, -6.9022216796875, -6.563232421875, -6.2242431640625, -5.88525390625, -5.5462646484375, -5.207275390625, -4.8682861328125, -4.529296875, -4.1903076171875, -3.851318359375, -3.5123291015625, -3.17333984375, -2.8343505859375, -2.495361328125, -2.1563720703125, -1.8173828125, -1.4783935546875, -1.139404296875, -0.8004150390625, -0.46142578125, -0.1224365234375, 0.216552734375, 0.5555419921875, 0.89453125, 1.2335205078125, 1.572509765625, 1.9114990234375, 2.25048828125, 2.5894775390625, 2.928466796875, 3.2674560546875, 3.6064453125, 3.9454345703125, 4.284423828125, 4.6234130859375, 4.96240234375, 5.3013916015625, 5.640380859375, 5.9793701171875, 6.318359375, 6.6573486328125, 6.996337890625, 7.3353271484375, 7.67431640625, 8.0133056640625, 8.352294921875, 8.6912841796875, 9.0302734375, 9.3692626953125, 9.708251953125, 10.0472412109375, 10.38623046875, 10.7252197265625, 11.064208984375, 11.4031982421875, 11.7421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 3.0, 1.0, 6.0, 6.0, 6.0, 10.0, 8.0, 6.0, 14.0, 14.0, 21.0, 32.0, 24.0, 35.0, 29.0, 34.0, 25.0, 39.0, 47.0, 46.0, 43.0, 39.0, 49.0, 45.0, 43.0, 56.0, 35.0, 36.0, 36.0, 44.0, 33.0, 23.0, 21.0, 14.0, 13.0, 12.0, 12.0, 9.0, 7.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-13.1328125, -12.7587890625, -12.384765625, -12.0107421875, -11.63671875, -11.2626953125, -10.888671875, -10.5146484375, -10.140625, -9.7666015625, -9.392578125, -9.0185546875, -8.64453125, -8.2705078125, -7.896484375, -7.5224609375, -7.1484375, -6.7744140625, -6.400390625, -6.0263671875, -5.65234375, -5.2783203125, -4.904296875, -4.5302734375, -4.15625, -3.7822265625, -3.408203125, -3.0341796875, -2.66015625, -2.2861328125, -1.912109375, -1.5380859375, -1.1640625, -0.7900390625, -0.416015625, -0.0419921875, 0.33203125, 0.7060546875, 1.080078125, 1.4541015625, 1.828125, 2.2021484375, 2.576171875, 2.9501953125, 3.32421875, 3.6982421875, 4.072265625, 4.4462890625, 4.8203125, 5.1943359375, 5.568359375, 5.9423828125, 6.31640625, 6.6904296875, 7.064453125, 7.4384765625, 7.8125, 8.1865234375, 8.560546875, 8.9345703125, 9.30859375, 9.6826171875, 10.056640625, 10.4306640625, 10.8046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 13.0, 5.0, 16.0, 30.0, 40.0, 48.0, 81.0, 112.0, 213.0, 276.0, 483.0, 835.0, 1442.0, 2599.0, 4914.0, 9977.0, 23194.0, 68992.0, 309686.0, 454660.0, 112022.0, 32220.0, 13031.0, 6131.0, 3138.0, 1700.0, 1010.0, 592.0, 388.0, 266.0, 149.0, 91.0, 68.0, 38.0, 24.0, 14.0, 11.0, 13.0, 7.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.1640625, -6.900390625, -6.63671875, -6.373046875, -6.109375, -5.845703125, -5.58203125, -5.318359375, -5.0546875, -4.791015625, -4.52734375, -4.263671875, -4.0, -3.736328125, -3.47265625, -3.208984375, -2.9453125, -2.681640625, -2.41796875, -2.154296875, -1.890625, -1.626953125, -1.36328125, -1.099609375, -0.8359375, -0.572265625, -0.30859375, -0.044921875, 0.21875, 0.482421875, 0.74609375, 1.009765625, 1.2734375, 1.537109375, 1.80078125, 2.064453125, 2.328125, 2.591796875, 2.85546875, 3.119140625, 3.3828125, 3.646484375, 3.91015625, 4.173828125, 4.4375, 4.701171875, 4.96484375, 5.228515625, 5.4921875, 5.755859375, 6.01953125, 6.283203125, 6.546875, 6.810546875, 7.07421875, 7.337890625, 7.6015625, 7.865234375, 8.12890625, 8.392578125, 8.65625, 8.919921875, 9.18359375, 9.447265625, 9.7109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 15.0, 12.0, 25.0, 23.0, 31.0, 49.0, 77.0, 89.0, 135.0, 112.0, 102.0, 79.0, 60.0, 37.0, 35.0, 24.0, 17.0, 17.0, 6.0, 10.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014371871948242188, -0.0013964921236038208, -0.0013557970523834229, -0.001315101981163025, -0.001274406909942627, -0.001233711838722229, -0.001193016767501831, -0.001152321696281433, -0.0011116266250610352, -0.0010709315538406372, -0.0010302364826202393, -0.0009895414113998413, -0.0009488463401794434, -0.0009081512689590454, -0.0008674561977386475, -0.0008267611265182495, -0.0007860660552978516, -0.0007453709840774536, -0.0007046759128570557, -0.0006639808416366577, -0.0006232857704162598, -0.0005825906991958618, -0.0005418956279754639, -0.0005012005567550659, -0.00046050548553466797, -0.00041981041431427, -0.00037911534309387207, -0.0003384202718734741, -0.00029772520065307617, -0.0002570301294326782, -0.00021633505821228027, -0.00017563998699188232, -0.00013494491577148438, -9.424984455108643e-05, -5.3554773330688477e-05, -1.2859702110290527e-05, 2.7835369110107422e-05, 6.853044033050537e-05, 0.00010922551155090332, 0.00014992058277130127, 0.00019061565399169922, 0.00023131072521209717, 0.0002720057964324951, 0.00031270086765289307, 0.000353395938873291, 0.00039409101009368896, 0.0004347860813140869, 0.00047548115253448486, 0.0005161762237548828, 0.0005568712949752808, 0.0005975663661956787, 0.0006382614374160767, 0.0006789565086364746, 0.0007196515798568726, 0.0007603466510772705, 0.0008010417222976685, 0.0008417367935180664, 0.0008824318647384644, 0.0009231269359588623, 0.0009638220071792603, 0.0010045170783996582, 0.0010452121496200562, 0.001085907220840454, 0.001126602292060852, 0.00116729736328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 12.0, 9.0, 20.0, 16.0, 34.0, 44.0, 83.0, 117.0, 189.0, 323.0, 515.0, 929.0, 2025.0, 4481.0, 11689.0, 39239.0, 272101.0, 614669.0, 72268.0, 17809.0, 6327.0, 2650.0, 1334.0, 666.0, 378.0, 228.0, 128.0, 81.0, 50.0, 40.0, 34.0, 17.0, 15.0, 6.0, 11.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.171875, -13.7025146484375, -13.233154296875, -12.7637939453125, -12.29443359375, -11.8250732421875, -11.355712890625, -10.8863525390625, -10.4169921875, -9.9476318359375, -9.478271484375, -9.0089111328125, -8.53955078125, -8.0701904296875, -7.600830078125, -7.1314697265625, -6.662109375, -6.1927490234375, -5.723388671875, -5.2540283203125, -4.78466796875, -4.3153076171875, -3.845947265625, -3.3765869140625, -2.9072265625, -2.4378662109375, -1.968505859375, -1.4991455078125, -1.02978515625, -0.5604248046875, -0.091064453125, 0.3782958984375, 0.84765625, 1.3170166015625, 1.786376953125, 2.2557373046875, 2.72509765625, 3.1944580078125, 3.663818359375, 4.1331787109375, 4.6025390625, 5.0718994140625, 5.541259765625, 6.0106201171875, 6.47998046875, 6.9493408203125, 7.418701171875, 7.8880615234375, 8.357421875, 8.8267822265625, 9.296142578125, 9.7655029296875, 10.23486328125, 10.7042236328125, 11.173583984375, 11.6429443359375, 12.1123046875, 12.5816650390625, 13.051025390625, 13.5203857421875, 13.98974609375, 14.4591064453125, 14.928466796875, 15.3978271484375, 15.8671875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 13.0, 15.0, 27.0, 42.0, 57.0, 101.0, 153.0, 171.0, 144.0, 99.0, 49.0, 32.0, 22.0, 16.0, 7.0, 9.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.640625, -11.18212890625, -10.7236328125, -10.26513671875, -9.806640625, -9.34814453125, -8.8896484375, -8.43115234375, -7.97265625, -7.51416015625, -7.0556640625, -6.59716796875, -6.138671875, -5.68017578125, -5.2216796875, -4.76318359375, -4.3046875, -3.84619140625, -3.3876953125, -2.92919921875, -2.470703125, -2.01220703125, -1.5537109375, -1.09521484375, -0.63671875, -0.17822265625, 0.2802734375, 0.73876953125, 1.197265625, 1.65576171875, 2.1142578125, 2.57275390625, 3.03125, 3.48974609375, 3.9482421875, 4.40673828125, 4.865234375, 5.32373046875, 5.7822265625, 6.24072265625, 6.69921875, 7.15771484375, 7.6162109375, 8.07470703125, 8.533203125, 8.99169921875, 9.4501953125, 9.90869140625, 10.3671875, 10.82568359375, 11.2841796875, 11.74267578125, 12.201171875, 12.65966796875, 13.1181640625, 13.57666015625, 14.03515625, 14.49365234375, 14.9521484375, 15.41064453125, 15.869140625, 16.32763671875, 16.7861328125, 17.24462890625, 17.703125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 7.0, 51.0, 164.0, 383.0, 266.0, 85.0, 29.0, 10.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-295.03594970703125, -284.77294921875, -274.5099182128906, -264.2469177246094, -253.98390197753906, -243.72088623046875, -233.4578857421875, -223.1948699951172, -212.93185424804688, -202.66883850097656, -192.40582275390625, -182.142822265625, -171.8798065185547, -161.61679077148438, -151.35379028320312, -141.0907745361328, -130.8277587890625, -120.56474304199219, -110.3017349243164, -100.03872680664062, -89.77571105957031, -79.5126953125, -69.24968719482422, -58.98667907714844, -48.723663330078125, -38.46065139770508, -28.19763946533203, -17.934627532958984, -7.6716156005859375, 2.5913963317871094, 12.854408264160156, 23.117416381835938, 33.38043212890625, 43.6434440612793, 53.906455993652344, 64.16946411132812, 74.43247985839844, 84.69549560546875, 94.95850372314453, 105.22151184082031, 115.48452758789062, 125.74754333496094, 136.01055908203125, 146.2735595703125, 156.5365753173828, 166.79959106445312, 177.06259155273438, 187.3256072998047, 197.588623046875, 207.8516387939453, 218.11465454101562, 228.37765502929688, 238.6406707763672, 248.9036865234375, 259.16668701171875, 269.4296875, 279.6927185058594, 289.9557189941406, 300.21875, 310.48175048828125, 320.7447509765625, 331.0077819824219, 341.2707824707031, 351.5338134765625, 361.79681396484375]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 4.0, 8.0, 8.0, 22.0, 20.0, 17.0, 30.0, 30.0, 33.0, 26.0, 31.0, 47.0, 41.0, 46.0, 50.0, 37.0, 48.0, 42.0, 45.0, 39.0, 42.0, 47.0, 41.0, 28.0, 36.0, 27.0, 22.0, 27.0, 13.0, 21.0, 10.0, 11.0, 9.0, 5.0, 7.0, 7.0, 5.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-89.48361206054688, -86.8594970703125, -84.2353744506836, -81.61125946044922, -78.98714447021484, -76.36302947998047, -73.73890686035156, -71.11479187011719, -68.49067687988281, -65.86656188964844, -63.2424430847168, -60.618324279785156, -57.99420928955078, -55.37009048461914, -52.7459716796875, -50.121856689453125, -47.497737884521484, -44.873619079589844, -42.24950408935547, -39.62538528442383, -37.00127029418945, -34.37715148925781, -31.753034591674805, -29.128917694091797, -26.50480079650879, -23.88068389892578, -21.256567001342773, -18.632450103759766, -16.008331298828125, -13.384215354919434, -10.76009750366211, -8.135980606079102, -5.511863708496094, -2.887746572494507, -0.2636294364929199, 2.360487937927246, 4.984604835510254, 7.608721733093262, 10.232839584350586, 12.856956481933594, 15.481073379516602, 18.10519027709961, 20.729307174682617, 23.353424072265625, 25.977542877197266, 28.60165786743164, 31.22577667236328, 33.849891662597656, 36.4740104675293, 39.09812927246094, 41.72224426269531, 44.34636306762695, 46.97047805786133, 49.59459686279297, 52.218711853027344, 54.842830657958984, 57.466949462890625, 60.091068267822266, 62.71518325805664, 65.33930206298828, 67.96341705322266, 70.58753204345703, 73.21165466308594, 75.83576965332031, 78.45988464355469]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 3.0, 11.0, 6.0, 12.0, 18.0, 32.0, 48.0, 74.0, 125.0, 214.0, 411.0, 786.0, 1832.0, 5693.0, 26340.0, 440168.0, 3640652.0, 63116.0, 9814.0, 2801.0, 1131.0, 454.0, 221.0, 123.0, 71.0, 48.0, 25.0, 12.0, 14.0, 13.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.25, -33.1865234375, -32.123046875, -31.0595703125, -29.99609375, -28.9326171875, -27.869140625, -26.8056640625, -25.7421875, -24.6787109375, -23.615234375, -22.5517578125, -21.48828125, -20.4248046875, -19.361328125, -18.2978515625, -17.234375, -16.1708984375, -15.107421875, -14.0439453125, -12.98046875, -11.9169921875, -10.853515625, -9.7900390625, -8.7265625, -7.6630859375, -6.599609375, -5.5361328125, -4.47265625, -3.4091796875, -2.345703125, -1.2822265625, -0.21875, 0.8447265625, 1.908203125, 2.9716796875, 4.03515625, 5.0986328125, 6.162109375, 7.2255859375, 8.2890625, 9.3525390625, 10.416015625, 11.4794921875, 12.54296875, 13.6064453125, 14.669921875, 15.7333984375, 16.796875, 17.8603515625, 18.923828125, 19.9873046875, 21.05078125, 22.1142578125, 23.177734375, 24.2412109375, 25.3046875, 26.3681640625, 27.431640625, 28.4951171875, 29.55859375, 30.6220703125, 31.685546875, 32.7490234375, 33.8125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 8.0, 13.0, 20.0, 33.0, 63.0, 81.0, 96.0, 117.0, 120.0, 119.0, 101.0, 82.0, 58.0, 49.0, 25.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9375, -8.699462890625, -8.46142578125, -8.223388671875, -7.9853515625, -7.747314453125, -7.50927734375, -7.271240234375, -7.033203125, -6.795166015625, -6.55712890625, -6.319091796875, -6.0810546875, -5.843017578125, -5.60498046875, -5.366943359375, -5.12890625, -4.890869140625, -4.65283203125, -4.414794921875, -4.1767578125, -3.938720703125, -3.70068359375, -3.462646484375, -3.224609375, -2.986572265625, -2.74853515625, -2.510498046875, -2.2724609375, -2.034423828125, -1.79638671875, -1.558349609375, -1.3203125, -1.082275390625, -0.84423828125, -0.606201171875, -0.3681640625, -0.130126953125, 0.10791015625, 0.345947265625, 0.583984375, 0.822021484375, 1.06005859375, 1.298095703125, 1.5361328125, 1.774169921875, 2.01220703125, 2.250244140625, 2.48828125, 2.726318359375, 2.96435546875, 3.202392578125, 3.4404296875, 3.678466796875, 3.91650390625, 4.154541015625, 4.392578125, 4.630615234375, 4.86865234375, 5.106689453125, 5.3447265625, 5.582763671875, 5.82080078125, 6.058837890625, 6.296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 11.0, 14.0, 19.0, 27.0, 34.0, 60.0, 96.0, 131.0, 262.0, 555.0, 1293.0, 4387.0, 24612.0, 580839.0, 3504636.0, 65745.0, 7858.0, 2098.0, 791.0, 355.0, 197.0, 110.0, 64.0, 38.0, 20.0, 14.0, 5.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.640625, -19.787841796875, -18.93505859375, -18.082275390625, -17.2294921875, -16.376708984375, -15.52392578125, -14.671142578125, -13.818359375, -12.965576171875, -12.11279296875, -11.260009765625, -10.4072265625, -9.554443359375, -8.70166015625, -7.848876953125, -6.99609375, -6.143310546875, -5.29052734375, -4.437744140625, -3.5849609375, -2.732177734375, -1.87939453125, -1.026611328125, -0.173828125, 0.678955078125, 1.53173828125, 2.384521484375, 3.2373046875, 4.090087890625, 4.94287109375, 5.795654296875, 6.6484375, 7.501220703125, 8.35400390625, 9.206787109375, 10.0595703125, 10.912353515625, 11.76513671875, 12.617919921875, 13.470703125, 14.323486328125, 15.17626953125, 16.029052734375, 16.8818359375, 17.734619140625, 18.58740234375, 19.440185546875, 20.29296875, 21.145751953125, 21.99853515625, 22.851318359375, 23.7041015625, 24.556884765625, 25.40966796875, 26.262451171875, 27.115234375, 27.968017578125, 28.82080078125, 29.673583984375, 30.5263671875, 31.379150390625, 32.23193359375, 33.084716796875, 33.9375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 8.0, 15.0, 26.0, 43.0, 93.0, 203.0, 596.0, 1926.0, 775.0, 221.0, 91.0, 34.0, 21.0, 12.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.34375, -16.927490234375, -16.51123046875, -16.094970703125, -15.6787109375, -15.262451171875, -14.84619140625, -14.429931640625, -14.013671875, -13.597412109375, -13.18115234375, -12.764892578125, -12.3486328125, -11.932373046875, -11.51611328125, -11.099853515625, -10.68359375, -10.267333984375, -9.85107421875, -9.434814453125, -9.0185546875, -8.602294921875, -8.18603515625, -7.769775390625, -7.353515625, -6.937255859375, -6.52099609375, -6.104736328125, -5.6884765625, -5.272216796875, -4.85595703125, -4.439697265625, -4.0234375, -3.607177734375, -3.19091796875, -2.774658203125, -2.3583984375, -1.942138671875, -1.52587890625, -1.109619140625, -0.693359375, -0.277099609375, 0.13916015625, 0.555419921875, 0.9716796875, 1.387939453125, 1.80419921875, 2.220458984375, 2.63671875, 3.052978515625, 3.46923828125, 3.885498046875, 4.3017578125, 4.718017578125, 5.13427734375, 5.550537109375, 5.966796875, 6.383056640625, 6.79931640625, 7.215576171875, 7.6318359375, 8.048095703125, 8.46435546875, 8.880615234375, 9.296875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 21.0, 59.0, 150.0, 266.0, 277.0, 149.0, 45.0, 11.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.85604858398438, -113.3698501586914, -109.8836441040039, -106.39744567871094, -102.91124725341797, -99.42504119873047, -95.9388427734375, -92.45263671875, -88.96643829345703, -85.48023986816406, -81.99403381347656, -78.5078353881836, -75.02163696289062, -71.53543090820312, -68.04923248291016, -64.56303405761719, -61.07683181762695, -57.59062957763672, -54.10443115234375, -50.618228912353516, -47.13202667236328, -43.64582824707031, -40.15962600708008, -36.673423767089844, -33.187225341796875, -29.701025009155273, -26.21482276916504, -22.728622436523438, -19.242420196533203, -15.756219863891602, -12.27001953125, -8.783817291259766, -5.297615051269531, -1.8114140033721924, 1.6747870445251465, 5.160987854003906, 8.647189140319824, 12.133390426635742, 15.619590759277344, 19.105792999267578, 22.59199333190918, 26.07819366455078, 29.564395904541016, 33.05059814453125, 36.53679656982422, 40.02299880981445, 43.50920104980469, 46.995399475097656, 50.48160171508789, 53.967803955078125, 57.454002380371094, 60.94020462036133, 64.42640686035156, 67.91260528564453, 71.3988037109375, 74.885009765625, 78.37120819091797, 81.85740661621094, 85.34361267089844, 88.8298110961914, 92.31600952148438, 95.80221557617188, 99.28841400146484, 102.77461242675781, 106.26081848144531]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 11.0, 16.0, 16.0, 26.0, 21.0, 31.0, 47.0, 45.0, 42.0, 51.0, 58.0, 48.0, 59.0, 52.0, 60.0, 56.0, 59.0, 47.0, 40.0, 33.0, 44.0, 35.0, 19.0, 20.0, 19.0, 13.0, 4.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.105918884277344, -42.89449691772461, -41.68307876586914, -40.471656799316406, -39.26023864746094, -38.0488166809082, -36.837398529052734, -35.6259765625, -34.41455841064453, -33.2031364440918, -31.991718292236328, -30.780298233032227, -29.568878173828125, -28.35745620727539, -27.14603614807129, -25.934616088867188, -24.723194122314453, -23.51177406311035, -22.30035400390625, -21.08893394470215, -19.877513885498047, -18.666091918945312, -17.45467185974121, -16.24325180053711, -15.031831741333008, -13.820411682128906, -12.608991622924805, -11.397570610046387, -10.186150550842285, -8.974730491638184, -7.763309955596924, -6.551889419555664, -5.3404693603515625, -4.129049301147461, -2.917628765106201, -1.7062084674835205, -0.49478816986083984, 0.7166318893432617, 1.9280524253845215, 3.1394729614257812, 4.350893020629883, 5.562313079833984, 6.773733615875244, 7.985154151916504, 9.196574211120605, 10.407994270324707, 11.619415283203125, 12.830835342407227, 14.042255401611328, 15.25367546081543, 16.46509552001953, 17.676515579223633, 18.887935638427734, 20.09935760498047, 21.31077766418457, 22.522197723388672, 23.733617782592773, 24.945037841796875, 26.156457901000977, 27.367877960205078, 28.579299926757812, 29.79071807861328, 31.002140045166016, 32.21356201171875, 33.42498016357422]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 6.0, 5.0, 5.0, 12.0, 14.0, 17.0, 33.0, 52.0, 73.0, 105.0, 204.0, 368.0, 767.0, 1644.0, 4150.0, 13250.0, 61967.0, 492398.0, 402444.0, 52330.0, 11884.0, 3753.0, 1462.0, 736.0, 356.0, 196.0, 110.0, 62.0, 51.0, 28.0, 15.0, 23.0, 13.0, 10.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.046875, -26.22607421875, -25.4052734375, -24.58447265625, -23.763671875, -22.94287109375, -22.1220703125, -21.30126953125, -20.48046875, -19.65966796875, -18.8388671875, -18.01806640625, -17.197265625, -16.37646484375, -15.5556640625, -14.73486328125, -13.9140625, -13.09326171875, -12.2724609375, -11.45166015625, -10.630859375, -9.81005859375, -8.9892578125, -8.16845703125, -7.34765625, -6.52685546875, -5.7060546875, -4.88525390625, -4.064453125, -3.24365234375, -2.4228515625, -1.60205078125, -0.78125, 0.03955078125, 0.8603515625, 1.68115234375, 2.501953125, 3.32275390625, 4.1435546875, 4.96435546875, 5.78515625, 6.60595703125, 7.4267578125, 8.24755859375, 9.068359375, 9.88916015625, 10.7099609375, 11.53076171875, 12.3515625, 13.17236328125, 13.9931640625, 14.81396484375, 15.634765625, 16.45556640625, 17.2763671875, 18.09716796875, 18.91796875, 19.73876953125, 20.5595703125, 21.38037109375, 22.201171875, 23.02197265625, 23.8427734375, 24.66357421875, 25.484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 10.0, 21.0, 35.0, 48.0, 74.0, 101.0, 127.0, 135.0, 112.0, 119.0, 78.0, 59.0, 35.0, 28.0, 12.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.26287841796875, -9.0101318359375, -8.75738525390625, -8.504638671875, -8.25189208984375, -7.9991455078125, -7.74639892578125, -7.49365234375, -7.24090576171875, -6.9881591796875, -6.73541259765625, -6.482666015625, -6.22991943359375, -5.9771728515625, -5.72442626953125, -5.4716796875, -5.21893310546875, -4.9661865234375, -4.71343994140625, -4.460693359375, -4.20794677734375, -3.9552001953125, -3.70245361328125, -3.44970703125, -3.19696044921875, -2.9442138671875, -2.69146728515625, -2.438720703125, -2.18597412109375, -1.9332275390625, -1.68048095703125, -1.427734375, -1.17498779296875, -0.9222412109375, -0.66949462890625, -0.416748046875, -0.16400146484375, 0.0887451171875, 0.34149169921875, 0.59423828125, 0.84698486328125, 1.0997314453125, 1.35247802734375, 1.605224609375, 1.85797119140625, 2.1107177734375, 2.36346435546875, 2.6162109375, 2.86895751953125, 3.1217041015625, 3.37445068359375, 3.627197265625, 3.87994384765625, 4.1326904296875, 4.38543701171875, 4.63818359375, 4.89093017578125, 5.1436767578125, 5.39642333984375, 5.649169921875, 5.90191650390625, 6.1546630859375, 6.40740966796875, 6.66015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 10.0, 11.0, 14.0, 16.0, 11.0, 25.0, 33.0, 39.0, 46.0, 67.0, 102.0, 116.0, 193.0, 299.0, 449.0, 684.0, 1449.0, 3336.0, 9485.0, 35241.0, 179405.0, 639473.0, 134873.0, 29014.0, 7953.0, 2895.0, 1272.0, 654.0, 444.0, 264.0, 185.0, 111.0, 95.0, 68.0, 52.0, 48.0, 41.0, 25.0, 12.0, 12.0, 9.0, 4.0, 4.0, 1.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.328125, -15.753662109375, -15.17919921875, -14.604736328125, -14.0302734375, -13.455810546875, -12.88134765625, -12.306884765625, -11.732421875, -11.157958984375, -10.58349609375, -10.009033203125, -9.4345703125, -8.860107421875, -8.28564453125, -7.711181640625, -7.13671875, -6.562255859375, -5.98779296875, -5.413330078125, -4.8388671875, -4.264404296875, -3.68994140625, -3.115478515625, -2.541015625, -1.966552734375, -1.39208984375, -0.817626953125, -0.2431640625, 0.331298828125, 0.90576171875, 1.480224609375, 2.0546875, 2.629150390625, 3.20361328125, 3.778076171875, 4.3525390625, 4.927001953125, 5.50146484375, 6.075927734375, 6.650390625, 7.224853515625, 7.79931640625, 8.373779296875, 8.9482421875, 9.522705078125, 10.09716796875, 10.671630859375, 11.24609375, 11.820556640625, 12.39501953125, 12.969482421875, 13.5439453125, 14.118408203125, 14.69287109375, 15.267333984375, 15.841796875, 16.416259765625, 16.99072265625, 17.565185546875, 18.1396484375, 18.714111328125, 19.28857421875, 19.863037109375, 20.4375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 4.0, 6.0, 6.0, 11.0, 7.0, 15.0, 15.0, 24.0, 14.0, 24.0, 22.0, 33.0, 44.0, 39.0, 50.0, 60.0, 53.0, 55.0, 54.0, 54.0, 52.0, 45.0, 49.0, 47.0, 31.0, 23.0, 17.0, 25.0, 21.0, 22.0, 11.0, 11.0, 12.0, 9.0, 5.0, 4.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0234375, -12.5709228515625, -12.118408203125, -11.6658935546875, -11.21337890625, -10.7608642578125, -10.308349609375, -9.8558349609375, -9.4033203125, -8.9508056640625, -8.498291015625, -8.0457763671875, -7.59326171875, -7.1407470703125, -6.688232421875, -6.2357177734375, -5.783203125, -5.3306884765625, -4.878173828125, -4.4256591796875, -3.97314453125, -3.5206298828125, -3.068115234375, -2.6156005859375, -2.1630859375, -1.7105712890625, -1.258056640625, -0.8055419921875, -0.35302734375, 0.0994873046875, 0.552001953125, 1.0045166015625, 1.45703125, 1.9095458984375, 2.362060546875, 2.8145751953125, 3.26708984375, 3.7196044921875, 4.172119140625, 4.6246337890625, 5.0771484375, 5.5296630859375, 5.982177734375, 6.4346923828125, 6.88720703125, 7.3397216796875, 7.792236328125, 8.2447509765625, 8.697265625, 9.1497802734375, 9.602294921875, 10.0548095703125, 10.50732421875, 10.9598388671875, 11.412353515625, 11.8648681640625, 12.3173828125, 12.7698974609375, 13.222412109375, 13.6749267578125, 14.12744140625, 14.5799560546875, 15.032470703125, 15.4849853515625, 15.9375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 5.0, 10.0, 12.0, 22.0, 20.0, 38.0, 73.0, 92.0, 169.0, 300.0, 600.0, 1627.0, 5680.0, 25788.0, 433916.0, 542369.0, 28533.0, 6130.0, 1760.0, 652.0, 317.0, 168.0, 98.0, 54.0, 44.0, 26.0, 14.0, 13.0, 9.0, 6.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.015625, -16.429443359375, -15.84326171875, -15.257080078125, -14.6708984375, -14.084716796875, -13.49853515625, -12.912353515625, -12.326171875, -11.739990234375, -11.15380859375, -10.567626953125, -9.9814453125, -9.395263671875, -8.80908203125, -8.222900390625, -7.63671875, -7.050537109375, -6.46435546875, -5.878173828125, -5.2919921875, -4.705810546875, -4.11962890625, -3.533447265625, -2.947265625, -2.361083984375, -1.77490234375, -1.188720703125, -0.6025390625, -0.016357421875, 0.56982421875, 1.156005859375, 1.7421875, 2.328369140625, 2.91455078125, 3.500732421875, 4.0869140625, 4.673095703125, 5.25927734375, 5.845458984375, 6.431640625, 7.017822265625, 7.60400390625, 8.190185546875, 8.7763671875, 9.362548828125, 9.94873046875, 10.534912109375, 11.12109375, 11.707275390625, 12.29345703125, 12.879638671875, 13.4658203125, 14.052001953125, 14.63818359375, 15.224365234375, 15.810546875, 16.396728515625, 16.98291015625, 17.569091796875, 18.1552734375, 18.741455078125, 19.32763671875, 19.913818359375, 20.5]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 13.0, 14.0, 20.0, 18.0, 30.0, 39.0, 74.0, 221.0, 318.0, 83.0, 50.0, 31.0, 24.0, 18.0, 6.0, 5.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002162933349609375, -0.0021046996116638184, -0.0020464658737182617, -0.001988232135772705, -0.0019299983978271484, -0.0018717646598815918, -0.0018135309219360352, -0.0017552971839904785, -0.0016970634460449219, -0.0016388297080993652, -0.0015805959701538086, -0.001522362232208252, -0.0014641284942626953, -0.0014058947563171387, -0.001347661018371582, -0.0012894272804260254, -0.0012311935424804688, -0.0011729598045349121, -0.0011147260665893555, -0.0010564923286437988, -0.0009982585906982422, -0.0009400248527526855, -0.0008817911148071289, -0.0008235573768615723, -0.0007653236389160156, -0.000707089900970459, -0.0006488561630249023, -0.0005906224250793457, -0.0005323886871337891, -0.0004741549491882324, -0.0004159212112426758, -0.00035768747329711914, -0.0002994537353515625, -0.00024121999740600586, -0.00018298625946044922, -0.00012475252151489258, -6.651878356933594e-05, -8.285045623779297e-06, 4.9948692321777344e-05, 0.00010818243026733398, 0.00016641616821289062, 0.00022464990615844727, 0.0002828836441040039, 0.00034111738204956055, 0.0003993511199951172, 0.00045758485794067383, 0.0005158185958862305, 0.0005740523338317871, 0.0006322860717773438, 0.0006905198097229004, 0.000748753547668457, 0.0008069872856140137, 0.0008652210235595703, 0.000923454761505127, 0.0009816884994506836, 0.0010399222373962402, 0.0010981559753417969, 0.0011563897132873535, 0.0012146234512329102, 0.0012728571891784668, 0.0013310909271240234, 0.00138932466506958, 0.0014475584030151367, 0.0015057921409606934, 0.00156402587890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 8.0, 6.0, 16.0, 14.0, 28.0, 41.0, 69.0, 90.0, 137.0, 274.0, 536.0, 1193.0, 2934.0, 8454.0, 32888.0, 701381.0, 264561.0, 24480.0, 6916.0, 2349.0, 1012.0, 484.0, 259.0, 130.0, 98.0, 79.0, 32.0, 21.0, 21.0, 6.0, 13.0, 8.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.03125, -16.373779296875, -15.71630859375, -15.058837890625, -14.4013671875, -13.743896484375, -13.08642578125, -12.428955078125, -11.771484375, -11.114013671875, -10.45654296875, -9.799072265625, -9.1416015625, -8.484130859375, -7.82666015625, -7.169189453125, -6.51171875, -5.854248046875, -5.19677734375, -4.539306640625, -3.8818359375, -3.224365234375, -2.56689453125, -1.909423828125, -1.251953125, -0.594482421875, 0.06298828125, 0.720458984375, 1.3779296875, 2.035400390625, 2.69287109375, 3.350341796875, 4.0078125, 4.665283203125, 5.32275390625, 5.980224609375, 6.6376953125, 7.295166015625, 7.95263671875, 8.610107421875, 9.267578125, 9.925048828125, 10.58251953125, 11.239990234375, 11.8974609375, 12.554931640625, 13.21240234375, 13.869873046875, 14.52734375, 15.184814453125, 15.84228515625, 16.499755859375, 17.1572265625, 17.814697265625, 18.47216796875, 19.129638671875, 19.787109375, 20.444580078125, 21.10205078125, 21.759521484375, 22.4169921875, 23.074462890625, 23.73193359375, 24.389404296875, 25.046875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 5.0, 14.0, 18.0, 14.0, 21.0, 39.0, 89.0, 274.0, 278.0, 82.0, 42.0, 16.0, 18.0, 12.0, 15.0, 12.0, 3.0, 7.0, 0.0, 5.0, 7.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.10498046875, -15.5849609375, -15.06494140625, -14.544921875, -14.02490234375, -13.5048828125, -12.98486328125, -12.46484375, -11.94482421875, -11.4248046875, -10.90478515625, -10.384765625, -9.86474609375, -9.3447265625, -8.82470703125, -8.3046875, -7.78466796875, -7.2646484375, -6.74462890625, -6.224609375, -5.70458984375, -5.1845703125, -4.66455078125, -4.14453125, -3.62451171875, -3.1044921875, -2.58447265625, -2.064453125, -1.54443359375, -1.0244140625, -0.50439453125, 0.015625, 0.53564453125, 1.0556640625, 1.57568359375, 2.095703125, 2.61572265625, 3.1357421875, 3.65576171875, 4.17578125, 4.69580078125, 5.2158203125, 5.73583984375, 6.255859375, 6.77587890625, 7.2958984375, 7.81591796875, 8.3359375, 8.85595703125, 9.3759765625, 9.89599609375, 10.416015625, 10.93603515625, 11.4560546875, 11.97607421875, 12.49609375, 13.01611328125, 13.5361328125, 14.05615234375, 14.576171875, 15.09619140625, 15.6162109375, 16.13623046875, 16.65625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 22.0, 62.0, 196.0, 348.0, 254.0, 74.0, 22.0, 13.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-199.06019592285156, -189.39529418945312, -179.7303924560547, -170.06549072265625, -160.4005889892578, -150.73568725585938, -141.07078552246094, -131.4058837890625, -121.74098205566406, -112.07608032226562, -102.41117858886719, -92.74627685546875, -83.08137512207031, -73.41647338867188, -63.75157165527344, -54.086669921875, -44.42176818847656, -34.756866455078125, -25.091964721679688, -15.42706298828125, -5.7621612548828125, 3.902740478515625, 13.567642211914062, 23.2325439453125, 32.89744567871094, 42.562347412109375, 52.22724914550781, 61.89215087890625, 71.55705261230469, 81.22195434570312, 90.88685607910156, 100.5517578125, 110.2166748046875, 119.88157653808594, 129.54647827148438, 139.2113800048828, 148.87628173828125, 158.5411834716797, 168.20608520507812, 177.87098693847656, 187.535888671875, 197.20079040527344, 206.86569213867188, 216.5305938720703, 226.19549560546875, 235.8603973388672, 245.52529907226562, 255.19020080566406, 264.8551025390625, 274.52001953125, 284.1849060058594, 293.84979248046875, 303.51470947265625, 313.17962646484375, 322.8445129394531, 332.5093994140625, 342.17431640625, 351.8392333984375, 361.5041198730469, 371.16900634765625, 380.83392333984375, 390.49884033203125, 400.1637268066406, 409.82861328125, 419.4935302734375]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 3.0, 13.0, 11.0, 12.0, 15.0, 17.0, 20.0, 27.0, 40.0, 35.0, 41.0, 44.0, 55.0, 55.0, 55.0, 51.0, 54.0, 56.0, 52.0, 46.0, 34.0, 51.0, 30.0, 31.0, 22.0, 19.0, 25.0, 19.0, 15.0, 14.0, 12.0, 4.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.30723571777344, -82.41069030761719, -79.5141372680664, -76.61759185791016, -73.72103881835938, -70.82449340820312, -67.92794036865234, -65.0313949584961, -62.13484191894531, -59.2382926940918, -56.34174346923828, -53.445194244384766, -50.54864501953125, -47.652095794677734, -44.75554656982422, -41.85900115966797, -38.96245193481445, -36.06590270996094, -33.16935348510742, -30.272804260253906, -27.37625503540039, -24.479705810546875, -21.583158493041992, -18.686609268188477, -15.790060043334961, -12.893510818481445, -9.99696159362793, -7.1004133224487305, -4.203864097595215, -1.3073148727416992, 1.5892333984375, 4.485782623291016, 7.382331848144531, 10.278881072998047, 13.175430297851562, 16.071979522705078, 18.968528747558594, 21.86507797241211, 24.761625289916992, 27.658174514770508, 30.554723739624023, 33.451271057128906, 36.34782028198242, 39.24436950683594, 42.14091873168945, 45.03746795654297, 47.934017181396484, 50.83056640625, 53.727115631103516, 56.62366485595703, 59.52021408081055, 62.41676330566406, 65.31330871582031, 68.2098617553711, 71.10640716552734, 74.00296020507812, 76.89950561523438, 79.79605102539062, 82.6926040649414, 85.58914947509766, 88.48570251464844, 91.38224792480469, 94.27880096435547, 97.17534637451172, 100.0718994140625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 4.0, 3.0, 14.0, 8.0, 7.0, 22.0, 25.0, 26.0, 43.0, 72.0, 97.0, 129.0, 206.0, 320.0, 516.0, 1076.0, 2015.0, 4984.0, 13691.0, 52990.0, 691585.0, 3304693.0, 91132.0, 19159.0, 6196.0, 2504.0, 1174.0, 598.0, 346.0, 186.0, 145.0, 84.0, 62.0, 54.0, 30.0, 17.0, 16.0, 14.0, 10.0, 12.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 0.0, 2.0, 2.0], "bins": [-28.875, -28.053466796875, -27.23193359375, -26.410400390625, -25.5888671875, -24.767333984375, -23.94580078125, -23.124267578125, -22.302734375, -21.481201171875, -20.65966796875, -19.838134765625, -19.0166015625, -18.195068359375, -17.37353515625, -16.552001953125, -15.73046875, -14.908935546875, -14.08740234375, -13.265869140625, -12.4443359375, -11.622802734375, -10.80126953125, -9.979736328125, -9.158203125, -8.336669921875, -7.51513671875, -6.693603515625, -5.8720703125, -5.050537109375, -4.22900390625, -3.407470703125, -2.5859375, -1.764404296875, -0.94287109375, -0.121337890625, 0.7001953125, 1.521728515625, 2.34326171875, 3.164794921875, 3.986328125, 4.807861328125, 5.62939453125, 6.450927734375, 7.2724609375, 8.093994140625, 8.91552734375, 9.737060546875, 10.55859375, 11.380126953125, 12.20166015625, 13.023193359375, 13.8447265625, 14.666259765625, 15.48779296875, 16.309326171875, 17.130859375, 17.952392578125, 18.77392578125, 19.595458984375, 20.4169921875, 21.238525390625, 22.06005859375, 22.881591796875, 23.703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 10.0, 20.0, 28.0, 54.0, 71.0, 95.0, 86.0, 124.0, 102.0, 106.0, 81.0, 60.0, 56.0, 47.0, 22.0, 16.0, 9.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2109375, -8.9560546875, -8.701171875, -8.4462890625, -8.19140625, -7.9365234375, -7.681640625, -7.4267578125, -7.171875, -6.9169921875, -6.662109375, -6.4072265625, -6.15234375, -5.8974609375, -5.642578125, -5.3876953125, -5.1328125, -4.8779296875, -4.623046875, -4.3681640625, -4.11328125, -3.8583984375, -3.603515625, -3.3486328125, -3.09375, -2.8388671875, -2.583984375, -2.3291015625, -2.07421875, -1.8193359375, -1.564453125, -1.3095703125, -1.0546875, -0.7998046875, -0.544921875, -0.2900390625, -0.03515625, 0.2197265625, 0.474609375, 0.7294921875, 0.984375, 1.2392578125, 1.494140625, 1.7490234375, 2.00390625, 2.2587890625, 2.513671875, 2.7685546875, 3.0234375, 3.2783203125, 3.533203125, 3.7880859375, 4.04296875, 4.2978515625, 4.552734375, 4.8076171875, 5.0625, 5.3173828125, 5.572265625, 5.8271484375, 6.08203125, 6.3369140625, 6.591796875, 6.8466796875, 7.1015625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 10.0, 13.0, 17.0, 9.0, 5.0, 25.0, 19.0, 38.0, 39.0, 80.0, 83.0, 120.0, 160.0, 173.0, 296.0, 440.0, 636.0, 1017.0, 1894.0, 4036.0, 11023.0, 45451.0, 431464.0, 3468056.0, 184254.0, 28945.0, 8151.0, 3392.0, 1690.0, 973.0, 523.0, 340.0, 253.0, 167.0, 132.0, 80.0, 62.0, 60.0, 32.0, 23.0, 17.0, 16.0, 13.0, 18.0, 10.0, 1.0, 3.0, 5.0, 8.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-18.84375, -18.26123046875, -17.6787109375, -17.09619140625, -16.513671875, -15.93115234375, -15.3486328125, -14.76611328125, -14.18359375, -13.60107421875, -13.0185546875, -12.43603515625, -11.853515625, -11.27099609375, -10.6884765625, -10.10595703125, -9.5234375, -8.94091796875, -8.3583984375, -7.77587890625, -7.193359375, -6.61083984375, -6.0283203125, -5.44580078125, -4.86328125, -4.28076171875, -3.6982421875, -3.11572265625, -2.533203125, -1.95068359375, -1.3681640625, -0.78564453125, -0.203125, 0.37939453125, 0.9619140625, 1.54443359375, 2.126953125, 2.70947265625, 3.2919921875, 3.87451171875, 4.45703125, 5.03955078125, 5.6220703125, 6.20458984375, 6.787109375, 7.36962890625, 7.9521484375, 8.53466796875, 9.1171875, 9.69970703125, 10.2822265625, 10.86474609375, 11.447265625, 12.02978515625, 12.6123046875, 13.19482421875, 13.77734375, 14.35986328125, 14.9423828125, 15.52490234375, 16.107421875, 16.68994140625, 17.2724609375, 17.85498046875, 18.4375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 10.0, 32.0, 74.0, 187.0, 660.0, 2278.0, 537.0, 136.0, 61.0, 29.0, 20.0, 13.0, 7.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.296875, -18.842529296875, -18.38818359375, -17.933837890625, -17.4794921875, -17.025146484375, -16.57080078125, -16.116455078125, -15.662109375, -15.207763671875, -14.75341796875, -14.299072265625, -13.8447265625, -13.390380859375, -12.93603515625, -12.481689453125, -12.02734375, -11.572998046875, -11.11865234375, -10.664306640625, -10.2099609375, -9.755615234375, -9.30126953125, -8.846923828125, -8.392578125, -7.938232421875, -7.48388671875, -7.029541015625, -6.5751953125, -6.120849609375, -5.66650390625, -5.212158203125, -4.7578125, -4.303466796875, -3.84912109375, -3.394775390625, -2.9404296875, -2.486083984375, -2.03173828125, -1.577392578125, -1.123046875, -0.668701171875, -0.21435546875, 0.239990234375, 0.6943359375, 1.148681640625, 1.60302734375, 2.057373046875, 2.51171875, 2.966064453125, 3.42041015625, 3.874755859375, 4.3291015625, 4.783447265625, 5.23779296875, 5.692138671875, 6.146484375, 6.600830078125, 7.05517578125, 7.509521484375, 7.9638671875, 8.418212890625, 8.87255859375, 9.326904296875, 9.78125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 16.0, 28.0, 90.0, 207.0, 332.0, 199.0, 75.0, 29.0, 9.0, 9.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.87104797363281, -59.695579528808594, -56.52011489868164, -53.34464645385742, -50.1691780090332, -46.99371337890625, -43.81824493408203, -40.64277648925781, -37.467308044433594, -34.291839599609375, -31.11637306213379, -27.940906524658203, -24.765438079833984, -21.5899715423584, -18.414505004882812, -15.239036560058594, -12.06357192993164, -8.888104438781738, -5.712637424468994, -2.53717041015625, 0.6382970809936523, 3.8137645721435547, 6.989231109619141, 10.16469955444336, 13.340166091918945, 16.51563262939453, 19.69110107421875, 22.866567611694336, 26.042034149169922, 29.21750259399414, 32.392967224121094, 35.56843566894531, 38.74390411376953, 41.91937255859375, 45.0948371887207, 48.27030563354492, 51.44577407836914, 54.621238708496094, 57.79670715332031, 60.97217559814453, 64.14764404296875, 67.32311248779297, 70.49858093261719, 73.67404174804688, 76.8495101928711, 80.02497863769531, 83.20044708251953, 86.37591552734375, 89.55137634277344, 92.72684478759766, 95.90231323242188, 99.07777404785156, 102.25324249267578, 105.4287109375, 108.60417938232422, 111.77964782714844, 114.95511627197266, 118.13058471679688, 121.3060531616211, 124.48152160644531, 127.656982421875, 130.83245849609375, 134.00791931152344, 137.18338012695312, 140.35885620117188]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 11.0, 19.0, 23.0, 32.0, 33.0, 48.0, 52.0, 52.0, 64.0, 89.0, 71.0, 72.0, 55.0, 55.0, 53.0, 52.0, 51.0, 34.0, 24.0, 35.0, 12.0, 20.0, 15.0, 9.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.365440368652344, -33.051151275634766, -31.736862182617188, -30.422571182250977, -29.1082820892334, -27.79399299621582, -26.47970199584961, -25.16541290283203, -23.851123809814453, -22.536834716796875, -21.222545623779297, -19.908254623413086, -18.593965530395508, -17.27967643737793, -15.965386390686035, -14.65109634399414, -13.336807250976562, -12.022518157958984, -10.70822811126709, -9.393938064575195, -8.079648971557617, -6.765359401702881, -5.4510698318481445, -4.13677978515625, -2.822490692138672, -1.5082011222839355, -0.19391155242919922, 1.120378017425537, 2.4346675872802734, 3.7489571571350098, 5.063246726989746, 6.377536773681641, 7.691829681396484, 9.006118774414062, 10.320408821105957, 11.634698867797852, 12.94898796081543, 14.263277053833008, 15.577567100524902, 16.891857147216797, 18.206146240234375, 19.520435333251953, 20.83472442626953, 22.149015426635742, 23.46330451965332, 24.7775936126709, 26.09188461303711, 27.406173706054688, 28.720462799072266, 30.034751892089844, 31.349040985107422, 32.663330078125, 33.977622985839844, 35.29191207885742, 36.606201171875, 37.92049026489258, 39.234779357910156, 40.549068450927734, 41.86335754394531, 43.17764663696289, 44.49193572998047, 45.80622863769531, 47.12051773071289, 48.43480682373047, 49.74909591674805]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 22.0, 43.0, 87.0, 165.0, 364.0, 929.0, 2948.0, 16047.0, 168294.0, 772418.0, 75071.0, 8969.0, 1955.0, 661.0, 288.0, 125.0, 74.0, 32.0, 26.0, 4.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.5625, -40.4189453125, -39.275390625, -38.1318359375, -36.98828125, -35.8447265625, -34.701171875, -33.5576171875, -32.4140625, -31.2705078125, -30.126953125, -28.9833984375, -27.83984375, -26.6962890625, -25.552734375, -24.4091796875, -23.265625, -22.1220703125, -20.978515625, -19.8349609375, -18.69140625, -17.5478515625, -16.404296875, -15.2607421875, -14.1171875, -12.9736328125, -11.830078125, -10.6865234375, -9.54296875, -8.3994140625, -7.255859375, -6.1123046875, -4.96875, -3.8251953125, -2.681640625, -1.5380859375, -0.39453125, 0.7490234375, 1.892578125, 3.0361328125, 4.1796875, 5.3232421875, 6.466796875, 7.6103515625, 8.75390625, 9.8974609375, 11.041015625, 12.1845703125, 13.328125, 14.4716796875, 15.615234375, 16.7587890625, 17.90234375, 19.0458984375, 20.189453125, 21.3330078125, 22.4765625, 23.6201171875, 24.763671875, 25.9072265625, 27.05078125, 28.1943359375, 29.337890625, 30.4814453125, 31.625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 15.0, 25.0, 27.0, 50.0, 68.0, 72.0, 110.0, 96.0, 119.0, 92.0, 96.0, 59.0, 56.0, 38.0, 39.0, 16.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.42022705078125, -9.1529541015625, -8.88568115234375, -8.618408203125, -8.35113525390625, -8.0838623046875, -7.81658935546875, -7.54931640625, -7.28204345703125, -7.0147705078125, -6.74749755859375, -6.480224609375, -6.21295166015625, -5.9456787109375, -5.67840576171875, -5.4111328125, -5.14385986328125, -4.8765869140625, -4.60931396484375, -4.342041015625, -4.07476806640625, -3.8074951171875, -3.54022216796875, -3.27294921875, -3.00567626953125, -2.7384033203125, -2.47113037109375, -2.203857421875, -1.93658447265625, -1.6693115234375, -1.40203857421875, -1.134765625, -0.86749267578125, -0.6002197265625, -0.33294677734375, -0.065673828125, 0.20159912109375, 0.4688720703125, 0.73614501953125, 1.00341796875, 1.27069091796875, 1.5379638671875, 1.80523681640625, 2.072509765625, 2.33978271484375, 2.6070556640625, 2.87432861328125, 3.1416015625, 3.40887451171875, 3.6761474609375, 3.94342041015625, 4.210693359375, 4.47796630859375, 4.7452392578125, 5.01251220703125, 5.27978515625, 5.54705810546875, 5.8143310546875, 6.08160400390625, 6.348876953125, 6.61614990234375, 6.8834228515625, 7.15069580078125, 7.41796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 9.0, 17.0, 20.0, 41.0, 55.0, 124.0, 228.0, 547.0, 1634.0, 7156.0, 62454.0, 823243.0, 137403.0, 12014.0, 2230.0, 752.0, 312.0, 141.0, 72.0, 32.0, 26.0, 14.0, 8.0, 8.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.1875, -33.171142578125, -32.15478515625, -31.138427734375, -30.1220703125, -29.105712890625, -28.08935546875, -27.072998046875, -26.056640625, -25.040283203125, -24.02392578125, -23.007568359375, -21.9912109375, -20.974853515625, -19.95849609375, -18.942138671875, -17.92578125, -16.909423828125, -15.89306640625, -14.876708984375, -13.8603515625, -12.843994140625, -11.82763671875, -10.811279296875, -9.794921875, -8.778564453125, -7.76220703125, -6.745849609375, -5.7294921875, -4.713134765625, -3.69677734375, -2.680419921875, -1.6640625, -0.647705078125, 0.36865234375, 1.385009765625, 2.4013671875, 3.417724609375, 4.43408203125, 5.450439453125, 6.466796875, 7.483154296875, 8.49951171875, 9.515869140625, 10.5322265625, 11.548583984375, 12.56494140625, 13.581298828125, 14.59765625, 15.614013671875, 16.63037109375, 17.646728515625, 18.6630859375, 19.679443359375, 20.69580078125, 21.712158203125, 22.728515625, 23.744873046875, 24.76123046875, 25.777587890625, 26.7939453125, 27.810302734375, 28.82666015625, 29.843017578125, 30.859375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 5.0, 8.0, 11.0, 10.0, 13.0, 32.0, 48.0, 57.0, 69.0, 94.0, 88.0, 96.0, 86.0, 104.0, 83.0, 49.0, 40.0, 32.0, 24.0, 19.0, 7.0, 8.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.469970703125, -31.50244140625, -30.534912109375, -29.5673828125, -28.599853515625, -27.63232421875, -26.664794921875, -25.697265625, -24.729736328125, -23.76220703125, -22.794677734375, -21.8271484375, -20.859619140625, -19.89208984375, -18.924560546875, -17.95703125, -16.989501953125, -16.02197265625, -15.054443359375, -14.0869140625, -13.119384765625, -12.15185546875, -11.184326171875, -10.216796875, -9.249267578125, -8.28173828125, -7.314208984375, -6.3466796875, -5.379150390625, -4.41162109375, -3.444091796875, -2.4765625, -1.509033203125, -0.54150390625, 0.426025390625, 1.3935546875, 2.361083984375, 3.32861328125, 4.296142578125, 5.263671875, 6.231201171875, 7.19873046875, 8.166259765625, 9.1337890625, 10.101318359375, 11.06884765625, 12.036376953125, 13.00390625, 13.971435546875, 14.93896484375, 15.906494140625, 16.8740234375, 17.841552734375, 18.80908203125, 19.776611328125, 20.744140625, 21.711669921875, 22.67919921875, 23.646728515625, 24.6142578125, 25.581787109375, 26.54931640625, 27.516845703125, 28.484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 19.0, 24.0, 45.0, 93.0, 182.0, 403.0, 956.0, 2369.0, 7243.0, 27143.0, 188131.0, 733339.0, 66652.0, 14732.0, 4357.0, 1617.0, 623.0, 307.0, 147.0, 56.0, 36.0, 24.0, 20.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.4459228515625, -8.157470703125, -7.8690185546875, -7.58056640625, -7.2921142578125, -7.003662109375, -6.7152099609375, -6.4267578125, -6.1383056640625, -5.849853515625, -5.5614013671875, -5.27294921875, -4.9844970703125, -4.696044921875, -4.4075927734375, -4.119140625, -3.8306884765625, -3.542236328125, -3.2537841796875, -2.96533203125, -2.6768798828125, -2.388427734375, -2.0999755859375, -1.8115234375, -1.5230712890625, -1.234619140625, -0.9461669921875, -0.65771484375, -0.3692626953125, -0.080810546875, 0.2076416015625, 0.49609375, 0.7845458984375, 1.072998046875, 1.3614501953125, 1.64990234375, 1.9383544921875, 2.226806640625, 2.5152587890625, 2.8037109375, 3.0921630859375, 3.380615234375, 3.6690673828125, 3.95751953125, 4.2459716796875, 4.534423828125, 4.8228759765625, 5.111328125, 5.3997802734375, 5.688232421875, 5.9766845703125, 6.26513671875, 6.5535888671875, 6.842041015625, 7.1304931640625, 7.4189453125, 7.7073974609375, 7.995849609375, 8.2843017578125, 8.57275390625, 8.8612060546875, 9.149658203125, 9.4381103515625, 9.7265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 3.0, 6.0, 12.0, 9.0, 8.0, 12.0, 18.0, 26.0, 42.0, 113.0, 280.0, 258.0, 60.0, 36.0, 17.0, 23.0, 11.0, 18.0, 13.0, 6.0, 4.0, 8.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0017900466918945312, -0.0017439723014831543, -0.0016978979110717773, -0.0016518235206604004, -0.0016057491302490234, -0.0015596747398376465, -0.0015136003494262695, -0.0014675259590148926, -0.0014214515686035156, -0.0013753771781921387, -0.0013293027877807617, -0.0012832283973693848, -0.0012371540069580078, -0.0011910796165466309, -0.001145005226135254, -0.001098930835723877, -0.0010528564453125, -0.001006782054901123, -0.0009607076644897461, -0.0009146332740783691, -0.0008685588836669922, -0.0008224844932556152, -0.0007764101028442383, -0.0007303357124328613, -0.0006842613220214844, -0.0006381869316101074, -0.0005921125411987305, -0.0005460381507873535, -0.0004999637603759766, -0.0004538893699645996, -0.00040781497955322266, -0.0003617405891418457, -0.00031566619873046875, -0.0002695918083190918, -0.00022351741790771484, -0.0001774430274963379, -0.00013136863708496094, -8.529424667358398e-05, -3.921985626220703e-05, 6.854534149169922e-06, 5.2928924560546875e-05, 9.900331497192383e-05, 0.00014507770538330078, 0.00019115209579467773, 0.0002372264862060547, 0.00028330087661743164, 0.0003293752670288086, 0.00037544965744018555, 0.0004215240478515625, 0.00046759843826293945, 0.0005136728286743164, 0.0005597472190856934, 0.0006058216094970703, 0.0006518959999084473, 0.0006979703903198242, 0.0007440447807312012, 0.0007901191711425781, 0.0008361935615539551, 0.000882267951965332, 0.000928342342376709, 0.0009744167327880859, 0.0010204911231994629, 0.0010665655136108398, 0.0011126399040222168, 0.0011587142944335938]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 12.0, 15.0, 30.0, 66.0, 111.0, 218.0, 467.0, 1398.0, 4481.0, 19736.0, 306630.0, 680548.0, 26445.0, 5707.0, 1624.0, 552.0, 236.0, 112.0, 61.0, 45.0, 23.0, 12.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7734375, -11.3040771484375, -10.834716796875, -10.3653564453125, -9.89599609375, -9.4266357421875, -8.957275390625, -8.4879150390625, -8.0185546875, -7.5491943359375, -7.079833984375, -6.6104736328125, -6.14111328125, -5.6717529296875, -5.202392578125, -4.7330322265625, -4.263671875, -3.7943115234375, -3.324951171875, -2.8555908203125, -2.38623046875, -1.9168701171875, -1.447509765625, -0.9781494140625, -0.5087890625, -0.0394287109375, 0.429931640625, 0.8992919921875, 1.36865234375, 1.8380126953125, 2.307373046875, 2.7767333984375, 3.24609375, 3.7154541015625, 4.184814453125, 4.6541748046875, 5.12353515625, 5.5928955078125, 6.062255859375, 6.5316162109375, 7.0009765625, 7.4703369140625, 7.939697265625, 8.4090576171875, 8.87841796875, 9.3477783203125, 9.817138671875, 10.2864990234375, 10.755859375, 11.2252197265625, 11.694580078125, 12.1639404296875, 12.63330078125, 13.1026611328125, 13.572021484375, 14.0413818359375, 14.5107421875, 14.9801025390625, 15.449462890625, 15.9188232421875, 16.38818359375, 16.8575439453125, 17.326904296875, 17.7962646484375, 18.265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 4.0, 3.0, 2.0, 4.0, 7.0, 6.0, 5.0, 11.0, 13.0, 26.0, 36.0, 43.0, 150.0, 301.0, 210.0, 71.0, 39.0, 20.0, 9.0, 10.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1015625, -11.7193603515625, -11.337158203125, -10.9549560546875, -10.57275390625, -10.1905517578125, -9.808349609375, -9.4261474609375, -9.0439453125, -8.6617431640625, -8.279541015625, -7.8973388671875, -7.51513671875, -7.1329345703125, -6.750732421875, -6.3685302734375, -5.986328125, -5.6041259765625, -5.221923828125, -4.8397216796875, -4.45751953125, -4.0753173828125, -3.693115234375, -3.3109130859375, -2.9287109375, -2.5465087890625, -2.164306640625, -1.7821044921875, -1.39990234375, -1.0177001953125, -0.635498046875, -0.2532958984375, 0.12890625, 0.5111083984375, 0.893310546875, 1.2755126953125, 1.65771484375, 2.0399169921875, 2.422119140625, 2.8043212890625, 3.1865234375, 3.5687255859375, 3.950927734375, 4.3331298828125, 4.71533203125, 5.0975341796875, 5.479736328125, 5.8619384765625, 6.244140625, 6.6263427734375, 7.008544921875, 7.3907470703125, 7.77294921875, 8.1551513671875, 8.537353515625, 8.9195556640625, 9.3017578125, 9.6839599609375, 10.066162109375, 10.4483642578125, 10.83056640625, 11.2127685546875, 11.594970703125, 11.9771728515625, 12.359375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 10.0, 20.0, 49.0, 120.0, 231.0, 274.0, 173.0, 82.0, 28.0, 7.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.8819580078125, -153.81893920898438, -147.75592041015625, -141.69290161132812, -135.62986755371094, -129.5668487548828, -123.50382995605469, -117.44081115722656, -111.37779235839844, -105.31477355957031, -99.25174713134766, -93.18872833251953, -87.1257095336914, -81.06268310546875, -74.99966430664062, -68.9366455078125, -62.873619079589844, -56.81059646606445, -50.74757766723633, -44.68455505371094, -38.62153625488281, -32.55851364135742, -26.49549102783203, -20.432472229003906, -14.369449615478516, -8.306428909301758, -2.2434072494506836, 3.8196144104003906, 9.882635116577148, 15.945655822753906, 22.008678436279297, 28.071697235107422, 34.13471984863281, 40.1977424621582, 46.26076126098633, 52.32378387451172, 58.386802673339844, 64.4498291015625, 70.51284790039062, 76.57586669921875, 82.63888549804688, 88.701904296875, 94.76493072509766, 100.82794952392578, 106.8909683227539, 112.95399475097656, 119.01701354980469, 125.08003234863281, 131.14306640625, 137.20608520507812, 143.26910400390625, 149.33212280273438, 155.39515686035156, 161.4581756591797, 167.5211944580078, 173.58421325683594, 179.64723205566406, 185.7102508544922, 191.7732696533203, 197.8363037109375, 203.89932250976562, 209.96234130859375, 216.02536010742188, 222.08837890625, 228.15139770507812]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 3.0, 9.0, 6.0, 17.0, 12.0, 14.0, 11.0, 17.0, 22.0, 24.0, 24.0, 32.0, 30.0, 28.0, 39.0, 32.0, 44.0, 49.0, 50.0, 41.0, 33.0, 53.0, 45.0, 34.0, 27.0, 28.0, 24.0, 40.0, 33.0, 29.0, 24.0, 20.0, 21.0, 22.0, 7.0, 14.0, 10.0, 4.0, 8.0, 2.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-78.2430419921875, -75.99758911132812, -73.75213623046875, -71.50668334960938, -69.26123046875, -67.01577758789062, -64.77032470703125, -62.524871826171875, -60.2794189453125, -58.033966064453125, -55.78851318359375, -53.543060302734375, -51.297607421875, -49.052154541015625, -46.80670166015625, -44.561248779296875, -42.3157958984375, -40.070343017578125, -37.82489013671875, -35.579437255859375, -33.333984375, -31.088531494140625, -28.84307861328125, -26.597625732421875, -24.3521728515625, -22.106719970703125, -19.86126708984375, -17.615814208984375, -15.370361328125, -13.124908447265625, -10.87945556640625, -8.634002685546875, -6.3885498046875, -4.143096923828125, -1.89764404296875, 0.347808837890625, 2.59326171875, 4.838714599609375, 7.08416748046875, 9.329620361328125, 11.5750732421875, 13.820526123046875, 16.06597900390625, 18.311431884765625, 20.556884765625, 22.802337646484375, 25.04779052734375, 27.293243408203125, 29.5386962890625, 31.784149169921875, 34.02960205078125, 36.275054931640625, 38.5205078125, 40.765960693359375, 43.01141357421875, 45.256866455078125, 47.5023193359375, 49.747772216796875, 51.99322509765625, 54.238677978515625, 56.484130859375, 58.729583740234375, 60.97503662109375, 63.220489501953125, 65.4659423828125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 9.0, 12.0, 14.0, 18.0, 19.0, 34.0, 52.0, 55.0, 73.0, 162.0, 211.0, 402.0, 644.0, 1358.0, 2710.0, 6343.0, 17738.0, 77828.0, 3394712.0, 621349.0, 47951.0, 12947.0, 5011.0, 2208.0, 1032.0, 573.0, 315.0, 183.0, 105.0, 58.0, 38.0, 35.0, 23.0, 10.0, 8.0, 9.0, 4.0, 5.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-31.453125, -30.599853515625, -29.74658203125, -28.893310546875, -28.0400390625, -27.186767578125, -26.33349609375, -25.480224609375, -24.626953125, -23.773681640625, -22.92041015625, -22.067138671875, -21.2138671875, -20.360595703125, -19.50732421875, -18.654052734375, -17.80078125, -16.947509765625, -16.09423828125, -15.240966796875, -14.3876953125, -13.534423828125, -12.68115234375, -11.827880859375, -10.974609375, -10.121337890625, -9.26806640625, -8.414794921875, -7.5615234375, -6.708251953125, -5.85498046875, -5.001708984375, -4.1484375, -3.295166015625, -2.44189453125, -1.588623046875, -0.7353515625, 0.117919921875, 0.97119140625, 1.824462890625, 2.677734375, 3.531005859375, 4.38427734375, 5.237548828125, 6.0908203125, 6.944091796875, 7.79736328125, 8.650634765625, 9.50390625, 10.357177734375, 11.21044921875, 12.063720703125, 12.9169921875, 13.770263671875, 14.62353515625, 15.476806640625, 16.330078125, 17.183349609375, 18.03662109375, 18.889892578125, 19.7431640625, 20.596435546875, 21.44970703125, 22.302978515625, 23.15625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 9.0, 14.0, 10.0, 16.0, 31.0, 50.0, 50.0, 74.0, 88.0, 93.0, 111.0, 99.0, 91.0, 71.0, 57.0, 52.0, 36.0, 24.0, 11.0, 16.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.41552734375, -9.1513671875, -8.88720703125, -8.623046875, -8.35888671875, -8.0947265625, -7.83056640625, -7.56640625, -7.30224609375, -7.0380859375, -6.77392578125, -6.509765625, -6.24560546875, -5.9814453125, -5.71728515625, -5.453125, -5.18896484375, -4.9248046875, -4.66064453125, -4.396484375, -4.13232421875, -3.8681640625, -3.60400390625, -3.33984375, -3.07568359375, -2.8115234375, -2.54736328125, -2.283203125, -2.01904296875, -1.7548828125, -1.49072265625, -1.2265625, -0.96240234375, -0.6982421875, -0.43408203125, -0.169921875, 0.09423828125, 0.3583984375, 0.62255859375, 0.88671875, 1.15087890625, 1.4150390625, 1.67919921875, 1.943359375, 2.20751953125, 2.4716796875, 2.73583984375, 3.0, 3.26416015625, 3.5283203125, 3.79248046875, 4.056640625, 4.32080078125, 4.5849609375, 4.84912109375, 5.11328125, 5.37744140625, 5.6416015625, 5.90576171875, 6.169921875, 6.43408203125, 6.6982421875, 6.96240234375, 7.2265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 10.0, 20.0, 31.0, 44.0, 80.0, 136.0, 341.0, 991.0, 3103.0, 15564.0, 186430.0, 3889565.0, 84166.0, 10248.0, 2289.0, 694.0, 267.0, 129.0, 59.0, 38.0, 23.0, 13.0, 16.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.875, -39.751220703125, -38.62744140625, -37.503662109375, -36.3798828125, -35.256103515625, -34.13232421875, -33.008544921875, -31.884765625, -30.760986328125, -29.63720703125, -28.513427734375, -27.3896484375, -26.265869140625, -25.14208984375, -24.018310546875, -22.89453125, -21.770751953125, -20.64697265625, -19.523193359375, -18.3994140625, -17.275634765625, -16.15185546875, -15.028076171875, -13.904296875, -12.780517578125, -11.65673828125, -10.532958984375, -9.4091796875, -8.285400390625, -7.16162109375, -6.037841796875, -4.9140625, -3.790283203125, -2.66650390625, -1.542724609375, -0.4189453125, 0.704833984375, 1.82861328125, 2.952392578125, 4.076171875, 5.199951171875, 6.32373046875, 7.447509765625, 8.5712890625, 9.695068359375, 10.81884765625, 11.942626953125, 13.06640625, 14.190185546875, 15.31396484375, 16.437744140625, 17.5615234375, 18.685302734375, 19.80908203125, 20.932861328125, 22.056640625, 23.180419921875, 24.30419921875, 25.427978515625, 26.5517578125, 27.675537109375, 28.79931640625, 29.923095703125, 31.046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 3.0, 11.0, 20.0, 41.0, 58.0, 107.0, 337.0, 2297.0, 754.0, 206.0, 84.0, 48.0, 32.0, 25.0, 11.0, 16.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.6689453125, -16.259765625, -15.8505859375, -15.44140625, -15.0322265625, -14.623046875, -14.2138671875, -13.8046875, -13.3955078125, -12.986328125, -12.5771484375, -12.16796875, -11.7587890625, -11.349609375, -10.9404296875, -10.53125, -10.1220703125, -9.712890625, -9.3037109375, -8.89453125, -8.4853515625, -8.076171875, -7.6669921875, -7.2578125, -6.8486328125, -6.439453125, -6.0302734375, -5.62109375, -5.2119140625, -4.802734375, -4.3935546875, -3.984375, -3.5751953125, -3.166015625, -2.7568359375, -2.34765625, -1.9384765625, -1.529296875, -1.1201171875, -0.7109375, -0.3017578125, 0.107421875, 0.5166015625, 0.92578125, 1.3349609375, 1.744140625, 2.1533203125, 2.5625, 2.9716796875, 3.380859375, 3.7900390625, 4.19921875, 4.6083984375, 5.017578125, 5.4267578125, 5.8359375, 6.2451171875, 6.654296875, 7.0634765625, 7.47265625, 7.8818359375, 8.291015625, 8.7001953125, 9.109375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 13.0, 88.0, 437.0, 395.0, 57.0, 12.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.64415740966797, -61.918033599853516, -56.19190979003906, -50.465789794921875, -44.739662170410156, -39.01354217529297, -33.287418365478516, -27.561294555664062, -21.83517074584961, -16.109046936035156, -10.38292407989502, -4.656801223754883, 1.0693225860595703, 6.795446395874023, 12.521568298339844, 18.247692108154297, 23.97381591796875, 29.699939727783203, 35.426063537597656, 41.152183532714844, 46.87831115722656, 52.60443115234375, 58.3305549621582, 64.05667877197266, 69.78280639648438, 75.50892639160156, 81.23505401611328, 86.96117401123047, 92.68730163574219, 98.41342163085938, 104.13954162597656, 109.86566925048828, 115.59178161621094, 121.31790161132812, 127.04402923583984, 132.77015686035156, 138.49627685546875, 144.22239685058594, 149.94851684570312, 155.67465209960938, 161.40077209472656, 167.12689208984375, 172.85301208496094, 178.5791473388672, 184.30526733398438, 190.03138732910156, 195.75750732421875, 201.483642578125, 207.20974731445312, 212.9358673095703, 218.6619873046875, 224.38812255859375, 230.11424255371094, 235.84036254882812, 241.5664825439453, 247.2926025390625, 253.01873779296875, 258.744873046875, 264.4709777832031, 270.1971130371094, 275.9232177734375, 281.64935302734375, 287.37548828125, 293.1015930175781, 298.8277282714844]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 6.0, 12.0, 20.0, 23.0, 23.0, 33.0, 25.0, 41.0, 46.0, 43.0, 47.0, 46.0, 52.0, 59.0, 62.0, 60.0, 61.0, 58.0, 42.0, 33.0, 32.0, 26.0, 31.0, 24.0, 24.0, 15.0, 8.0, 9.0, 9.0, 6.0, 3.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.452573776245117, -29.49118995666504, -28.52980613708496, -27.568422317504883, -26.607038497924805, -25.64565658569336, -24.68427276611328, -23.722888946533203, -22.761505126953125, -21.800121307373047, -20.83873748779297, -19.87735366821289, -18.915969848632812, -17.954586029052734, -16.993202209472656, -16.03182029724121, -15.070435523986816, -14.109051704406738, -13.14766788482666, -12.186285018920898, -11.22490119934082, -10.263517379760742, -9.302133560180664, -8.340749740600586, -7.379366397857666, -6.417982578277588, -5.456599235534668, -4.49521541595459, -3.533831834793091, -2.572448253631592, -1.6110644340515137, -0.6496810913085938, 0.3117027282714844, 1.2730863094329834, 2.2344698905944824, 3.1958537101745605, 4.1572370529174805, 5.118620872497559, 6.080004692077637, 7.041388034820557, 8.002771377563477, 8.964155197143555, 9.925539016723633, 10.886922836303711, 11.848305702209473, 12.80968952178955, 13.771073341369629, 14.73245620727539, 15.693840980529785, 16.655223846435547, 17.616607666015625, 18.577991485595703, 19.53937530517578, 20.50075912475586, 21.462142944335938, 22.423526763916016, 23.384910583496094, 24.346294403076172, 25.30767822265625, 26.269062042236328, 27.230445861816406, 28.191829681396484, 29.153213500976562, 30.114595413208008, 31.075979232788086]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 17.0, 22.0, 30.0, 58.0, 86.0, 177.0, 375.0, 851.0, 2119.0, 6511.0, 28717.0, 154673.0, 575456.0, 224550.0, 41472.0, 8938.0, 2516.0, 1041.0, 436.0, 225.0, 115.0, 66.0, 37.0, 22.0, 15.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.140625, -22.359130859375, -21.57763671875, -20.796142578125, -20.0146484375, -19.233154296875, -18.45166015625, -17.670166015625, -16.888671875, -16.107177734375, -15.32568359375, -14.544189453125, -13.7626953125, -12.981201171875, -12.19970703125, -11.418212890625, -10.63671875, -9.855224609375, -9.07373046875, -8.292236328125, -7.5107421875, -6.729248046875, -5.94775390625, -5.166259765625, -4.384765625, -3.603271484375, -2.82177734375, -2.040283203125, -1.2587890625, -0.477294921875, 0.30419921875, 1.085693359375, 1.8671875, 2.648681640625, 3.43017578125, 4.211669921875, 4.9931640625, 5.774658203125, 6.55615234375, 7.337646484375, 8.119140625, 8.900634765625, 9.68212890625, 10.463623046875, 11.2451171875, 12.026611328125, 12.80810546875, 13.589599609375, 14.37109375, 15.152587890625, 15.93408203125, 16.715576171875, 17.4970703125, 18.278564453125, 19.06005859375, 19.841552734375, 20.623046875, 21.404541015625, 22.18603515625, 22.967529296875, 23.7490234375, 24.530517578125, 25.31201171875, 26.093505859375, 26.875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 12.0, 17.0, 18.0, 32.0, 55.0, 71.0, 69.0, 102.0, 109.0, 99.0, 96.0, 77.0, 86.0, 43.0, 41.0, 33.0, 14.0, 10.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59375, -9.32061767578125, -9.0474853515625, -8.77435302734375, -8.501220703125, -8.22808837890625, -7.9549560546875, -7.68182373046875, -7.40869140625, -7.13555908203125, -6.8624267578125, -6.58929443359375, -6.316162109375, -6.04302978515625, -5.7698974609375, -5.49676513671875, -5.2236328125, -4.95050048828125, -4.6773681640625, -4.40423583984375, -4.131103515625, -3.85797119140625, -3.5848388671875, -3.31170654296875, -3.03857421875, -2.76544189453125, -2.4923095703125, -2.21917724609375, -1.946044921875, -1.67291259765625, -1.3997802734375, -1.12664794921875, -0.853515625, -0.58038330078125, -0.3072509765625, -0.03411865234375, 0.239013671875, 0.51214599609375, 0.7852783203125, 1.05841064453125, 1.33154296875, 1.60467529296875, 1.8778076171875, 2.15093994140625, 2.424072265625, 2.69720458984375, 2.9703369140625, 3.24346923828125, 3.5166015625, 3.78973388671875, 4.0628662109375, 4.33599853515625, 4.609130859375, 4.88226318359375, 5.1553955078125, 5.42852783203125, 5.70166015625, 5.97479248046875, 6.2479248046875, 6.52105712890625, 6.794189453125, 7.06732177734375, 7.3404541015625, 7.61358642578125, 7.88671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 5.0, 3.0, 9.0, 4.0, 6.0, 10.0, 9.0, 28.0, 20.0, 24.0, 39.0, 47.0, 68.0, 78.0, 91.0, 143.0, 175.0, 322.0, 491.0, 822.0, 1713.0, 4919.0, 22454.0, 148305.0, 650030.0, 181995.0, 26591.0, 5726.0, 1916.0, 900.0, 482.0, 325.0, 177.0, 148.0, 111.0, 98.0, 68.0, 44.0, 35.0, 23.0, 21.0, 10.0, 11.0, 10.0, 9.0, 7.0, 7.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0], "bins": [-22.578125, -21.884521484375, -21.19091796875, -20.497314453125, -19.8037109375, -19.110107421875, -18.41650390625, -17.722900390625, -17.029296875, -16.335693359375, -15.64208984375, -14.948486328125, -14.2548828125, -13.561279296875, -12.86767578125, -12.174072265625, -11.48046875, -10.786865234375, -10.09326171875, -9.399658203125, -8.7060546875, -8.012451171875, -7.31884765625, -6.625244140625, -5.931640625, -5.238037109375, -4.54443359375, -3.850830078125, -3.1572265625, -2.463623046875, -1.77001953125, -1.076416015625, -0.3828125, 0.310791015625, 1.00439453125, 1.697998046875, 2.3916015625, 3.085205078125, 3.77880859375, 4.472412109375, 5.166015625, 5.859619140625, 6.55322265625, 7.246826171875, 7.9404296875, 8.634033203125, 9.32763671875, 10.021240234375, 10.71484375, 11.408447265625, 12.10205078125, 12.795654296875, 13.4892578125, 14.182861328125, 14.87646484375, 15.570068359375, 16.263671875, 16.957275390625, 17.65087890625, 18.344482421875, 19.0380859375, 19.731689453125, 20.42529296875, 21.118896484375, 21.8125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 10.0, 5.0, 5.0, 7.0, 15.0, 23.0, 23.0, 24.0, 33.0, 43.0, 40.0, 40.0, 53.0, 42.0, 57.0, 65.0, 55.0, 51.0, 56.0, 59.0, 45.0, 44.0, 34.0, 33.0, 27.0, 22.0, 15.0, 11.0, 13.0, 9.0, 9.0, 3.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.75, -21.051025390625, -20.35205078125, -19.653076171875, -18.9541015625, -18.255126953125, -17.55615234375, -16.857177734375, -16.158203125, -15.459228515625, -14.76025390625, -14.061279296875, -13.3623046875, -12.663330078125, -11.96435546875, -11.265380859375, -10.56640625, -9.867431640625, -9.16845703125, -8.469482421875, -7.7705078125, -7.071533203125, -6.37255859375, -5.673583984375, -4.974609375, -4.275634765625, -3.57666015625, -2.877685546875, -2.1787109375, -1.479736328125, -0.78076171875, -0.081787109375, 0.6171875, 1.316162109375, 2.01513671875, 2.714111328125, 3.4130859375, 4.112060546875, 4.81103515625, 5.510009765625, 6.208984375, 6.907958984375, 7.60693359375, 8.305908203125, 9.0048828125, 9.703857421875, 10.40283203125, 11.101806640625, 11.80078125, 12.499755859375, 13.19873046875, 13.897705078125, 14.5966796875, 15.295654296875, 15.99462890625, 16.693603515625, 17.392578125, 18.091552734375, 18.79052734375, 19.489501953125, 20.1884765625, 20.887451171875, 21.58642578125, 22.285400390625, 22.984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 3.0, 5.0, 4.0, 17.0, 21.0, 21.0, 46.0, 65.0, 94.0, 159.0, 252.0, 485.0, 856.0, 1954.0, 4630.0, 12498.0, 38193.0, 140517.0, 604717.0, 173925.0, 46013.0, 14475.0, 5315.0, 2087.0, 939.0, 487.0, 284.0, 175.0, 106.0, 64.0, 39.0, 36.0, 25.0, 14.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.03125, -8.73583984375, -8.4404296875, -8.14501953125, -7.849609375, -7.55419921875, -7.2587890625, -6.96337890625, -6.66796875, -6.37255859375, -6.0771484375, -5.78173828125, -5.486328125, -5.19091796875, -4.8955078125, -4.60009765625, -4.3046875, -4.00927734375, -3.7138671875, -3.41845703125, -3.123046875, -2.82763671875, -2.5322265625, -2.23681640625, -1.94140625, -1.64599609375, -1.3505859375, -1.05517578125, -0.759765625, -0.46435546875, -0.1689453125, 0.12646484375, 0.421875, 0.71728515625, 1.0126953125, 1.30810546875, 1.603515625, 1.89892578125, 2.1943359375, 2.48974609375, 2.78515625, 3.08056640625, 3.3759765625, 3.67138671875, 3.966796875, 4.26220703125, 4.5576171875, 4.85302734375, 5.1484375, 5.44384765625, 5.7392578125, 6.03466796875, 6.330078125, 6.62548828125, 6.9208984375, 7.21630859375, 7.51171875, 7.80712890625, 8.1025390625, 8.39794921875, 8.693359375, 8.98876953125, 9.2841796875, 9.57958984375, 9.875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 2.0, 4.0, 5.0, 8.0, 9.0, 12.0, 11.0, 13.0, 21.0, 19.0, 24.0, 30.0, 49.0, 39.0, 49.0, 92.0, 147.0, 107.0, 64.0, 52.0, 34.0, 40.0, 19.0, 25.0, 13.0, 20.0, 24.0, 11.0, 12.0, 8.0, 10.0, 4.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0009217262268066406, -0.0008917376399040222, -0.0008617490530014038, -0.0008317604660987854, -0.000801771879196167, -0.0007717832922935486, -0.0007417947053909302, -0.0007118061184883118, -0.0006818175315856934, -0.000651828944683075, -0.0006218403577804565, -0.0005918517708778381, -0.0005618631839752197, -0.0005318745970726013, -0.0005018860101699829, -0.0004718974232673645, -0.0004419088363647461, -0.0004119202494621277, -0.0003819316625595093, -0.00035194307565689087, -0.00032195448875427246, -0.00029196590185165405, -0.00026197731494903564, -0.00023198872804641724, -0.00020200014114379883, -0.00017201155424118042, -0.000142022967338562, -0.0001120343804359436, -8.20457935333252e-05, -5.205720663070679e-05, -2.206861972808838e-05, 7.91996717453003e-06, 3.790855407714844e-05, 6.789714097976685e-05, 9.788572788238525e-05, 0.00012787431478500366, 0.00015786290168762207, 0.00018785148859024048, 0.0002178400754928589, 0.0002478286623954773, 0.0002778172492980957, 0.0003078058362007141, 0.0003377944231033325, 0.00036778301000595093, 0.00039777159690856934, 0.00042776018381118774, 0.00045774877071380615, 0.00048773735761642456, 0.000517725944519043, 0.0005477145314216614, 0.0005777031183242798, 0.0006076917052268982, 0.0006376802921295166, 0.000667668879032135, 0.0006976574659347534, 0.0007276460528373718, 0.0007576346397399902, 0.0007876232266426086, 0.000817611813545227, 0.0008476004004478455, 0.0008775889873504639, 0.0009075775742530823, 0.0009375661611557007, 0.0009675547480583191, 0.0009975433349609375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 9.0, 5.0, 16.0, 17.0, 20.0, 26.0, 42.0, 85.0, 114.0, 139.0, 318.0, 522.0, 1048.0, 2383.0, 7279.0, 29808.0, 187067.0, 701198.0, 92632.0, 17441.0, 4760.0, 1709.0, 837.0, 406.0, 232.0, 127.0, 84.0, 52.0, 44.0, 33.0, 23.0, 24.0, 16.0, 10.0, 8.0, 6.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.34375, -14.869140625, -14.39453125, -13.919921875, -13.4453125, -12.970703125, -12.49609375, -12.021484375, -11.546875, -11.072265625, -10.59765625, -10.123046875, -9.6484375, -9.173828125, -8.69921875, -8.224609375, -7.75, -7.275390625, -6.80078125, -6.326171875, -5.8515625, -5.376953125, -4.90234375, -4.427734375, -3.953125, -3.478515625, -3.00390625, -2.529296875, -2.0546875, -1.580078125, -1.10546875, -0.630859375, -0.15625, 0.318359375, 0.79296875, 1.267578125, 1.7421875, 2.216796875, 2.69140625, 3.166015625, 3.640625, 4.115234375, 4.58984375, 5.064453125, 5.5390625, 6.013671875, 6.48828125, 6.962890625, 7.4375, 7.912109375, 8.38671875, 8.861328125, 9.3359375, 9.810546875, 10.28515625, 10.759765625, 11.234375, 11.708984375, 12.18359375, 12.658203125, 13.1328125, 13.607421875, 14.08203125, 14.556640625, 15.03125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 13.0, 17.0, 13.0, 21.0, 41.0, 38.0, 37.0, 97.0, 115.0, 147.0, 129.0, 76.0, 52.0, 36.0, 33.0, 22.0, 25.0, 11.0, 7.0, 11.0, 7.0, 3.0, 8.0, 4.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.90625, -14.4769287109375, -14.047607421875, -13.6182861328125, -13.18896484375, -12.7596435546875, -12.330322265625, -11.9010009765625, -11.4716796875, -11.0423583984375, -10.613037109375, -10.1837158203125, -9.75439453125, -9.3250732421875, -8.895751953125, -8.4664306640625, -8.037109375, -7.6077880859375, -7.178466796875, -6.7491455078125, -6.31982421875, -5.8905029296875, -5.461181640625, -5.0318603515625, -4.6025390625, -4.1732177734375, -3.743896484375, -3.3145751953125, -2.88525390625, -2.4559326171875, -2.026611328125, -1.5972900390625, -1.16796875, -0.7386474609375, -0.309326171875, 0.1199951171875, 0.54931640625, 0.9786376953125, 1.407958984375, 1.8372802734375, 2.2666015625, 2.6959228515625, 3.125244140625, 3.5545654296875, 3.98388671875, 4.4132080078125, 4.842529296875, 5.2718505859375, 5.701171875, 6.1304931640625, 6.559814453125, 6.9891357421875, 7.41845703125, 7.8477783203125, 8.277099609375, 8.7064208984375, 9.1357421875, 9.5650634765625, 9.994384765625, 10.4237060546875, 10.85302734375, 11.2823486328125, 11.711669921875, 12.1409912109375, 12.5703125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 12.0, 33.0, 80.0, 153.0, 242.0, 227.0, 138.0, 74.0, 21.0, 13.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.99069213867188, -136.34861755371094, -128.70655822753906, -121.06448364257812, -113.42241668701172, -105.78034973144531, -98.13827514648438, -90.49620819091797, -82.85414123535156, -75.21207427978516, -67.57000732421875, -59.92793273925781, -52.285865783691406, -44.643798828125, -37.00172805786133, -29.359657287597656, -21.71759033203125, -14.075521469116211, -6.433452606201172, 1.2086162567138672, 8.850685119628906, 16.492752075195312, 24.134822845458984, 31.776893615722656, 39.41896057128906, 47.06102752685547, 54.70309829711914, 62.34516906738281, 69.98723602294922, 77.62930297851562, 85.27137756347656, 92.91344451904297, 100.55551147460938, 108.19757843017578, 115.83964538574219, 123.48171997070312, 131.123779296875, 138.76585388183594, 146.40792846679688, 154.04998779296875, 161.6920623779297, 169.33413696289062, 176.9761962890625, 184.61827087402344, 192.26034545898438, 199.90240478515625, 207.5444793701172, 215.18655395507812, 222.82861328125, 230.47068786621094, 238.1127471923828, 245.75482177734375, 253.39688110351562, 261.0389404296875, 268.6810302734375, 276.3230895996094, 283.96514892578125, 291.6072082519531, 299.2492980957031, 306.891357421875, 314.5334167480469, 322.17547607421875, 329.81756591796875, 337.4596252441406, 345.1017150878906]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 9.0, 9.0, 7.0, 6.0, 16.0, 18.0, 22.0, 23.0, 23.0, 35.0, 19.0, 27.0, 44.0, 29.0, 25.0, 40.0, 38.0, 39.0, 50.0, 42.0, 37.0, 45.0, 45.0, 29.0, 41.0, 35.0, 34.0, 25.0, 20.0, 28.0, 21.0, 17.0, 17.0, 23.0, 14.0, 9.0, 12.0, 5.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-94.14822387695312, -91.14797973632812, -88.1477279663086, -85.14747619628906, -82.14723205566406, -79.14698791503906, -76.14673614501953, -73.146484375, -70.146240234375, -67.14599609375, -64.14574432373047, -61.1454963684082, -58.14524841308594, -55.14500045776367, -52.144752502441406, -49.14450454711914, -46.144256591796875, -43.14400863647461, -40.143760681152344, -37.14351272583008, -34.14326477050781, -31.143016815185547, -28.14276885986328, -25.142520904541016, -22.14227294921875, -19.142024993896484, -16.14177703857422, -13.141529083251953, -10.141281127929688, -7.141033172607422, -4.140785217285156, -1.1405372619628906, 1.8597030639648438, 4.859951019287109, 7.860198974609375, 10.86044692993164, 13.860694885253906, 16.860942840576172, 19.861190795898438, 22.861438751220703, 25.86168670654297, 28.861934661865234, 31.8621826171875, 34.862430572509766, 37.86267852783203, 40.8629264831543, 43.86317443847656, 46.86342239379883, 49.863670349121094, 52.86391830444336, 55.864166259765625, 58.86441421508789, 61.864662170410156, 64.86491394042969, 67.86515808105469, 70.86540222167969, 73.86565399169922, 76.86590576171875, 79.86614990234375, 82.86639404296875, 85.86664581298828, 88.86689758300781, 91.86714172363281, 94.86738586425781, 97.86763763427734]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 2.0, 9.0, 3.0, 5.0, 14.0, 14.0, 16.0, 23.0, 28.0, 31.0, 45.0, 66.0, 116.0, 191.0, 303.0, 497.0, 910.0, 1828.0, 3829.0, 9445.0, 29744.0, 159041.0, 3549306.0, 369913.0, 46039.0, 13213.0, 5016.0, 2170.0, 1075.0, 544.0, 320.0, 172.0, 124.0, 62.0, 50.0, 27.0, 17.0, 25.0, 17.0, 10.0, 7.0, 7.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96875, -18.2294921875, -17.490234375, -16.7509765625, -16.01171875, -15.2724609375, -14.533203125, -13.7939453125, -13.0546875, -12.3154296875, -11.576171875, -10.8369140625, -10.09765625, -9.3583984375, -8.619140625, -7.8798828125, -7.140625, -6.4013671875, -5.662109375, -4.9228515625, -4.18359375, -3.4443359375, -2.705078125, -1.9658203125, -1.2265625, -0.4873046875, 0.251953125, 0.9912109375, 1.73046875, 2.4697265625, 3.208984375, 3.9482421875, 4.6875, 5.4267578125, 6.166015625, 6.9052734375, 7.64453125, 8.3837890625, 9.123046875, 9.8623046875, 10.6015625, 11.3408203125, 12.080078125, 12.8193359375, 13.55859375, 14.2978515625, 15.037109375, 15.7763671875, 16.515625, 17.2548828125, 17.994140625, 18.7333984375, 19.47265625, 20.2119140625, 20.951171875, 21.6904296875, 22.4296875, 23.1689453125, 23.908203125, 24.6474609375, 25.38671875, 26.1259765625, 26.865234375, 27.6044921875, 28.34375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 9.0, 12.0, 17.0, 32.0, 36.0, 35.0, 66.0, 75.0, 76.0, 62.0, 98.0, 94.0, 100.0, 66.0, 52.0, 56.0, 32.0, 28.0, 20.0, 10.0, 9.0, 11.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.1722412109375, -8.906982421875, -8.6417236328125, -8.37646484375, -8.1112060546875, -7.845947265625, -7.5806884765625, -7.3154296875, -7.0501708984375, -6.784912109375, -6.5196533203125, -6.25439453125, -5.9891357421875, -5.723876953125, -5.4586181640625, -5.193359375, -4.9281005859375, -4.662841796875, -4.3975830078125, -4.13232421875, -3.8670654296875, -3.601806640625, -3.3365478515625, -3.0712890625, -2.8060302734375, -2.540771484375, -2.2755126953125, -2.01025390625, -1.7449951171875, -1.479736328125, -1.2144775390625, -0.94921875, -0.6839599609375, -0.418701171875, -0.1534423828125, 0.11181640625, 0.3770751953125, 0.642333984375, 0.9075927734375, 1.1728515625, 1.4381103515625, 1.703369140625, 1.9686279296875, 2.23388671875, 2.4991455078125, 2.764404296875, 3.0296630859375, 3.294921875, 3.5601806640625, 3.825439453125, 4.0906982421875, 4.35595703125, 4.6212158203125, 4.886474609375, 5.1517333984375, 5.4169921875, 5.6822509765625, 5.947509765625, 6.2127685546875, 6.47802734375, 6.7432861328125, 7.008544921875, 7.2738037109375, 7.5390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 13.0, 12.0, 12.0, 34.0, 47.0, 56.0, 70.0, 113.0, 168.0, 361.0, 725.0, 1630.0, 5091.0, 19279.0, 136439.0, 3586944.0, 394177.0, 36543.0, 7981.0, 2507.0, 962.0, 444.0, 227.0, 130.0, 78.0, 58.0, 53.0, 29.0, 28.0, 13.0, 12.0, 13.0, 3.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.921875, -23.115966796875, -22.31005859375, -21.504150390625, -20.6982421875, -19.892333984375, -19.08642578125, -18.280517578125, -17.474609375, -16.668701171875, -15.86279296875, -15.056884765625, -14.2509765625, -13.445068359375, -12.63916015625, -11.833251953125, -11.02734375, -10.221435546875, -9.41552734375, -8.609619140625, -7.8037109375, -6.997802734375, -6.19189453125, -5.385986328125, -4.580078125, -3.774169921875, -2.96826171875, -2.162353515625, -1.3564453125, -0.550537109375, 0.25537109375, 1.061279296875, 1.8671875, 2.673095703125, 3.47900390625, 4.284912109375, 5.0908203125, 5.896728515625, 6.70263671875, 7.508544921875, 8.314453125, 9.120361328125, 9.92626953125, 10.732177734375, 11.5380859375, 12.343994140625, 13.14990234375, 13.955810546875, 14.76171875, 15.567626953125, 16.37353515625, 17.179443359375, 17.9853515625, 18.791259765625, 19.59716796875, 20.403076171875, 21.208984375, 22.014892578125, 22.82080078125, 23.626708984375, 24.4326171875, 25.238525390625, 26.04443359375, 26.850341796875, 27.65625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 4.0, 16.0, 28.0, 40.0, 71.0, 167.0, 453.0, 2278.0, 663.0, 167.0, 78.0, 38.0, 23.0, 13.0, 12.0, 8.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.78125, -25.1898193359375, -24.598388671875, -24.0069580078125, -23.41552734375, -22.8240966796875, -22.232666015625, -21.6412353515625, -21.0498046875, -20.4583740234375, -19.866943359375, -19.2755126953125, -18.68408203125, -18.0926513671875, -17.501220703125, -16.9097900390625, -16.318359375, -15.7269287109375, -15.135498046875, -14.5440673828125, -13.95263671875, -13.3612060546875, -12.769775390625, -12.1783447265625, -11.5869140625, -10.9954833984375, -10.404052734375, -9.8126220703125, -9.22119140625, -8.6297607421875, -8.038330078125, -7.4468994140625, -6.85546875, -6.2640380859375, -5.672607421875, -5.0811767578125, -4.48974609375, -3.8983154296875, -3.306884765625, -2.7154541015625, -2.1240234375, -1.5325927734375, -0.941162109375, -0.3497314453125, 0.24169921875, 0.8331298828125, 1.424560546875, 2.0159912109375, 2.607421875, 3.1988525390625, 3.790283203125, 4.3817138671875, 4.97314453125, 5.5645751953125, 6.156005859375, 6.7474365234375, 7.3388671875, 7.9302978515625, 8.521728515625, 9.1131591796875, 9.70458984375, 10.2960205078125, 10.887451171875, 11.4788818359375, 12.0703125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 14.0, 36.0, 92.0, 233.0, 307.0, 195.0, 65.0, 33.0, 12.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-167.21585083007812, -163.2576904296875, -159.29953002929688, -155.3413543701172, -151.38319396972656, -147.42503356933594, -143.46685791015625, -139.50869750976562, -135.550537109375, -131.59237670898438, -127.63420867919922, -123.67604064941406, -119.71788024902344, -115.75971984863281, -111.80155181884766, -107.8433837890625, -103.88522338867188, -99.92706298828125, -95.9688949584961, -92.01072692871094, -88.05256652832031, -84.09440612792969, -80.13623809814453, -76.17807006835938, -72.21990966796875, -68.26174926757812, -64.30358123779297, -60.34541702270508, -56.38725280761719, -52.4290885925293, -48.470924377441406, -44.512760162353516, -40.554595947265625, -36.596431732177734, -32.638267517089844, -28.680103302001953, -24.721939086914062, -20.763774871826172, -16.80561065673828, -12.84744644165039, -8.8892822265625, -4.931118011474609, -0.9729537963867188, 2.985210418701172, 6.9433746337890625, 10.901538848876953, 14.859703063964844, 18.817867279052734, 22.776031494140625, 26.734195709228516, 30.692359924316406, 34.6505241394043, 38.60868835449219, 42.56685256958008, 46.52501678466797, 50.48318099975586, 54.44134521484375, 58.39950942993164, 62.35767364501953, 66.31584167480469, 70.27400207519531, 74.23216247558594, 78.1903305053711, 82.14849853515625, 86.10665893554688]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 9.0, 5.0, 14.0, 15.0, 18.0, 18.0, 31.0, 42.0, 49.0, 49.0, 70.0, 76.0, 74.0, 72.0, 74.0, 56.0, 77.0, 57.0, 36.0, 45.0, 33.0, 27.0, 15.0, 12.0, 12.0, 7.0, 8.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.215576171875, -62.46308135986328, -60.71058654785156, -58.958091735839844, -57.205596923828125, -55.453102111816406, -53.70060729980469, -51.94811248779297, -50.19561767578125, -48.44312286376953, -46.69062805175781, -44.938133239746094, -43.185638427734375, -41.433143615722656, -39.68064880371094, -37.92815399169922, -36.175655364990234, -34.423160552978516, -32.6706657409668, -30.918170928955078, -29.16567611694336, -27.41318130493164, -25.66068458557129, -23.90818977355957, -22.15569496154785, -20.403200149536133, -18.650705337524414, -16.898208618164062, -15.14571475982666, -13.393219947814941, -11.640724182128906, -9.888229370117188, -8.135734558105469, -6.38323974609375, -4.630744457244873, -2.878249168395996, -1.1257543563842773, 0.6267404556274414, 2.3792362213134766, 4.131731033325195, 5.884225845336914, 7.636720657348633, 9.389215469360352, 11.141711235046387, 12.894206047058105, 14.646700859069824, 16.39919662475586, 18.151691436767578, 19.904186248779297, 21.656681060791016, 23.409175872802734, 25.161670684814453, 26.914165496826172, 28.66666030883789, 30.419157028198242, 32.171653747558594, 33.92414855957031, 35.67664337158203, 37.42913818359375, 39.18163299560547, 40.93412780761719, 42.686622619628906, 44.439117431640625, 46.191612243652344, 47.94410705566406]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 10.0, 8.0, 29.0, 26.0, 44.0, 100.0, 142.0, 230.0, 403.0, 757.0, 1868.0, 5206.0, 17594.0, 73235.0, 317533.0, 451839.0, 135999.0, 30343.0, 8139.0, 2771.0, 1098.0, 530.0, 271.0, 150.0, 82.0, 45.0, 39.0, 21.0, 19.0, 12.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.689208984375, -23.98779296875, -23.286376953125, -22.5849609375, -21.883544921875, -21.18212890625, -20.480712890625, -19.779296875, -19.077880859375, -18.37646484375, -17.675048828125, -16.9736328125, -16.272216796875, -15.57080078125, -14.869384765625, -14.16796875, -13.466552734375, -12.76513671875, -12.063720703125, -11.3623046875, -10.660888671875, -9.95947265625, -9.258056640625, -8.556640625, -7.855224609375, -7.15380859375, -6.452392578125, -5.7509765625, -5.049560546875, -4.34814453125, -3.646728515625, -2.9453125, -2.243896484375, -1.54248046875, -0.841064453125, -0.1396484375, 0.561767578125, 1.26318359375, 1.964599609375, 2.666015625, 3.367431640625, 4.06884765625, 4.770263671875, 5.4716796875, 6.173095703125, 6.87451171875, 7.575927734375, 8.27734375, 8.978759765625, 9.68017578125, 10.381591796875, 11.0830078125, 11.784423828125, 12.48583984375, 13.187255859375, 13.888671875, 14.590087890625, 15.29150390625, 15.992919921875, 16.6943359375, 17.395751953125, 18.09716796875, 18.798583984375, 19.5]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 11.0, 11.0, 16.0, 22.0, 39.0, 53.0, 63.0, 57.0, 80.0, 87.0, 112.0, 89.0, 93.0, 59.0, 61.0, 47.0, 34.0, 34.0, 14.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.75, -10.455078125, -10.16015625, -9.865234375, -9.5703125, -9.275390625, -8.98046875, -8.685546875, -8.390625, -8.095703125, -7.80078125, -7.505859375, -7.2109375, -6.916015625, -6.62109375, -6.326171875, -6.03125, -5.736328125, -5.44140625, -5.146484375, -4.8515625, -4.556640625, -4.26171875, -3.966796875, -3.671875, -3.376953125, -3.08203125, -2.787109375, -2.4921875, -2.197265625, -1.90234375, -1.607421875, -1.3125, -1.017578125, -0.72265625, -0.427734375, -0.1328125, 0.162109375, 0.45703125, 0.751953125, 1.046875, 1.341796875, 1.63671875, 1.931640625, 2.2265625, 2.521484375, 2.81640625, 3.111328125, 3.40625, 3.701171875, 3.99609375, 4.291015625, 4.5859375, 4.880859375, 5.17578125, 5.470703125, 5.765625, 6.060546875, 6.35546875, 6.650390625, 6.9453125, 7.240234375, 7.53515625, 7.830078125, 8.125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 2.0, 10.0, 4.0, 4.0, 10.0, 18.0, 22.0, 23.0, 38.0, 63.0, 68.0, 106.0, 118.0, 141.0, 224.0, 336.0, 583.0, 1010.0, 2349.0, 7855.0, 41842.0, 309969.0, 561998.0, 99374.0, 15063.0, 3719.0, 1380.0, 761.0, 448.0, 256.0, 178.0, 135.0, 137.0, 70.0, 59.0, 49.0, 31.0, 31.0, 22.0, 10.0, 11.0, 8.0, 4.0, 4.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-23.25, -22.426025390625, -21.60205078125, -20.778076171875, -19.9541015625, -19.130126953125, -18.30615234375, -17.482177734375, -16.658203125, -15.834228515625, -15.01025390625, -14.186279296875, -13.3623046875, -12.538330078125, -11.71435546875, -10.890380859375, -10.06640625, -9.242431640625, -8.41845703125, -7.594482421875, -6.7705078125, -5.946533203125, -5.12255859375, -4.298583984375, -3.474609375, -2.650634765625, -1.82666015625, -1.002685546875, -0.1787109375, 0.645263671875, 1.46923828125, 2.293212890625, 3.1171875, 3.941162109375, 4.76513671875, 5.589111328125, 6.4130859375, 7.237060546875, 8.06103515625, 8.885009765625, 9.708984375, 10.532958984375, 11.35693359375, 12.180908203125, 13.0048828125, 13.828857421875, 14.65283203125, 15.476806640625, 16.30078125, 17.124755859375, 17.94873046875, 18.772705078125, 19.5966796875, 20.420654296875, 21.24462890625, 22.068603515625, 22.892578125, 23.716552734375, 24.54052734375, 25.364501953125, 26.1884765625, 27.012451171875, 27.83642578125, 28.660400390625, 29.484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 10.0, 8.0, 13.0, 21.0, 12.0, 31.0, 39.0, 35.0, 43.0, 37.0, 55.0, 49.0, 47.0, 40.0, 51.0, 49.0, 62.0, 50.0, 47.0, 49.0, 40.0, 35.0, 30.0, 32.0, 25.0, 14.0, 19.0, 12.0, 10.0, 5.0, 7.0, 10.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.296875, -30.3447265625, -29.392578125, -28.4404296875, -27.48828125, -26.5361328125, -25.583984375, -24.6318359375, -23.6796875, -22.7275390625, -21.775390625, -20.8232421875, -19.87109375, -18.9189453125, -17.966796875, -17.0146484375, -16.0625, -15.1103515625, -14.158203125, -13.2060546875, -12.25390625, -11.3017578125, -10.349609375, -9.3974609375, -8.4453125, -7.4931640625, -6.541015625, -5.5888671875, -4.63671875, -3.6845703125, -2.732421875, -1.7802734375, -0.828125, 0.1240234375, 1.076171875, 2.0283203125, 2.98046875, 3.9326171875, 4.884765625, 5.8369140625, 6.7890625, 7.7412109375, 8.693359375, 9.6455078125, 10.59765625, 11.5498046875, 12.501953125, 13.4541015625, 14.40625, 15.3583984375, 16.310546875, 17.2626953125, 18.21484375, 19.1669921875, 20.119140625, 21.0712890625, 22.0234375, 22.9755859375, 23.927734375, 24.8798828125, 25.83203125, 26.7841796875, 27.736328125, 28.6884765625, 29.640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 7.0, 6.0, 3.0, 9.0, 19.0, 42.0, 61.0, 150.0, 333.0, 1162.0, 6371.0, 71137.0, 770939.0, 183275.0, 12278.0, 1923.0, 487.0, 171.0, 89.0, 44.0, 12.0, 10.0, 14.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.921875, -23.28662109375, -22.6513671875, -22.01611328125, -21.380859375, -20.74560546875, -20.1103515625, -19.47509765625, -18.83984375, -18.20458984375, -17.5693359375, -16.93408203125, -16.298828125, -15.66357421875, -15.0283203125, -14.39306640625, -13.7578125, -13.12255859375, -12.4873046875, -11.85205078125, -11.216796875, -10.58154296875, -9.9462890625, -9.31103515625, -8.67578125, -8.04052734375, -7.4052734375, -6.77001953125, -6.134765625, -5.49951171875, -4.8642578125, -4.22900390625, -3.59375, -2.95849609375, -2.3232421875, -1.68798828125, -1.052734375, -0.41748046875, 0.2177734375, 0.85302734375, 1.48828125, 2.12353515625, 2.7587890625, 3.39404296875, 4.029296875, 4.66455078125, 5.2998046875, 5.93505859375, 6.5703125, 7.20556640625, 7.8408203125, 8.47607421875, 9.111328125, 9.74658203125, 10.3818359375, 11.01708984375, 11.65234375, 12.28759765625, 12.9228515625, 13.55810546875, 14.193359375, 14.82861328125, 15.4638671875, 16.09912109375, 16.734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 13.0, 11.0, 20.0, 32.0, 36.0, 38.0, 44.0, 60.0, 71.0, 83.0, 91.0, 86.0, 77.0, 60.0, 63.0, 38.0, 39.0, 23.0, 20.0, 12.0, 15.0, 8.0, 6.0, 11.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010251998901367188, -0.0009864717721939087, -0.0009477436542510986, -0.0009090155363082886, -0.0008702874183654785, -0.0008315593004226685, -0.0007928311824798584, -0.0007541030645370483, -0.0007153749465942383, -0.0006766468286514282, -0.0006379187107086182, -0.0005991905927658081, -0.000560462474822998, -0.000521734356880188, -0.00048300623893737793, -0.00044427812099456787, -0.0004055500030517578, -0.00036682188510894775, -0.0003280937671661377, -0.00028936564922332764, -0.0002506375312805176, -0.00021190941333770752, -0.00017318129539489746, -0.0001344531774520874, -9.572505950927734e-05, -5.6996941566467285e-05, -1.8268823623657227e-05, 2.0459294319152832e-05, 5.918741226196289e-05, 9.791553020477295e-05, 0.000136643648147583, 0.00017537176609039307, 0.00021409988403320312, 0.0002528280019760132, 0.00029155611991882324, 0.0003302842378616333, 0.00036901235580444336, 0.0004077404737472534, 0.0004464685916900635, 0.00048519670963287354, 0.0005239248275756836, 0.0005626529455184937, 0.0006013810634613037, 0.0006401091814041138, 0.0006788372993469238, 0.0007175654172897339, 0.0007562935352325439, 0.000795021653175354, 0.0008337497711181641, 0.0008724778890609741, 0.0009112060070037842, 0.0009499341249465942, 0.0009886622428894043, 0.0010273903608322144, 0.0010661184787750244, 0.0011048465967178345, 0.0011435747146606445, 0.0011823028326034546, 0.0012210309505462646, 0.0012597590684890747, 0.0012984871864318848, 0.0013372153043746948, 0.0013759434223175049, 0.001414671540260315, 0.001453399658203125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 6.0, 3.0, 10.0, 3.0, 4.0, 9.0, 28.0, 27.0, 42.0, 71.0, 120.0, 190.0, 296.0, 645.0, 1345.0, 3993.0, 17186.0, 131705.0, 681121.0, 181858.0, 21928.0, 4724.0, 1651.0, 706.0, 357.0, 204.0, 110.0, 73.0, 42.0, 35.0, 20.0, 20.0, 2.0, 6.0, 8.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.328125, -17.8128662109375, -17.297607421875, -16.7823486328125, -16.26708984375, -15.7518310546875, -15.236572265625, -14.7213134765625, -14.2060546875, -13.6907958984375, -13.175537109375, -12.6602783203125, -12.14501953125, -11.6297607421875, -11.114501953125, -10.5992431640625, -10.083984375, -9.5687255859375, -9.053466796875, -8.5382080078125, -8.02294921875, -7.5076904296875, -6.992431640625, -6.4771728515625, -5.9619140625, -5.4466552734375, -4.931396484375, -4.4161376953125, -3.90087890625, -3.3856201171875, -2.870361328125, -2.3551025390625, -1.83984375, -1.3245849609375, -0.809326171875, -0.2940673828125, 0.22119140625, 0.7364501953125, 1.251708984375, 1.7669677734375, 2.2822265625, 2.7974853515625, 3.312744140625, 3.8280029296875, 4.34326171875, 4.8585205078125, 5.373779296875, 5.8890380859375, 6.404296875, 6.9195556640625, 7.434814453125, 7.9500732421875, 8.46533203125, 8.9805908203125, 9.495849609375, 10.0111083984375, 10.5263671875, 11.0416259765625, 11.556884765625, 12.0721435546875, 12.58740234375, 13.1026611328125, 13.617919921875, 14.1331787109375, 14.6484375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 3.0, 6.0, 9.0, 19.0, 19.0, 29.0, 43.0, 69.0, 79.0, 80.0, 93.0, 97.0, 89.0, 105.0, 55.0, 71.0, 31.0, 26.0, 22.0, 15.0, 10.0, 10.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.0703125, -13.635498046875, -13.20068359375, -12.765869140625, -12.3310546875, -11.896240234375, -11.46142578125, -11.026611328125, -10.591796875, -10.156982421875, -9.72216796875, -9.287353515625, -8.8525390625, -8.417724609375, -7.98291015625, -7.548095703125, -7.11328125, -6.678466796875, -6.24365234375, -5.808837890625, -5.3740234375, -4.939208984375, -4.50439453125, -4.069580078125, -3.634765625, -3.199951171875, -2.76513671875, -2.330322265625, -1.8955078125, -1.460693359375, -1.02587890625, -0.591064453125, -0.15625, 0.278564453125, 0.71337890625, 1.148193359375, 1.5830078125, 2.017822265625, 2.45263671875, 2.887451171875, 3.322265625, 3.757080078125, 4.19189453125, 4.626708984375, 5.0615234375, 5.496337890625, 5.93115234375, 6.365966796875, 6.80078125, 7.235595703125, 7.67041015625, 8.105224609375, 8.5400390625, 8.974853515625, 9.40966796875, 9.844482421875, 10.279296875, 10.714111328125, 11.14892578125, 11.583740234375, 12.0185546875, 12.453369140625, 12.88818359375, 13.322998046875, 13.7578125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 14.0, 44.0, 114.0, 199.0, 301.0, 181.0, 93.0, 29.0, 9.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-238.59791564941406, -228.41453552246094, -218.23114013671875, -208.04776000976562, -197.86436462402344, -187.6809844970703, -177.49758911132812, -167.314208984375, -157.13082885742188, -146.94744873046875, -136.76405334472656, -126.58067321777344, -116.39727783203125, -106.21389770507812, -96.03050994873047, -85.84712219238281, -75.66372680664062, -65.48033905029297, -55.29695129394531, -45.11356735229492, -34.930179595947266, -24.74679183959961, -14.563407897949219, -4.3800201416015625, 5.803367614746094, 15.986754417419434, 26.170141220092773, 36.3535270690918, 46.53691482543945, 56.72030258178711, 66.9036865234375, 77.08707427978516, 87.27044677734375, 97.4538345336914, 107.63722229003906, 117.82060241699219, 128.00399780273438, 138.1873779296875, 148.37075805664062, 158.5541534423828, 168.737548828125, 178.92092895507812, 189.1043243408203, 199.28770446777344, 209.47109985351562, 219.65447998046875, 229.83786010742188, 240.02125549316406, 250.2046356201172, 260.3880310058594, 270.5714111328125, 280.7547912597656, 290.93817138671875, 301.12158203125, 311.3049621582031, 321.48834228515625, 331.6717224121094, 341.8551025390625, 352.0384826660156, 362.2218933105469, 372.4052734375, 382.5886535644531, 392.77203369140625, 402.9554443359375, 413.1388244628906]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 8.0, 13.0, 18.0, 11.0, 13.0, 20.0, 23.0, 16.0, 21.0, 36.0, 36.0, 36.0, 34.0, 33.0, 54.0, 54.0, 47.0, 42.0, 45.0, 38.0, 43.0, 44.0, 35.0, 29.0, 27.0, 29.0, 27.0, 33.0, 18.0, 23.0, 15.0, 11.0, 8.0, 14.0, 5.0, 11.0, 8.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.6152572631836, -112.57432556152344, -108.53338623046875, -104.4924545288086, -100.45152282714844, -96.41058349609375, -92.3696517944336, -88.32872009277344, -84.28778076171875, -80.2468490600586, -76.2059097290039, -72.16497802734375, -68.12403869628906, -64.0831069946289, -60.04217529296875, -56.00123977661133, -51.960304260253906, -47.919368743896484, -43.87843322753906, -39.837501525878906, -35.796566009521484, -31.755630493164062, -27.714696884155273, -23.673763275146484, -19.632827758789062, -15.591893196105957, -11.550958633422852, -7.510024070739746, -3.4690895080566406, 0.5718460083007812, 4.61277961730957, 8.65371322631836, 12.69464111328125, 16.735576629638672, 20.77651023864746, 24.81744384765625, 28.858379364013672, 32.899314880371094, 36.94024658203125, 40.98118209838867, 45.022117614746094, 49.063053131103516, 53.10398864746094, 57.144920349121094, 61.185855865478516, 65.22679138183594, 69.2677230834961, 73.30865478515625, 77.34959411621094, 81.3905258178711, 85.43146514892578, 89.47239685058594, 93.51333618164062, 97.55426788330078, 101.59519958496094, 105.63613891601562, 109.67707061767578, 113.71800231933594, 117.75894165039062, 121.79987335205078, 125.84080505371094, 129.88174438476562, 133.9226837158203, 137.96360778808594, 142.00454711914062]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 3.0, 6.0, 14.0, 24.0, 18.0, 34.0, 48.0, 72.0, 123.0, 160.0, 323.0, 572.0, 1388.0, 4602.0, 23827.0, 3533526.0, 603061.0, 19785.0, 4023.0, 1252.0, 612.0, 297.0, 161.0, 118.0, 81.0, 52.0, 26.0, 17.0, 15.0, 14.0, 6.0, 4.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.109375, -29.104248046875, -28.09912109375, -27.093994140625, -26.0888671875, -25.083740234375, -24.07861328125, -23.073486328125, -22.068359375, -21.063232421875, -20.05810546875, -19.052978515625, -18.0478515625, -17.042724609375, -16.03759765625, -15.032470703125, -14.02734375, -13.022216796875, -12.01708984375, -11.011962890625, -10.0068359375, -9.001708984375, -7.99658203125, -6.991455078125, -5.986328125, -4.981201171875, -3.97607421875, -2.970947265625, -1.9658203125, -0.960693359375, 0.04443359375, 1.049560546875, 2.0546875, 3.059814453125, 4.06494140625, 5.070068359375, 6.0751953125, 7.080322265625, 8.08544921875, 9.090576171875, 10.095703125, 11.100830078125, 12.10595703125, 13.111083984375, 14.1162109375, 15.121337890625, 16.12646484375, 17.131591796875, 18.13671875, 19.141845703125, 20.14697265625, 21.152099609375, 22.1572265625, 23.162353515625, 24.16748046875, 25.172607421875, 26.177734375, 27.182861328125, 28.18798828125, 29.193115234375, 30.1982421875, 31.203369140625, 32.20849609375, 33.213623046875, 34.21875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 9.0, 12.0, 19.0, 17.0, 25.0, 20.0, 31.0, 39.0, 56.0, 46.0, 76.0, 68.0, 74.0, 64.0, 77.0, 78.0, 68.0, 60.0, 36.0, 26.0, 26.0, 16.0, 17.0, 12.0, 9.0, 5.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.84375, -10.5504150390625, -10.257080078125, -9.9637451171875, -9.67041015625, -9.3770751953125, -9.083740234375, -8.7904052734375, -8.4970703125, -8.2037353515625, -7.910400390625, -7.6170654296875, -7.32373046875, -7.0303955078125, -6.737060546875, -6.4437255859375, -6.150390625, -5.8570556640625, -5.563720703125, -5.2703857421875, -4.97705078125, -4.6837158203125, -4.390380859375, -4.0970458984375, -3.8037109375, -3.5103759765625, -3.217041015625, -2.9237060546875, -2.63037109375, -2.3370361328125, -2.043701171875, -1.7503662109375, -1.45703125, -1.1636962890625, -0.870361328125, -0.5770263671875, -0.28369140625, 0.0096435546875, 0.302978515625, 0.5963134765625, 0.8896484375, 1.1829833984375, 1.476318359375, 1.7696533203125, 2.06298828125, 2.3563232421875, 2.649658203125, 2.9429931640625, 3.236328125, 3.5296630859375, 3.822998046875, 4.1163330078125, 4.40966796875, 4.7030029296875, 4.996337890625, 5.2896728515625, 5.5830078125, 5.8763427734375, 6.169677734375, 6.4630126953125, 6.75634765625, 7.0496826171875, 7.343017578125, 7.6363525390625, 7.9296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 9.0, 9.0, 13.0, 18.0, 30.0, 43.0, 59.0, 68.0, 120.0, 171.0, 209.0, 321.0, 475.0, 687.0, 1011.0, 1546.0, 2499.0, 4326.0, 7937.0, 17250.0, 46610.0, 235868.0, 3627968.0, 174062.0, 39620.0, 15251.0, 7246.0, 4050.0, 2259.0, 1429.0, 1005.0, 652.0, 449.0, 313.0, 190.0, 146.0, 90.0, 77.0, 59.0, 37.0, 23.0, 15.0, 18.0, 20.0, 7.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.9188232421875, -9.603271484375, -9.2877197265625, -8.97216796875, -8.6566162109375, -8.341064453125, -8.0255126953125, -7.7099609375, -7.3944091796875, -7.078857421875, -6.7633056640625, -6.44775390625, -6.1322021484375, -5.816650390625, -5.5010986328125, -5.185546875, -4.8699951171875, -4.554443359375, -4.2388916015625, -3.92333984375, -3.6077880859375, -3.292236328125, -2.9766845703125, -2.6611328125, -2.3455810546875, -2.030029296875, -1.7144775390625, -1.39892578125, -1.0833740234375, -0.767822265625, -0.4522705078125, -0.13671875, 0.1788330078125, 0.494384765625, 0.8099365234375, 1.12548828125, 1.4410400390625, 1.756591796875, 2.0721435546875, 2.3876953125, 2.7032470703125, 3.018798828125, 3.3343505859375, 3.64990234375, 3.9654541015625, 4.281005859375, 4.5965576171875, 4.912109375, 5.2276611328125, 5.543212890625, 5.8587646484375, 6.17431640625, 6.4898681640625, 6.805419921875, 7.1209716796875, 7.4365234375, 7.7520751953125, 8.067626953125, 8.3831787109375, 8.69873046875, 9.0142822265625, 9.329833984375, 9.6453857421875, 9.9609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 9.0, 5.0, 6.0, 12.0, 14.0, 14.0, 20.0, 36.0, 74.0, 97.0, 250.0, 2014.0, 1017.0, 213.0, 97.0, 60.0, 21.0, 31.0, 14.0, 5.0, 14.0, 7.0, 5.0, 3.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.716796875, -2.636810302734375, -2.55682373046875, -2.476837158203125, -2.3968505859375, -2.316864013671875, -2.23687744140625, -2.156890869140625, -2.076904296875, -1.996917724609375, -1.91693115234375, -1.836944580078125, -1.7569580078125, -1.676971435546875, -1.59698486328125, -1.516998291015625, -1.43701171875, -1.357025146484375, -1.27703857421875, -1.197052001953125, -1.1170654296875, -1.037078857421875, -0.95709228515625, -0.877105712890625, -0.797119140625, -0.717132568359375, -0.63714599609375, -0.557159423828125, -0.4771728515625, -0.397186279296875, -0.31719970703125, -0.237213134765625, -0.1572265625, -0.077239990234375, 0.00274658203125, 0.082733154296875, 0.1627197265625, 0.242706298828125, 0.32269287109375, 0.402679443359375, 0.482666015625, 0.562652587890625, 0.64263916015625, 0.722625732421875, 0.8026123046875, 0.882598876953125, 0.96258544921875, 1.042572021484375, 1.12255859375, 1.202545166015625, 1.28253173828125, 1.362518310546875, 1.4425048828125, 1.522491455078125, 1.60247802734375, 1.682464599609375, 1.762451171875, 1.842437744140625, 1.92242431640625, 2.002410888671875, 2.0823974609375, 2.162384033203125, 2.24237060546875, 2.322357177734375, 2.40234375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 10.0, 2.0, 4.0, 19.0, 43.0, 87.0, 172.0, 243.0, 217.0, 126.0, 53.0, 20.0, 10.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.50543975830078, -42.641212463378906, -41.77698516845703, -40.912757873535156, -40.04853057861328, -39.18430709838867, -38.3200798034668, -37.45585250854492, -36.59162521362305, -35.72739791870117, -34.8631706237793, -33.99894332885742, -33.13471984863281, -32.27049255371094, -31.406265258789062, -30.542037963867188, -29.677810668945312, -28.813583374023438, -27.949356079101562, -27.08513069152832, -26.220903396606445, -25.35667610168457, -24.492450714111328, -23.628223419189453, -22.763996124267578, -21.899768829345703, -21.035541534423828, -20.171316146850586, -19.30708885192871, -18.442861557006836, -17.578636169433594, -16.71440887451172, -15.850181579589844, -14.985954284667969, -14.12172794342041, -13.257501602172852, -12.393274307250977, -11.529047012329102, -10.664820671081543, -9.800594329833984, -8.93636703491211, -8.072139739990234, -7.207913398742676, -6.343686580657959, -5.479459762573242, -4.615232944488525, -3.7510061264038086, -2.886779308319092, -2.022552490234375, -1.1583256721496582, -0.2940988540649414, 0.5701279640197754, 1.4343547821044922, 2.298581600189209, 3.162808418273926, 4.027035236358643, 4.891262054443359, 5.755488872528076, 6.619715690612793, 7.48394250869751, 8.348169326782227, 9.212396621704102, 10.07662296295166, 10.940849304199219, 11.805076599121094]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 10.0, 17.0, 19.0, 29.0, 23.0, 28.0, 42.0, 38.0, 47.0, 52.0, 47.0, 47.0, 64.0, 67.0, 54.0, 49.0, 57.0, 53.0, 44.0, 40.0, 34.0, 32.0, 22.0, 24.0, 14.0, 6.0, 16.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.771883010864258, -7.431410312652588, -7.090937614440918, -6.750465393066406, -6.409992218017578, -6.069519996643066, -5.7290472984313965, -5.388574600219727, -5.048101902008057, -4.707629203796387, -4.367156505584717, -4.026683807373047, -3.686211347579956, -3.345738649368286, -3.0052661895751953, -2.6647934913635254, -2.3243207931518555, -1.9838480949401855, -1.6433755159378052, -1.3029029369354248, -0.9624302387237549, -0.621957540512085, -0.28148508071899414, 0.05898761749267578, 0.3994603157043457, 0.7399329543113708, 1.080405592918396, 1.4208781719207764, 1.7613508701324463, 2.101823568344116, 2.442296028137207, 2.782768726348877, 3.123241424560547, 3.463714122772217, 3.8041868209838867, 4.144659042358398, 4.485132217407227, 4.825604438781738, 5.166077136993408, 5.506549835205078, 5.847022533416748, 6.187495231628418, 6.527967929840088, 6.868440628051758, 7.2089128494262695, 7.549386024475098, 7.889858245849609, 8.230331420898438, 8.57080364227295, 8.911275863647461, 9.251749038696289, 9.5922212600708, 9.932694435119629, 10.27316665649414, 10.613639831542969, 10.95411205291748, 11.294584274291992, 11.635056495666504, 11.975529670715332, 12.316001892089844, 12.656475067138672, 12.996947288513184, 13.337419509887695, 13.677892684936523, 14.018365859985352]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 10.0, 15.0, 26.0, 40.0, 83.0, 121.0, 221.0, 398.0, 871.0, 2502.0, 7070.0, 24691.0, 99116.0, 350364.0, 395963.0, 123079.0, 30531.0, 8463.0, 2856.0, 1114.0, 457.0, 253.0, 140.0, 66.0, 38.0, 24.0, 13.0, 9.0, 3.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-27.25, -26.570068359375, -25.89013671875, -25.210205078125, -24.5302734375, -23.850341796875, -23.17041015625, -22.490478515625, -21.810546875, -21.130615234375, -20.45068359375, -19.770751953125, -19.0908203125, -18.410888671875, -17.73095703125, -17.051025390625, -16.37109375, -15.691162109375, -15.01123046875, -14.331298828125, -13.6513671875, -12.971435546875, -12.29150390625, -11.611572265625, -10.931640625, -10.251708984375, -9.57177734375, -8.891845703125, -8.2119140625, -7.531982421875, -6.85205078125, -6.172119140625, -5.4921875, -4.812255859375, -4.13232421875, -3.452392578125, -2.7724609375, -2.092529296875, -1.41259765625, -0.732666015625, -0.052734375, 0.627197265625, 1.30712890625, 1.987060546875, 2.6669921875, 3.346923828125, 4.02685546875, 4.706787109375, 5.38671875, 6.066650390625, 6.74658203125, 7.426513671875, 8.1064453125, 8.786376953125, 9.46630859375, 10.146240234375, 10.826171875, 11.506103515625, 12.18603515625, 12.865966796875, 13.5458984375, 14.225830078125, 14.90576171875, 15.585693359375, 16.265625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 9.0, 17.0, 23.0, 25.0, 17.0, 21.0, 33.0, 46.0, 49.0, 56.0, 68.0, 67.0, 68.0, 67.0, 68.0, 77.0, 62.0, 57.0, 33.0, 32.0, 18.0, 18.0, 21.0, 14.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.921875, -10.6326904296875, -10.343505859375, -10.0543212890625, -9.76513671875, -9.4759521484375, -9.186767578125, -8.8975830078125, -8.6083984375, -8.3192138671875, -8.030029296875, -7.7408447265625, -7.45166015625, -7.1624755859375, -6.873291015625, -6.5841064453125, -6.294921875, -6.0057373046875, -5.716552734375, -5.4273681640625, -5.13818359375, -4.8489990234375, -4.559814453125, -4.2706298828125, -3.9814453125, -3.6922607421875, -3.403076171875, -3.1138916015625, -2.82470703125, -2.5355224609375, -2.246337890625, -1.9571533203125, -1.66796875, -1.3787841796875, -1.089599609375, -0.8004150390625, -0.51123046875, -0.2220458984375, 0.067138671875, 0.3563232421875, 0.6455078125, 0.9346923828125, 1.223876953125, 1.5130615234375, 1.80224609375, 2.0914306640625, 2.380615234375, 2.6697998046875, 2.958984375, 3.2481689453125, 3.537353515625, 3.8265380859375, 4.11572265625, 4.4049072265625, 4.694091796875, 4.9832763671875, 5.2724609375, 5.5616455078125, 5.850830078125, 6.1400146484375, 6.42919921875, 6.7183837890625, 7.007568359375, 7.2967529296875, 7.5859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 7.0, 13.0, 18.0, 32.0, 33.0, 49.0, 74.0, 138.0, 224.0, 306.0, 585.0, 1358.0, 6167.0, 94697.0, 871541.0, 65668.0, 5023.0, 1163.0, 523.0, 326.0, 181.0, 140.0, 103.0, 64.0, 40.0, 26.0, 21.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-59.71875, -58.16552734375, -56.6123046875, -55.05908203125, -53.505859375, -51.95263671875, -50.3994140625, -48.84619140625, -47.29296875, -45.73974609375, -44.1865234375, -42.63330078125, -41.080078125, -39.52685546875, -37.9736328125, -36.42041015625, -34.8671875, -33.31396484375, -31.7607421875, -30.20751953125, -28.654296875, -27.10107421875, -25.5478515625, -23.99462890625, -22.44140625, -20.88818359375, -19.3349609375, -17.78173828125, -16.228515625, -14.67529296875, -13.1220703125, -11.56884765625, -10.015625, -8.46240234375, -6.9091796875, -5.35595703125, -3.802734375, -2.24951171875, -0.6962890625, 0.85693359375, 2.41015625, 3.96337890625, 5.5166015625, 7.06982421875, 8.623046875, 10.17626953125, 11.7294921875, 13.28271484375, 14.8359375, 16.38916015625, 17.9423828125, 19.49560546875, 21.048828125, 22.60205078125, 24.1552734375, 25.70849609375, 27.26171875, 28.81494140625, 30.3681640625, 31.92138671875, 33.474609375, 35.02783203125, 36.5810546875, 38.13427734375, 39.6875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 10.0, 6.0, 15.0, 10.0, 12.0, 15.0, 19.0, 25.0, 31.0, 40.0, 35.0, 43.0, 44.0, 59.0, 55.0, 64.0, 49.0, 65.0, 57.0, 48.0, 49.0, 40.0, 35.0, 38.0, 31.0, 17.0, 16.0, 13.0, 7.0, 17.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-39.8125, -38.6748046875, -37.537109375, -36.3994140625, -35.26171875, -34.1240234375, -32.986328125, -31.8486328125, -30.7109375, -29.5732421875, -28.435546875, -27.2978515625, -26.16015625, -25.0224609375, -23.884765625, -22.7470703125, -21.609375, -20.4716796875, -19.333984375, -18.1962890625, -17.05859375, -15.9208984375, -14.783203125, -13.6455078125, -12.5078125, -11.3701171875, -10.232421875, -9.0947265625, -7.95703125, -6.8193359375, -5.681640625, -4.5439453125, -3.40625, -2.2685546875, -1.130859375, 0.0068359375, 1.14453125, 2.2822265625, 3.419921875, 4.5576171875, 5.6953125, 6.8330078125, 7.970703125, 9.1083984375, 10.24609375, 11.3837890625, 12.521484375, 13.6591796875, 14.796875, 15.9345703125, 17.072265625, 18.2099609375, 19.34765625, 20.4853515625, 21.623046875, 22.7607421875, 23.8984375, 25.0361328125, 26.173828125, 27.3115234375, 28.44921875, 29.5869140625, 30.724609375, 31.8623046875, 33.0]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 14.0, 19.0, 29.0, 27.0, 64.0, 128.0, 245.0, 840.0, 6003.0, 346692.0, 683404.0, 9349.0, 1101.0, 296.0, 142.0, 68.0, 46.0, 23.0, 16.0, 8.0, 9.0, 7.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.53125, -27.641845703125, -26.75244140625, -25.863037109375, -24.9736328125, -24.084228515625, -23.19482421875, -22.305419921875, -21.416015625, -20.526611328125, -19.63720703125, -18.747802734375, -17.8583984375, -16.968994140625, -16.07958984375, -15.190185546875, -14.30078125, -13.411376953125, -12.52197265625, -11.632568359375, -10.7431640625, -9.853759765625, -8.96435546875, -8.074951171875, -7.185546875, -6.296142578125, -5.40673828125, -4.517333984375, -3.6279296875, -2.738525390625, -1.84912109375, -0.959716796875, -0.0703125, 0.819091796875, 1.70849609375, 2.597900390625, 3.4873046875, 4.376708984375, 5.26611328125, 6.155517578125, 7.044921875, 7.934326171875, 8.82373046875, 9.713134765625, 10.6025390625, 11.491943359375, 12.38134765625, 13.270751953125, 14.16015625, 15.049560546875, 15.93896484375, 16.828369140625, 17.7177734375, 18.607177734375, 19.49658203125, 20.385986328125, 21.275390625, 22.164794921875, 23.05419921875, 23.943603515625, 24.8330078125, 25.722412109375, 26.61181640625, 27.501220703125, 28.390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 9.0, 4.0, 8.0, 20.0, 23.0, 50.0, 63.0, 80.0, 109.0, 127.0, 143.0, 106.0, 92.0, 66.0, 36.0, 27.0, 23.0, 10.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00244903564453125, -0.002394631505012512, -0.0023402273654937744, -0.0022858232259750366, -0.002231419086456299, -0.002177014946937561, -0.0021226108074188232, -0.0020682066679000854, -0.0020138025283813477, -0.00195939838886261, -0.001904994249343872, -0.0018505901098251343, -0.0017961859703063965, -0.0017417818307876587, -0.001687377691268921, -0.001632973551750183, -0.0015785694122314453, -0.0015241652727127075, -0.0014697611331939697, -0.001415356993675232, -0.0013609528541564941, -0.0013065487146377563, -0.0012521445751190186, -0.0011977404356002808, -0.001143336296081543, -0.0010889321565628052, -0.0010345280170440674, -0.0009801238775253296, -0.0009257197380065918, -0.000871315598487854, -0.0008169114589691162, -0.0007625073194503784, -0.0007081031799316406, -0.0006536990404129028, -0.000599294900894165, -0.0005448907613754272, -0.0004904866218566895, -0.00043608248233795166, -0.00038167834281921387, -0.0003272742033004761, -0.0002728700637817383, -0.0002184659242630005, -0.0001640617847442627, -0.0001096576452255249, -5.525350570678711e-05, -8.493661880493164e-07, 5.3554773330688477e-05, 0.00010795891284942627, 0.00016236305236816406, 0.00021676719188690186, 0.00027117133140563965, 0.00032557547092437744, 0.00037997961044311523, 0.00043438374996185303, 0.0004887878894805908, 0.0005431920289993286, 0.0005975961685180664, 0.0006520003080368042, 0.000706404447555542, 0.0007608085870742798, 0.0008152127265930176, 0.0008696168661117554, 0.0009240210056304932, 0.000978425145149231, 0.0010328292846679688]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 8.0, 11.0, 21.0, 24.0, 56.0, 87.0, 223.0, 501.0, 1535.0, 8072.0, 305793.0, 716015.0, 12993.0, 2085.0, 615.0, 245.0, 112.0, 68.0, 25.0, 21.0, 10.0, 8.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.3125, -31.41748046875, -30.5224609375, -29.62744140625, -28.732421875, -27.83740234375, -26.9423828125, -26.04736328125, -25.15234375, -24.25732421875, -23.3623046875, -22.46728515625, -21.572265625, -20.67724609375, -19.7822265625, -18.88720703125, -17.9921875, -17.09716796875, -16.2021484375, -15.30712890625, -14.412109375, -13.51708984375, -12.6220703125, -11.72705078125, -10.83203125, -9.93701171875, -9.0419921875, -8.14697265625, -7.251953125, -6.35693359375, -5.4619140625, -4.56689453125, -3.671875, -2.77685546875, -1.8818359375, -0.98681640625, -0.091796875, 0.80322265625, 1.6982421875, 2.59326171875, 3.48828125, 4.38330078125, 5.2783203125, 6.17333984375, 7.068359375, 7.96337890625, 8.8583984375, 9.75341796875, 10.6484375, 11.54345703125, 12.4384765625, 13.33349609375, 14.228515625, 15.12353515625, 16.0185546875, 16.91357421875, 17.80859375, 18.70361328125, 19.5986328125, 20.49365234375, 21.388671875, 22.28369140625, 23.1787109375, 24.07373046875, 24.96875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 19.0, 47.0, 76.0, 122.0, 187.0, 211.0, 135.0, 82.0, 45.0, 24.0, 18.0, 6.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.005615234375, -20.16748046875, -19.329345703125, -18.4912109375, -17.653076171875, -16.81494140625, -15.976806640625, -15.138671875, -14.300537109375, -13.46240234375, -12.624267578125, -11.7861328125, -10.947998046875, -10.10986328125, -9.271728515625, -8.43359375, -7.595458984375, -6.75732421875, -5.919189453125, -5.0810546875, -4.242919921875, -3.40478515625, -2.566650390625, -1.728515625, -0.890380859375, -0.05224609375, 0.785888671875, 1.6240234375, 2.462158203125, 3.30029296875, 4.138427734375, 4.9765625, 5.814697265625, 6.65283203125, 7.490966796875, 8.3291015625, 9.167236328125, 10.00537109375, 10.843505859375, 11.681640625, 12.519775390625, 13.35791015625, 14.196044921875, 15.0341796875, 15.872314453125, 16.71044921875, 17.548583984375, 18.38671875, 19.224853515625, 20.06298828125, 20.901123046875, 21.7392578125, 22.577392578125, 23.41552734375, 24.253662109375, 25.091796875, 25.929931640625, 26.76806640625, 27.606201171875, 28.4443359375, 29.282470703125, 30.12060546875, 30.958740234375, 31.796875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 9.0, 12.0, 33.0, 59.0, 105.0, 161.0, 184.0, 182.0, 110.0, 77.0, 26.0, 14.0, 17.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.9571075439453, -176.0902099609375, -169.2233123779297, -162.35641479492188, -155.48951721191406, -148.62261962890625, -141.75570678710938, -134.88882446289062, -128.02191162109375, -121.15501403808594, -114.28811645507812, -107.42121887207031, -100.5543212890625, -93.68742370605469, -86.82051849365234, -79.95362091064453, -73.08673095703125, -66.21983337402344, -59.352935791015625, -52.48603439331055, -45.619136810302734, -38.75223922729492, -31.885337829589844, -25.01844024658203, -18.15154266357422, -11.28464412689209, -4.417745590209961, 2.4491539001464844, 9.316051483154297, 16.18294906616211, 23.049850463867188, 29.916748046875, 36.783660888671875, 43.65055847167969, 50.5174560546875, 57.38435745239258, 64.25125122070312, 71.11814880371094, 77.98505401611328, 84.8519515991211, 91.7188491821289, 98.58574676513672, 105.45264434814453, 112.31954956054688, 119.18644714355469, 126.0533447265625, 132.9202423095703, 139.78713989257812, 146.65403747558594, 153.52093505859375, 160.38783264160156, 167.25473022460938, 174.1216278076172, 180.988525390625, 187.85543823242188, 194.72232055664062, 201.5892333984375, 208.4561309814453, 215.32302856445312, 222.18992614746094, 229.05682373046875, 235.92372131347656, 242.79061889648438, 249.65753173828125, 256.5244140625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 6.0, 2.0, 7.0, 6.0, 8.0, 10.0, 16.0, 11.0, 20.0, 20.0, 30.0, 19.0, 32.0, 35.0, 30.0, 38.0, 42.0, 42.0, 49.0, 47.0, 52.0, 55.0, 50.0, 37.0, 43.0, 44.0, 47.0, 29.0, 29.0, 16.0, 29.0, 25.0, 16.0, 8.0, 8.0, 12.0, 10.0, 7.0, 1.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-143.59466552734375, -139.39735412597656, -135.20004272460938, -131.0027313232422, -126.80541229248047, -122.60810089111328, -118.41078186035156, -114.21347045898438, -110.01615905761719, -105.81884765625, -101.62153625488281, -97.4242172241211, -93.2269058227539, -89.02959442138672, -84.832275390625, -80.63496398925781, -76.43765258789062, -72.24034118652344, -68.04302978515625, -63.84571075439453, -59.648399353027344, -55.451087951660156, -51.2537727355957, -47.05645751953125, -42.85914611816406, -38.661834716796875, -34.46451950073242, -30.2672061920166, -26.06989288330078, -21.87257957458496, -17.67526626586914, -13.47795295715332, -9.2806396484375, -5.08332633972168, -0.8860130310058594, 3.311300277709961, 7.508613586425781, 11.705926895141602, 15.903240203857422, 20.100553512573242, 24.297866821289062, 28.495180130004883, 32.6924934387207, 36.889808654785156, 41.087120056152344, 45.28443145751953, 49.481746673583984, 53.67906188964844, 57.876373291015625, 62.07368469238281, 66.27099609375, 70.46831512451172, 74.6656265258789, 78.8629379272461, 83.06025695800781, 87.257568359375, 91.45487976074219, 95.65219116210938, 99.84950256347656, 104.04682159423828, 108.24413299560547, 112.44144439697266, 116.63876342773438, 120.83607482910156, 125.03338623046875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 17.0, 14.0, 23.0, 25.0, 33.0, 68.0, 106.0, 145.0, 295.0, 488.0, 978.0, 2486.0, 7347.0, 33327.0, 3254185.0, 852956.0, 30361.0, 6908.0, 2331.0, 971.0, 495.0, 253.0, 165.0, 90.0, 56.0, 34.0, 27.0, 20.0, 17.0, 12.0, 12.0, 4.0, 7.0, 1.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.78125, -17.1220703125, -16.462890625, -15.8037109375, -15.14453125, -14.4853515625, -13.826171875, -13.1669921875, -12.5078125, -11.8486328125, -11.189453125, -10.5302734375, -9.87109375, -9.2119140625, -8.552734375, -7.8935546875, -7.234375, -6.5751953125, -5.916015625, -5.2568359375, -4.59765625, -3.9384765625, -3.279296875, -2.6201171875, -1.9609375, -1.3017578125, -0.642578125, 0.0166015625, 0.67578125, 1.3349609375, 1.994140625, 2.6533203125, 3.3125, 3.9716796875, 4.630859375, 5.2900390625, 5.94921875, 6.6083984375, 7.267578125, 7.9267578125, 8.5859375, 9.2451171875, 9.904296875, 10.5634765625, 11.22265625, 11.8818359375, 12.541015625, 13.2001953125, 13.859375, 14.5185546875, 15.177734375, 15.8369140625, 16.49609375, 17.1552734375, 17.814453125, 18.4736328125, 19.1328125, 19.7919921875, 20.451171875, 21.1103515625, 21.76953125, 22.4287109375, 23.087890625, 23.7470703125, 24.40625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 9.0, 14.0, 15.0, 24.0, 21.0, 37.0, 39.0, 31.0, 55.0, 62.0, 56.0, 89.0, 75.0, 70.0, 63.0, 54.0, 68.0, 45.0, 37.0, 31.0, 30.0, 18.0, 13.0, 12.0, 6.0, 5.0, 10.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.8359375, -10.54779052734375, -10.2596435546875, -9.97149658203125, -9.683349609375, -9.39520263671875, -9.1070556640625, -8.81890869140625, -8.53076171875, -8.24261474609375, -7.9544677734375, -7.66632080078125, -7.378173828125, -7.09002685546875, -6.8018798828125, -6.51373291015625, -6.2255859375, -5.93743896484375, -5.6492919921875, -5.36114501953125, -5.072998046875, -4.78485107421875, -4.4967041015625, -4.20855712890625, -3.92041015625, -3.63226318359375, -3.3441162109375, -3.05596923828125, -2.767822265625, -2.47967529296875, -2.1915283203125, -1.90338134765625, -1.615234375, -1.32708740234375, -1.0389404296875, -0.75079345703125, -0.462646484375, -0.17449951171875, 0.1136474609375, 0.40179443359375, 0.68994140625, 0.97808837890625, 1.2662353515625, 1.55438232421875, 1.842529296875, 2.13067626953125, 2.4188232421875, 2.70697021484375, 2.9951171875, 3.28326416015625, 3.5714111328125, 3.85955810546875, 4.147705078125, 4.43585205078125, 4.7239990234375, 5.01214599609375, 5.30029296875, 5.58843994140625, 5.8765869140625, 6.16473388671875, 6.452880859375, 6.74102783203125, 7.0291748046875, 7.31732177734375, 7.60546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 8.0, 4.0, 4.0, 11.0, 11.0, 21.0, 26.0, 30.0, 54.0, 72.0, 122.0, 148.0, 211.0, 332.0, 464.0, 680.0, 1043.0, 1619.0, 2672.0, 4787.0, 9001.0, 21227.0, 69499.0, 885913.0, 3064775.0, 84291.0, 24293.0, 10143.0, 4878.0, 2821.0, 1719.0, 1109.0, 766.0, 499.0, 296.0, 219.0, 148.0, 105.0, 68.0, 53.0, 37.0, 28.0, 22.0, 15.0, 12.0, 12.0, 9.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.1171875, -8.803466796875, -8.48974609375, -8.176025390625, -7.8623046875, -7.548583984375, -7.23486328125, -6.921142578125, -6.607421875, -6.293701171875, -5.97998046875, -5.666259765625, -5.3525390625, -5.038818359375, -4.72509765625, -4.411376953125, -4.09765625, -3.783935546875, -3.47021484375, -3.156494140625, -2.8427734375, -2.529052734375, -2.21533203125, -1.901611328125, -1.587890625, -1.274169921875, -0.96044921875, -0.646728515625, -0.3330078125, -0.019287109375, 0.29443359375, 0.608154296875, 0.921875, 1.235595703125, 1.54931640625, 1.863037109375, 2.1767578125, 2.490478515625, 2.80419921875, 3.117919921875, 3.431640625, 3.745361328125, 4.05908203125, 4.372802734375, 4.6865234375, 5.000244140625, 5.31396484375, 5.627685546875, 5.94140625, 6.255126953125, 6.56884765625, 6.882568359375, 7.1962890625, 7.510009765625, 7.82373046875, 8.137451171875, 8.451171875, 8.764892578125, 9.07861328125, 9.392333984375, 9.7060546875, 10.019775390625, 10.33349609375, 10.647216796875, 10.9609375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 13.0, 18.0, 26.0, 50.0, 60.0, 183.0, 1327.0, 2003.0, 210.0, 69.0, 38.0, 11.0, 18.0, 3.0, 6.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.177734375, -3.039642333984375, -2.90155029296875, -2.763458251953125, -2.6253662109375, -2.487274169921875, -2.34918212890625, -2.211090087890625, -2.072998046875, -1.934906005859375, -1.79681396484375, -1.658721923828125, -1.5206298828125, -1.382537841796875, -1.24444580078125, -1.106353759765625, -0.96826171875, -0.830169677734375, -0.69207763671875, -0.553985595703125, -0.4158935546875, -0.277801513671875, -0.13970947265625, -0.001617431640625, 0.136474609375, 0.274566650390625, 0.41265869140625, 0.550750732421875, 0.6888427734375, 0.826934814453125, 0.96502685546875, 1.103118896484375, 1.2412109375, 1.379302978515625, 1.51739501953125, 1.655487060546875, 1.7935791015625, 1.931671142578125, 2.06976318359375, 2.207855224609375, 2.345947265625, 2.484039306640625, 2.62213134765625, 2.760223388671875, 2.8983154296875, 3.036407470703125, 3.17449951171875, 3.312591552734375, 3.45068359375, 3.588775634765625, 3.72686767578125, 3.864959716796875, 4.0030517578125, 4.141143798828125, 4.27923583984375, 4.417327880859375, 4.555419921875, 4.693511962890625, 4.83160400390625, 4.969696044921875, 5.1077880859375, 5.245880126953125, 5.38397216796875, 5.522064208984375, 5.66015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 7.0, 13.0, 17.0, 45.0, 80.0, 102.0, 148.0, 161.0, 132.0, 106.0, 70.0, 57.0, 31.0, 14.0, 10.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.652231216430664, -29.01502799987793, -28.377822875976562, -27.740619659423828, -27.10341453552246, -26.466211318969727, -25.82900619506836, -25.191802978515625, -24.55459976196289, -23.917396545410156, -23.28019142150879, -22.642988204956055, -22.005783081054688, -21.368579864501953, -20.73137664794922, -20.09417152404785, -19.456966400146484, -18.81976318359375, -18.182558059692383, -17.54535484313965, -16.90814971923828, -16.270946502685547, -15.633742332458496, -14.996538162231445, -14.359334945678711, -13.72213077545166, -13.08492660522461, -12.447723388671875, -11.810519218444824, -11.173315048217773, -10.536110877990723, -9.898906707763672, -9.261703491210938, -8.624499320983887, -7.987295627593994, -7.350091457366943, -6.712887763977051, -6.07568359375, -5.438479423522949, -4.801275730133057, -4.164071559906006, -3.526867628097534, -2.8896636962890625, -2.2524595260620117, -1.61525559425354, -0.9780516624450684, -0.3408474922180176, 0.296356201171875, 0.9335603713989258, 1.5707643032073975, 2.207968235015869, 2.84517240524292, 3.4823763370513916, 4.119580268859863, 4.756784439086914, 5.393988132476807, 6.031192302703857, 6.668396472930908, 7.305600166320801, 7.942804336547852, 8.580008506774902, 9.217212677001953, 9.854415893554688, 10.491620063781738, 11.128824234008789]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 11.0, 7.0, 12.0, 10.0, 15.0, 14.0, 24.0, 15.0, 20.0, 31.0, 33.0, 34.0, 46.0, 42.0, 43.0, 60.0, 55.0, 47.0, 44.0, 49.0, 42.0, 42.0, 40.0, 38.0, 27.0, 30.0, 21.0, 25.0, 33.0, 20.0, 14.0, 16.0, 13.0, 9.0, 2.0, 8.0, 0.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.573230743408203, -8.279401779174805, -7.98557186126709, -7.691742897033691, -7.397913455963135, -7.104084014892578, -6.81025505065918, -6.516425609588623, -6.222596168518066, -5.92876672744751, -5.634937286376953, -5.341108322143555, -5.047278881072998, -4.753449440002441, -4.459620475769043, -4.165791034698486, -3.8719615936279297, -3.578132152557373, -3.2843029499053955, -2.990473747253418, -2.6966443061828613, -2.4028148651123047, -2.108985662460327, -1.8151564598083496, -1.521327018737793, -1.2274976968765259, -0.9336683750152588, -0.6398390531539917, -0.3460097312927246, -0.05218040943145752, 0.24164891242980957, 0.5354781150817871, 0.8293085098266602, 1.1231378316879272, 1.4169671535491943, 1.7107964754104614, 2.0046257972717285, 2.298455238342285, 2.5922844409942627, 2.8861136436462402, 3.179943084716797, 3.4737725257873535, 3.767601728439331, 4.061430931091309, 4.355260372161865, 4.649089813232422, 4.94291877746582, 5.236748218536377, 5.530577659606934, 5.82440710067749, 6.118236541748047, 6.412065505981445, 6.705894947052002, 6.999724388122559, 7.293553352355957, 7.587382793426514, 7.88121223449707, 8.175041198730469, 8.468871116638184, 8.762700080871582, 9.056529998779297, 9.350358963012695, 9.644187927246094, 9.938016891479492, 10.231846809387207]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 17.0, 22.0, 44.0, 68.0, 144.0, 269.0, 512.0, 1237.0, 3262.0, 11141.0, 46813.0, 228948.0, 507018.0, 194740.0, 39518.0, 9728.0, 2929.0, 1107.0, 515.0, 219.0, 128.0, 80.0, 31.0, 17.0, 16.0, 12.0, 2.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.234375, -24.6104736328125, -23.986572265625, -23.3626708984375, -22.73876953125, -22.1148681640625, -21.490966796875, -20.8670654296875, -20.2431640625, -19.6192626953125, -18.995361328125, -18.3714599609375, -17.74755859375, -17.1236572265625, -16.499755859375, -15.8758544921875, -15.251953125, -14.6280517578125, -14.004150390625, -13.3802490234375, -12.75634765625, -12.1324462890625, -11.508544921875, -10.8846435546875, -10.2607421875, -9.6368408203125, -9.012939453125, -8.3890380859375, -7.76513671875, -7.1412353515625, -6.517333984375, -5.8934326171875, -5.26953125, -4.6456298828125, -4.021728515625, -3.3978271484375, -2.77392578125, -2.1500244140625, -1.526123046875, -0.9022216796875, -0.2783203125, 0.3455810546875, 0.969482421875, 1.5933837890625, 2.21728515625, 2.8411865234375, 3.465087890625, 4.0889892578125, 4.712890625, 5.3367919921875, 5.960693359375, 6.5845947265625, 7.20849609375, 7.8323974609375, 8.456298828125, 9.0802001953125, 9.7041015625, 10.3280029296875, 10.951904296875, 11.5758056640625, 12.19970703125, 12.8236083984375, 13.447509765625, 14.0714111328125, 14.6953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 16.0, 15.0, 23.0, 33.0, 32.0, 34.0, 47.0, 44.0, 64.0, 81.0, 82.0, 73.0, 65.0, 56.0, 73.0, 53.0, 45.0, 37.0, 33.0, 15.0, 15.0, 18.0, 6.0, 12.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.75, -10.4542236328125, -10.158447265625, -9.8626708984375, -9.56689453125, -9.2711181640625, -8.975341796875, -8.6795654296875, -8.3837890625, -8.0880126953125, -7.792236328125, -7.4964599609375, -7.20068359375, -6.9049072265625, -6.609130859375, -6.3133544921875, -6.017578125, -5.7218017578125, -5.426025390625, -5.1302490234375, -4.83447265625, -4.5386962890625, -4.242919921875, -3.9471435546875, -3.6513671875, -3.3555908203125, -3.059814453125, -2.7640380859375, -2.46826171875, -2.1724853515625, -1.876708984375, -1.5809326171875, -1.28515625, -0.9893798828125, -0.693603515625, -0.3978271484375, -0.10205078125, 0.1937255859375, 0.489501953125, 0.7852783203125, 1.0810546875, 1.3768310546875, 1.672607421875, 1.9683837890625, 2.26416015625, 2.5599365234375, 2.855712890625, 3.1514892578125, 3.447265625, 3.7430419921875, 4.038818359375, 4.3345947265625, 4.63037109375, 4.9261474609375, 5.221923828125, 5.5177001953125, 5.8134765625, 6.1092529296875, 6.405029296875, 6.7008056640625, 6.99658203125, 7.2923583984375, 7.588134765625, 7.8839111328125, 8.1796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 9.0, 13.0, 14.0, 16.0, 23.0, 30.0, 37.0, 61.0, 105.0, 153.0, 209.0, 321.0, 492.0, 904.0, 2091.0, 8447.0, 99431.0, 829576.0, 94088.0, 8145.0, 2036.0, 898.0, 467.0, 317.0, 197.0, 137.0, 92.0, 62.0, 41.0, 28.0, 28.0, 16.0, 18.0, 16.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-35.21875, -34.134765625, -33.05078125, -31.966796875, -30.8828125, -29.798828125, -28.71484375, -27.630859375, -26.546875, -25.462890625, -24.37890625, -23.294921875, -22.2109375, -21.126953125, -20.04296875, -18.958984375, -17.875, -16.791015625, -15.70703125, -14.623046875, -13.5390625, -12.455078125, -11.37109375, -10.287109375, -9.203125, -8.119140625, -7.03515625, -5.951171875, -4.8671875, -3.783203125, -2.69921875, -1.615234375, -0.53125, 0.552734375, 1.63671875, 2.720703125, 3.8046875, 4.888671875, 5.97265625, 7.056640625, 8.140625, 9.224609375, 10.30859375, 11.392578125, 12.4765625, 13.560546875, 14.64453125, 15.728515625, 16.8125, 17.896484375, 18.98046875, 20.064453125, 21.1484375, 22.232421875, 23.31640625, 24.400390625, 25.484375, 26.568359375, 27.65234375, 28.736328125, 29.8203125, 30.904296875, 31.98828125, 33.072265625, 34.15625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 8.0, 5.0, 7.0, 8.0, 16.0, 16.0, 19.0, 14.0, 28.0, 33.0, 39.0, 34.0, 43.0, 48.0, 41.0, 53.0, 46.0, 43.0, 44.0, 52.0, 52.0, 45.0, 45.0, 32.0, 34.0, 28.0, 27.0, 25.0, 19.0, 17.0, 12.0, 17.0, 9.0, 6.0, 5.0, 6.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-30.1875, -29.259765625, -28.33203125, -27.404296875, -26.4765625, -25.548828125, -24.62109375, -23.693359375, -22.765625, -21.837890625, -20.91015625, -19.982421875, -19.0546875, -18.126953125, -17.19921875, -16.271484375, -15.34375, -14.416015625, -13.48828125, -12.560546875, -11.6328125, -10.705078125, -9.77734375, -8.849609375, -7.921875, -6.994140625, -6.06640625, -5.138671875, -4.2109375, -3.283203125, -2.35546875, -1.427734375, -0.5, 0.427734375, 1.35546875, 2.283203125, 3.2109375, 4.138671875, 5.06640625, 5.994140625, 6.921875, 7.849609375, 8.77734375, 9.705078125, 10.6328125, 11.560546875, 12.48828125, 13.416015625, 14.34375, 15.271484375, 16.19921875, 17.126953125, 18.0546875, 18.982421875, 19.91015625, 20.837890625, 21.765625, 22.693359375, 23.62109375, 24.548828125, 25.4765625, 26.404296875, 27.33203125, 28.259765625, 29.1875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 6.0, 11.0, 10.0, 5.0, 7.0, 14.0, 19.0, 38.0, 43.0, 65.0, 103.0, 150.0, 233.0, 569.0, 1860.0, 20861.0, 918818.0, 100558.0, 3584.0, 767.0, 322.0, 163.0, 114.0, 72.0, 44.0, 25.0, 27.0, 16.0, 22.0, 6.0, 5.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-25.953125, -25.225830078125, -24.49853515625, -23.771240234375, -23.0439453125, -22.316650390625, -21.58935546875, -20.862060546875, -20.134765625, -19.407470703125, -18.68017578125, -17.952880859375, -17.2255859375, -16.498291015625, -15.77099609375, -15.043701171875, -14.31640625, -13.589111328125, -12.86181640625, -12.134521484375, -11.4072265625, -10.679931640625, -9.95263671875, -9.225341796875, -8.498046875, -7.770751953125, -7.04345703125, -6.316162109375, -5.5888671875, -4.861572265625, -4.13427734375, -3.406982421875, -2.6796875, -1.952392578125, -1.22509765625, -0.497802734375, 0.2294921875, 0.956787109375, 1.68408203125, 2.411376953125, 3.138671875, 3.865966796875, 4.59326171875, 5.320556640625, 6.0478515625, 6.775146484375, 7.50244140625, 8.229736328125, 8.95703125, 9.684326171875, 10.41162109375, 11.138916015625, 11.8662109375, 12.593505859375, 13.32080078125, 14.048095703125, 14.775390625, 15.502685546875, 16.22998046875, 16.957275390625, 17.6845703125, 18.411865234375, 19.13916015625, 19.866455078125, 20.59375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 7.0, 18.0, 22.0, 25.0, 37.0, 53.0, 78.0, 97.0, 147.0, 126.0, 104.0, 75.0, 64.0, 42.0, 24.0, 17.0, 17.0, 12.0, 5.0, 6.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0014333724975585938, -0.0013885349035263062, -0.0013436973094940186, -0.001298859715461731, -0.0012540221214294434, -0.0012091845273971558, -0.0011643469333648682, -0.0011195093393325806, -0.001074671745300293, -0.0010298341512680054, -0.0009849965572357178, -0.0009401589632034302, -0.0008953213691711426, -0.000850483775138855, -0.0008056461811065674, -0.0007608085870742798, -0.0007159709930419922, -0.0006711333990097046, -0.000626295804977417, -0.0005814582109451294, -0.0005366206169128418, -0.0004917830228805542, -0.0004469454288482666, -0.000402107834815979, -0.0003572702407836914, -0.0003124326467514038, -0.0002675950527191162, -0.0002227574586868286, -0.00017791986465454102, -0.00013308227062225342, -8.824467658996582e-05, -4.340708255767822e-05, 1.430511474609375e-06, 4.626810550689697e-05, 9.110569953918457e-05, 0.00013594329357147217, 0.00018078088760375977, 0.00022561848163604736, 0.00027045607566833496, 0.00031529366970062256, 0.00036013126373291016, 0.00040496885776519775, 0.00044980645179748535, 0.000494644045829773, 0.0005394816398620605, 0.0005843192338943481, 0.0006291568279266357, 0.0006739944219589233, 0.0007188320159912109, 0.0007636696100234985, 0.0008085072040557861, 0.0008533447980880737, 0.0008981823921203613, 0.0009430199861526489, 0.0009878575801849365, 0.0010326951742172241, 0.0010775327682495117, 0.0011223703622817993, 0.001167207956314087, 0.0012120455503463745, 0.0012568831443786621, 0.0013017207384109497, 0.0013465583324432373, 0.001391395926475525, 0.0014362335205078125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 9.0, 17.0, 16.0, 17.0, 32.0, 58.0, 61.0, 136.0, 180.0, 360.0, 798.0, 2212.0, 8738.0, 84636.0, 883005.0, 57712.0, 7004.0, 1926.0, 755.0, 354.0, 181.0, 107.0, 71.0, 32.0, 38.0, 28.0, 17.0, 14.0, 7.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-21.734375, -21.12109375, -20.5078125, -19.89453125, -19.28125, -18.66796875, -18.0546875, -17.44140625, -16.828125, -16.21484375, -15.6015625, -14.98828125, -14.375, -13.76171875, -13.1484375, -12.53515625, -11.921875, -11.30859375, -10.6953125, -10.08203125, -9.46875, -8.85546875, -8.2421875, -7.62890625, -7.015625, -6.40234375, -5.7890625, -5.17578125, -4.5625, -3.94921875, -3.3359375, -2.72265625, -2.109375, -1.49609375, -0.8828125, -0.26953125, 0.34375, 0.95703125, 1.5703125, 2.18359375, 2.796875, 3.41015625, 4.0234375, 4.63671875, 5.25, 5.86328125, 6.4765625, 7.08984375, 7.703125, 8.31640625, 8.9296875, 9.54296875, 10.15625, 10.76953125, 11.3828125, 11.99609375, 12.609375, 13.22265625, 13.8359375, 14.44921875, 15.0625, 15.67578125, 16.2890625, 16.90234375, 17.515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 12.0, 6.0, 11.0, 17.0, 23.0, 38.0, 61.0, 115.0, 161.0, 172.0, 143.0, 94.0, 52.0, 25.0, 20.0, 11.0, 11.0, 7.0, 6.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.203125, -16.6181640625, -16.033203125, -15.4482421875, -14.86328125, -14.2783203125, -13.693359375, -13.1083984375, -12.5234375, -11.9384765625, -11.353515625, -10.7685546875, -10.18359375, -9.5986328125, -9.013671875, -8.4287109375, -7.84375, -7.2587890625, -6.673828125, -6.0888671875, -5.50390625, -4.9189453125, -4.333984375, -3.7490234375, -3.1640625, -2.5791015625, -1.994140625, -1.4091796875, -0.82421875, -0.2392578125, 0.345703125, 0.9306640625, 1.515625, 2.1005859375, 2.685546875, 3.2705078125, 3.85546875, 4.4404296875, 5.025390625, 5.6103515625, 6.1953125, 6.7802734375, 7.365234375, 7.9501953125, 8.53515625, 9.1201171875, 9.705078125, 10.2900390625, 10.875, 11.4599609375, 12.044921875, 12.6298828125, 13.21484375, 13.7998046875, 14.384765625, 14.9697265625, 15.5546875, 16.1396484375, 16.724609375, 17.3095703125, 17.89453125, 18.4794921875, 19.064453125, 19.6494140625, 20.234375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 18.0, 73.0, 184.0, 305.0, 244.0, 115.0, 27.0, 12.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-331.9559326171875, -322.10931396484375, -312.2626953125, -302.41607666015625, -292.5694580078125, -282.72283935546875, -272.876220703125, -263.0296325683594, -253.18301391601562, -243.33639526367188, -233.48977661132812, -223.64315795898438, -213.7965545654297, -203.94993591308594, -194.1033172607422, -184.2567138671875, -174.4100799560547, -164.56346130371094, -154.7168426513672, -144.8702392578125, -135.02362060546875, -125.177001953125, -115.33038330078125, -105.48377227783203, -95.63715362548828, -85.79053497314453, -75.94392395019531, -66.09730529785156, -56.25069046020508, -46.404075622558594, -36.557456970214844, -26.710845947265625, -16.864227294921875, -7.017611503601074, 2.8290042877197266, 12.675621032714844, 22.522235870361328, 32.36885070800781, 42.21546936035156, 52.06208038330078, 61.90869903564453, 71.75531768798828, 81.6019287109375, 91.44854736328125, 101.295166015625, 111.14177703857422, 120.98839569091797, 130.8350067138672, 140.68162536621094, 150.5282440185547, 160.37486267089844, 170.22146606445312, 180.06808471679688, 189.91470336914062, 199.76132202148438, 209.60794067382812, 219.45455932617188, 229.30117797851562, 239.14779663085938, 248.99441528320312, 258.8410339355469, 268.6876220703125, 278.53424072265625, 288.380859375, 298.22747802734375]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 3.0, 7.0, 9.0, 11.0, 18.0, 21.0, 27.0, 24.0, 33.0, 42.0, 50.0, 48.0, 55.0, 52.0, 66.0, 67.0, 49.0, 43.0, 64.0, 61.0, 46.0, 33.0, 45.0, 34.0, 24.0, 19.0, 11.0, 15.0, 10.0, 6.0, 11.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.1114501953125, -128.2686309814453, -123.42582702636719, -118.5830078125, -113.74019622802734, -108.89738464355469, -104.05457305908203, -99.21176147460938, -94.36894226074219, -89.52613067626953, -84.68331909179688, -79.84049987792969, -74.99768829345703, -70.15487670898438, -65.31206512451172, -60.4692497253418, -55.626441955566406, -50.78363037109375, -45.94081497192383, -41.09800338745117, -36.25518798828125, -31.412376403808594, -26.569564819335938, -21.726749420166016, -16.88393783569336, -12.04112434387207, -7.198311805725098, -2.355499267578125, 2.487314224243164, 7.330127716064453, 12.17293930053711, 17.01575469970703, 21.858566284179688, 26.701379776000977, 31.544193267822266, 36.38700485229492, 41.229820251464844, 46.0726318359375, 50.915443420410156, 55.75825881958008, 60.601070404052734, 65.44388580322266, 70.28669738769531, 75.12950897216797, 79.97232055664062, 84.81513977050781, 89.65794372558594, 94.50076293945312, 99.34357452392578, 104.18638610839844, 109.0291976928711, 113.87200927734375, 118.71482849121094, 123.5576400756836, 128.40045166015625, 133.24327087402344, 138.08607482910156, 142.92889404296875, 147.77169799804688, 152.61451721191406, 157.4573211669922, 162.30014038085938, 167.1429443359375, 171.9857635498047, 176.82858276367188]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 7.0, 11.0, 10.0, 22.0, 18.0, 36.0, 70.0, 115.0, 257.0, 605.0, 1584.0, 7661.0, 135655.0, 4027080.0, 16851.0, 2722.0, 859.0, 324.0, 172.0, 92.0, 41.0, 37.0, 22.0, 9.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.03125, -29.00244140625, -27.9736328125, -26.94482421875, -25.916015625, -24.88720703125, -23.8583984375, -22.82958984375, -21.80078125, -20.77197265625, -19.7431640625, -18.71435546875, -17.685546875, -16.65673828125, -15.6279296875, -14.59912109375, -13.5703125, -12.54150390625, -11.5126953125, -10.48388671875, -9.455078125, -8.42626953125, -7.3974609375, -6.36865234375, -5.33984375, -4.31103515625, -3.2822265625, -2.25341796875, -1.224609375, -0.19580078125, 0.8330078125, 1.86181640625, 2.890625, 3.91943359375, 4.9482421875, 5.97705078125, 7.005859375, 8.03466796875, 9.0634765625, 10.09228515625, 11.12109375, 12.14990234375, 13.1787109375, 14.20751953125, 15.236328125, 16.26513671875, 17.2939453125, 18.32275390625, 19.3515625, 20.38037109375, 21.4091796875, 22.43798828125, 23.466796875, 24.49560546875, 25.5244140625, 26.55322265625, 27.58203125, 28.61083984375, 29.6396484375, 30.66845703125, 31.697265625, 32.72607421875, 33.7548828125, 34.78369140625, 35.8125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 14.0, 13.0, 25.0, 20.0, 23.0, 45.0, 48.0, 55.0, 62.0, 76.0, 94.0, 76.0, 79.0, 77.0, 54.0, 61.0, 43.0, 33.0, 23.0, 18.0, 18.0, 11.0, 9.0, 7.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.6953125, -10.3743896484375, -10.053466796875, -9.7325439453125, -9.41162109375, -9.0906982421875, -8.769775390625, -8.4488525390625, -8.1279296875, -7.8070068359375, -7.486083984375, -7.1651611328125, -6.84423828125, -6.5233154296875, -6.202392578125, -5.8814697265625, -5.560546875, -5.2396240234375, -4.918701171875, -4.5977783203125, -4.27685546875, -3.9559326171875, -3.635009765625, -3.3140869140625, -2.9931640625, -2.6722412109375, -2.351318359375, -2.0303955078125, -1.70947265625, -1.3885498046875, -1.067626953125, -0.7467041015625, -0.42578125, -0.1048583984375, 0.216064453125, 0.5369873046875, 0.85791015625, 1.1788330078125, 1.499755859375, 1.8206787109375, 2.1416015625, 2.4625244140625, 2.783447265625, 3.1043701171875, 3.42529296875, 3.7462158203125, 4.067138671875, 4.3880615234375, 4.708984375, 5.0299072265625, 5.350830078125, 5.6717529296875, 5.99267578125, 6.3135986328125, 6.634521484375, 6.9554443359375, 7.2763671875, 7.5972900390625, 7.918212890625, 8.2391357421875, 8.56005859375, 8.8809814453125, 9.201904296875, 9.5228271484375, 9.84375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 9.0, 14.0, 12.0, 23.0, 27.0, 31.0, 35.0, 63.0, 68.0, 114.0, 158.0, 228.0, 379.0, 580.0, 961.0, 1885.0, 4183.0, 12105.0, 61110.0, 3916942.0, 163300.0, 20417.0, 5953.0, 2481.0, 1198.0, 690.0, 414.0, 291.0, 186.0, 110.0, 95.0, 66.0, 31.0, 37.0, 27.0, 21.0, 16.0, 5.0, 5.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4921875, -12.0567626953125, -11.621337890625, -11.1859130859375, -10.75048828125, -10.3150634765625, -9.879638671875, -9.4442138671875, -9.0087890625, -8.5733642578125, -8.137939453125, -7.7025146484375, -7.26708984375, -6.8316650390625, -6.396240234375, -5.9608154296875, -5.525390625, -5.0899658203125, -4.654541015625, -4.2191162109375, -3.78369140625, -3.3482666015625, -2.912841796875, -2.4774169921875, -2.0419921875, -1.6065673828125, -1.171142578125, -0.7357177734375, -0.30029296875, 0.1351318359375, 0.570556640625, 1.0059814453125, 1.44140625, 1.8768310546875, 2.312255859375, 2.7476806640625, 3.18310546875, 3.6185302734375, 4.053955078125, 4.4893798828125, 4.9248046875, 5.3602294921875, 5.795654296875, 6.2310791015625, 6.66650390625, 7.1019287109375, 7.537353515625, 7.9727783203125, 8.408203125, 8.8436279296875, 9.279052734375, 9.7144775390625, 10.14990234375, 10.5853271484375, 11.020751953125, 11.4561767578125, 11.8916015625, 12.3270263671875, 12.762451171875, 13.1978759765625, 13.63330078125, 14.0687255859375, 14.504150390625, 14.9395751953125, 15.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 15.0, 53.0, 110.0, 3085.0, 654.0, 87.0, 30.0, 11.0, 9.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.66796875, -7.4710693359375, -7.274169921875, -7.0772705078125, -6.88037109375, -6.6834716796875, -6.486572265625, -6.2896728515625, -6.0927734375, -5.8958740234375, -5.698974609375, -5.5020751953125, -5.30517578125, -5.1082763671875, -4.911376953125, -4.7144775390625, -4.517578125, -4.3206787109375, -4.123779296875, -3.9268798828125, -3.72998046875, -3.5330810546875, -3.336181640625, -3.1392822265625, -2.9423828125, -2.7454833984375, -2.548583984375, -2.3516845703125, -2.15478515625, -1.9578857421875, -1.760986328125, -1.5640869140625, -1.3671875, -1.1702880859375, -0.973388671875, -0.7764892578125, -0.57958984375, -0.3826904296875, -0.185791015625, 0.0111083984375, 0.2080078125, 0.4049072265625, 0.601806640625, 0.7987060546875, 0.99560546875, 1.1925048828125, 1.389404296875, 1.5863037109375, 1.783203125, 1.9801025390625, 2.177001953125, 2.3739013671875, 2.57080078125, 2.7677001953125, 2.964599609375, 3.1614990234375, 3.3583984375, 3.5552978515625, 3.752197265625, 3.9490966796875, 4.14599609375, 4.3428955078125, 4.539794921875, 4.7366943359375, 4.93359375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 17.0, 45.0, 186.0, 392.0, 268.0, 65.0, 11.0, 10.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.90681457519531, -63.607025146484375, -62.30723571777344, -61.007442474365234, -59.7076530456543, -58.40786361694336, -57.10807418823242, -55.80828094482422, -54.50849151611328, -53.208702087402344, -51.908912658691406, -50.6091194152832, -49.309329986572266, -48.00954055786133, -46.70975112915039, -45.40995788574219, -44.11016845703125, -42.81037902832031, -41.510589599609375, -40.21079635620117, -38.911006927490234, -37.6112174987793, -36.31142807006836, -35.011634826660156, -33.711849212646484, -32.41205978393555, -31.112268447875977, -29.81247901916504, -28.51268768310547, -27.21289825439453, -25.913108825683594, -24.613317489624023, -23.313528060913086, -22.01373863220215, -20.713947296142578, -19.41415786743164, -18.11436653137207, -16.814577102661133, -15.514786720275879, -14.214996337890625, -12.915205955505371, -11.615415573120117, -10.315625190734863, -9.01583480834961, -7.716044902801514, -6.41625452041626, -5.116464614868164, -3.81667423248291, -2.5168838500976562, -1.217093586921692, 0.08269667625427246, 1.3824868202209473, 2.682277202606201, 3.982067584991455, 5.281857490539551, 6.581647872924805, 7.881438255310059, 9.181228637695312, 10.481019020080566, 11.78080940246582, 13.080598831176758, 14.380390167236328, 15.680179595947266, 16.979969024658203, 18.279760360717773]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 5.0, 8.0, 13.0, 28.0, 31.0, 42.0, 49.0, 77.0, 78.0, 78.0, 84.0, 79.0, 70.0, 64.0, 82.0, 57.0, 38.0, 35.0, 24.0, 20.0, 8.0, 15.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.594514846801758, -15.123682975769043, -14.652851104736328, -14.182018280029297, -13.711186408996582, -13.240354537963867, -12.769521713256836, -12.298689842224121, -11.827857971191406, -11.357026100158691, -10.886194229125977, -10.415361404418945, -9.94452953338623, -9.473697662353516, -9.002864837646484, -8.53203296661377, -8.061201095581055, -7.59036922454834, -7.119536876678467, -6.648704528808594, -6.177872657775879, -5.707040786743164, -5.236208438873291, -4.765376091003418, -4.294544219970703, -3.823712110519409, -3.3528800010681152, -2.8820478916168213, -2.4112157821655273, -1.9403836727142334, -1.4695515632629395, -0.9987194538116455, -0.527888298034668, -0.05705618858337402, 0.4137759208679199, 0.8846080303192139, 1.3554401397705078, 1.8262722492218018, 2.2971043586730957, 2.7679364681243896, 3.2387685775756836, 3.7096006870269775, 4.1804327964782715, 4.6512651443481445, 5.122097015380859, 5.592928886413574, 6.063761234283447, 6.53459358215332, 7.005425453186035, 7.47625732421875, 7.947089672088623, 8.417922019958496, 8.888753890991211, 9.359585762023926, 9.83041763305664, 10.301250457763672, 10.772082328796387, 11.242914199829102, 11.713747024536133, 12.184578895568848, 12.655410766601562, 13.126242637634277, 13.597074508666992, 14.067907333374023, 14.538739204406738]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 9.0, 5.0, 16.0, 22.0, 50.0, 80.0, 135.0, 274.0, 502.0, 1147.0, 3211.0, 11820.0, 61654.0, 361528.0, 486005.0, 97532.0, 17515.0, 4273.0, 1448.0, 616.0, 300.0, 166.0, 89.0, 58.0, 38.0, 25.0, 8.0, 9.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.96875, -20.272705078125, -19.57666015625, -18.880615234375, -18.1845703125, -17.488525390625, -16.79248046875, -16.096435546875, -15.400390625, -14.704345703125, -14.00830078125, -13.312255859375, -12.6162109375, -11.920166015625, -11.22412109375, -10.528076171875, -9.83203125, -9.135986328125, -8.43994140625, -7.743896484375, -7.0478515625, -6.351806640625, -5.65576171875, -4.959716796875, -4.263671875, -3.567626953125, -2.87158203125, -2.175537109375, -1.4794921875, -0.783447265625, -0.08740234375, 0.608642578125, 1.3046875, 2.000732421875, 2.69677734375, 3.392822265625, 4.0888671875, 4.784912109375, 5.48095703125, 6.177001953125, 6.873046875, 7.569091796875, 8.26513671875, 8.961181640625, 9.6572265625, 10.353271484375, 11.04931640625, 11.745361328125, 12.44140625, 13.137451171875, 13.83349609375, 14.529541015625, 15.2255859375, 15.921630859375, 16.61767578125, 17.313720703125, 18.009765625, 18.705810546875, 19.40185546875, 20.097900390625, 20.7939453125, 21.489990234375, 22.18603515625, 22.882080078125, 23.578125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 15.0, 14.0, 15.0, 24.0, 30.0, 33.0, 44.0, 53.0, 60.0, 75.0, 79.0, 73.0, 67.0, 82.0, 66.0, 62.0, 47.0, 40.0, 33.0, 17.0, 24.0, 12.0, 8.0, 11.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.796875, -10.47705078125, -10.1572265625, -9.83740234375, -9.517578125, -9.19775390625, -8.8779296875, -8.55810546875, -8.23828125, -7.91845703125, -7.5986328125, -7.27880859375, -6.958984375, -6.63916015625, -6.3193359375, -5.99951171875, -5.6796875, -5.35986328125, -5.0400390625, -4.72021484375, -4.400390625, -4.08056640625, -3.7607421875, -3.44091796875, -3.12109375, -2.80126953125, -2.4814453125, -2.16162109375, -1.841796875, -1.52197265625, -1.2021484375, -0.88232421875, -0.5625, -0.24267578125, 0.0771484375, 0.39697265625, 0.716796875, 1.03662109375, 1.3564453125, 1.67626953125, 1.99609375, 2.31591796875, 2.6357421875, 2.95556640625, 3.275390625, 3.59521484375, 3.9150390625, 4.23486328125, 4.5546875, 4.87451171875, 5.1943359375, 5.51416015625, 5.833984375, 6.15380859375, 6.4736328125, 6.79345703125, 7.11328125, 7.43310546875, 7.7529296875, 8.07275390625, 8.392578125, 8.71240234375, 9.0322265625, 9.35205078125, 9.671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 10.0, 26.0, 36.0, 55.0, 108.0, 189.0, 379.0, 1006.0, 3317.0, 33037.0, 936404.0, 67087.0, 4719.0, 1231.0, 472.0, 209.0, 96.0, 65.0, 32.0, 25.0, 16.0, 9.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.03125, -46.15478515625, -44.2783203125, -42.40185546875, -40.525390625, -38.64892578125, -36.7724609375, -34.89599609375, -33.01953125, -31.14306640625, -29.2666015625, -27.39013671875, -25.513671875, -23.63720703125, -21.7607421875, -19.88427734375, -18.0078125, -16.13134765625, -14.2548828125, -12.37841796875, -10.501953125, -8.62548828125, -6.7490234375, -4.87255859375, -2.99609375, -1.11962890625, 0.7568359375, 2.63330078125, 4.509765625, 6.38623046875, 8.2626953125, 10.13916015625, 12.015625, 13.89208984375, 15.7685546875, 17.64501953125, 19.521484375, 21.39794921875, 23.2744140625, 25.15087890625, 27.02734375, 28.90380859375, 30.7802734375, 32.65673828125, 34.533203125, 36.40966796875, 38.2861328125, 40.16259765625, 42.0390625, 43.91552734375, 45.7919921875, 47.66845703125, 49.544921875, 51.42138671875, 53.2978515625, 55.17431640625, 57.05078125, 58.92724609375, 60.8037109375, 62.68017578125, 64.556640625, 66.43310546875, 68.3095703125, 70.18603515625, 72.0625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 1.0, 10.0, 4.0, 4.0, 12.0, 10.0, 22.0, 23.0, 24.0, 31.0, 47.0, 59.0, 65.0, 64.0, 87.0, 88.0, 75.0, 78.0, 58.0, 53.0, 41.0, 41.0, 19.0, 18.0, 6.0, 14.0, 13.0, 8.0, 9.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.5625, -46.83984375, -45.1171875, -43.39453125, -41.671875, -39.94921875, -38.2265625, -36.50390625, -34.78125, -33.05859375, -31.3359375, -29.61328125, -27.890625, -26.16796875, -24.4453125, -22.72265625, -21.0, -19.27734375, -17.5546875, -15.83203125, -14.109375, -12.38671875, -10.6640625, -8.94140625, -7.21875, -5.49609375, -3.7734375, -2.05078125, -0.328125, 1.39453125, 3.1171875, 4.83984375, 6.5625, 8.28515625, 10.0078125, 11.73046875, 13.453125, 15.17578125, 16.8984375, 18.62109375, 20.34375, 22.06640625, 23.7890625, 25.51171875, 27.234375, 28.95703125, 30.6796875, 32.40234375, 34.125, 35.84765625, 37.5703125, 39.29296875, 41.015625, 42.73828125, 44.4609375, 46.18359375, 47.90625, 49.62890625, 51.3515625, 53.07421875, 54.796875, 56.51953125, 58.2421875, 59.96484375, 61.6875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 5.0, 10.0, 16.0, 14.0, 19.0, 31.0, 24.0, 43.0, 67.0, 86.0, 188.0, 303.0, 639.0, 2287.0, 28034.0, 987559.0, 25566.0, 2224.0, 634.0, 288.0, 150.0, 97.0, 66.0, 51.0, 35.0, 27.0, 21.0, 14.0, 12.0, 6.0, 12.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.1875, -30.1298828125, -29.072265625, -28.0146484375, -26.95703125, -25.8994140625, -24.841796875, -23.7841796875, -22.7265625, -21.6689453125, -20.611328125, -19.5537109375, -18.49609375, -17.4384765625, -16.380859375, -15.3232421875, -14.265625, -13.2080078125, -12.150390625, -11.0927734375, -10.03515625, -8.9775390625, -7.919921875, -6.8623046875, -5.8046875, -4.7470703125, -3.689453125, -2.6318359375, -1.57421875, -0.5166015625, 0.541015625, 1.5986328125, 2.65625, 3.7138671875, 4.771484375, 5.8291015625, 6.88671875, 7.9443359375, 9.001953125, 10.0595703125, 11.1171875, 12.1748046875, 13.232421875, 14.2900390625, 15.34765625, 16.4052734375, 17.462890625, 18.5205078125, 19.578125, 20.6357421875, 21.693359375, 22.7509765625, 23.80859375, 24.8662109375, 25.923828125, 26.9814453125, 28.0390625, 29.0966796875, 30.154296875, 31.2119140625, 32.26953125, 33.3271484375, 34.384765625, 35.4423828125, 36.5]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 6.0, 13.0, 10.0, 11.0, 21.0, 26.0, 27.0, 44.0, 53.0, 69.0, 98.0, 140.0, 108.0, 95.0, 67.0, 51.0, 45.0, 36.0, 23.0, 12.0, 10.0, 9.0, 6.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0013723373413085938, -0.0013263523578643799, -0.001280367374420166, -0.0012343823909759521, -0.0011883974075317383, -0.0011424124240875244, -0.0010964274406433105, -0.0010504424571990967, -0.0010044574737548828, -0.0009584724903106689, -0.0009124875068664551, -0.0008665025234222412, -0.0008205175399780273, -0.0007745325565338135, -0.0007285475730895996, -0.0006825625896453857, -0.0006365776062011719, -0.000590592622756958, -0.0005446076393127441, -0.0004986226558685303, -0.0004526376724243164, -0.00040665268898010254, -0.00036066770553588867, -0.0003146827220916748, -0.00026869773864746094, -0.00022271275520324707, -0.0001767277717590332, -0.00013074278831481934, -8.475780487060547e-05, -3.87728214263916e-05, 7.212162017822266e-06, 5.319714546203613e-05, 9.918212890625e-05, 0.00014516711235046387, 0.00019115209579467773, 0.0002371370792388916, 0.00028312206268310547, 0.00032910704612731934, 0.0003750920295715332, 0.00042107701301574707, 0.00046706199645996094, 0.0005130469799041748, 0.0005590319633483887, 0.0006050169467926025, 0.0006510019302368164, 0.0006969869136810303, 0.0007429718971252441, 0.000788956880569458, 0.0008349418640136719, 0.0008809268474578857, 0.0009269118309020996, 0.0009728968143463135, 0.0010188817977905273, 0.0010648667812347412, 0.001110851764678955, 0.001156836748123169, 0.0012028217315673828, 0.0012488067150115967, 0.0012947916984558105, 0.0013407766819000244, 0.0013867616653442383, 0.0014327466487884521, 0.001478731632232666, 0.0015247166156768799, 0.0015707015991210938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 8.0, 8.0, 18.0, 9.0, 17.0, 43.0, 68.0, 109.0, 161.0, 281.0, 646.0, 1974.0, 7707.0, 71710.0, 909140.0, 47497.0, 6185.0, 1601.0, 625.0, 295.0, 146.0, 118.0, 51.0, 36.0, 22.0, 11.0, 13.0, 8.0, 2.0, 8.0, 10.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -23.932373046875, -23.14599609375, -22.359619140625, -21.5732421875, -20.786865234375, -20.00048828125, -19.214111328125, -18.427734375, -17.641357421875, -16.85498046875, -16.068603515625, -15.2822265625, -14.495849609375, -13.70947265625, -12.923095703125, -12.13671875, -11.350341796875, -10.56396484375, -9.777587890625, -8.9912109375, -8.204833984375, -7.41845703125, -6.632080078125, -5.845703125, -5.059326171875, -4.27294921875, -3.486572265625, -2.7001953125, -1.913818359375, -1.12744140625, -0.341064453125, 0.4453125, 1.231689453125, 2.01806640625, 2.804443359375, 3.5908203125, 4.377197265625, 5.16357421875, 5.949951171875, 6.736328125, 7.522705078125, 8.30908203125, 9.095458984375, 9.8818359375, 10.668212890625, 11.45458984375, 12.240966796875, 13.02734375, 13.813720703125, 14.60009765625, 15.386474609375, 16.1728515625, 16.959228515625, 17.74560546875, 18.531982421875, 19.318359375, 20.104736328125, 20.89111328125, 21.677490234375, 22.4638671875, 23.250244140625, 24.03662109375, 24.822998046875, 25.609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 11.0, 13.0, 22.0, 52.0, 92.0, 207.0, 209.0, 152.0, 85.0, 51.0, 22.0, 17.0, 12.0, 9.0, 5.0, 6.0, 5.0, 4.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.15625, -28.1953125, -27.234375, -26.2734375, -25.3125, -24.3515625, -23.390625, -22.4296875, -21.46875, -20.5078125, -19.546875, -18.5859375, -17.625, -16.6640625, -15.703125, -14.7421875, -13.78125, -12.8203125, -11.859375, -10.8984375, -9.9375, -8.9765625, -8.015625, -7.0546875, -6.09375, -5.1328125, -4.171875, -3.2109375, -2.25, -1.2890625, -0.328125, 0.6328125, 1.59375, 2.5546875, 3.515625, 4.4765625, 5.4375, 6.3984375, 7.359375, 8.3203125, 9.28125, 10.2421875, 11.203125, 12.1640625, 13.125, 14.0859375, 15.046875, 16.0078125, 16.96875, 17.9296875, 18.890625, 19.8515625, 20.8125, 21.7734375, 22.734375, 23.6953125, 24.65625, 25.6171875, 26.578125, 27.5390625, 28.5, 29.4609375, 30.421875, 31.3828125, 32.34375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 11.0, 51.0, 190.0, 396.0, 234.0, 75.0, 28.0, 11.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-417.301025390625, -404.06207275390625, -390.8231201171875, -377.58416748046875, -364.34521484375, -351.10626220703125, -337.8673095703125, -324.62835693359375, -311.389404296875, -298.15045166015625, -284.9114990234375, -271.67254638671875, -258.43359375, -245.19464111328125, -231.95570373535156, -218.7167510986328, -205.47781372070312, -192.23886108398438, -178.99990844726562, -165.76095581054688, -152.52200317382812, -139.28305053710938, -126.04411315917969, -112.80516052246094, -99.56620788574219, -86.32725524902344, -73.08830261230469, -59.84935760498047, -46.61040496826172, -33.37145233154297, -20.13250732421875, -6.8935546875, 6.34539794921875, 19.584348678588867, 32.823299407958984, 46.06224822998047, 59.30120086669922, 72.54015350341797, 85.77909851074219, 99.01805114746094, 112.25700378417969, 125.49595642089844, 138.7349090576172, 151.97384643554688, 165.21279907226562, 178.45175170898438, 191.69070434570312, 204.92965698242188, 218.16860961914062, 231.40756225585938, 244.64651489257812, 257.8854675292969, 271.1244201660156, 284.3633728027344, 297.602294921875, 310.84124755859375, 324.0802001953125, 337.31915283203125, 350.55810546875, 363.79705810546875, 377.0360107421875, 390.27496337890625, 403.513916015625, 416.75286865234375, 429.9918212890625]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 3.0, 12.0, 7.0, 8.0, 12.0, 15.0, 18.0, 17.0, 24.0, 20.0, 24.0, 36.0, 30.0, 30.0, 29.0, 50.0, 46.0, 44.0, 42.0, 36.0, 38.0, 39.0, 42.0, 49.0, 39.0, 22.0, 34.0, 30.0, 21.0, 28.0, 22.0, 15.0, 28.0, 17.0, 19.0, 7.0, 17.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-142.9937744140625, -138.75523376464844, -134.5166778564453, -130.27813720703125, -126.03958892822266, -121.80104064941406, -117.56249237060547, -113.32394409179688, -109.08540344238281, -104.84685516357422, -100.60830688476562, -96.36976623535156, -92.13121795654297, -87.89266967773438, -83.65412139892578, -79.41557312011719, -75.1770248413086, -70.9384765625, -66.6999282836914, -62.46138381958008, -58.22283935546875, -53.984291076660156, -49.74574279785156, -45.50719451904297, -41.26865005493164, -37.03010177612305, -32.79155731201172, -28.553009033203125, -24.314462661743164, -20.075916290283203, -15.83736801147461, -11.598821640014648, -7.3602752685546875, -3.1217284202575684, 1.1168184280395508, 5.355365753173828, 9.593912124633789, 13.83245849609375, 18.071006774902344, 22.309553146362305, 26.548099517822266, 30.786645889282227, 35.02519226074219, 39.26374053955078, 43.502288818359375, 47.7408332824707, 51.9793815612793, 56.217926025390625, 60.45647430419922, 64.69502258300781, 68.9335708618164, 73.172119140625, 77.41065979003906, 81.64920806884766, 85.88775634765625, 90.12630462646484, 94.36485290527344, 98.60340118408203, 102.84194946289062, 107.08049011230469, 111.31903839111328, 115.55758666992188, 119.79613494873047, 124.03468322753906, 128.27322387695312]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 5.0, 3.0, 10.0, 7.0, 14.0, 22.0, 40.0, 55.0, 87.0, 161.0, 311.0, 636.0, 1642.0, 4851.0, 25740.0, 3940954.0, 202084.0, 12332.0, 3051.0, 1181.0, 495.0, 230.0, 120.0, 79.0, 39.0, 40.0, 24.0, 18.0, 15.0, 6.0, 7.0, 6.0, 2.0, 8.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.59375, -32.570068359375, -31.54638671875, -30.522705078125, -29.4990234375, -28.475341796875, -27.45166015625, -26.427978515625, -25.404296875, -24.380615234375, -23.35693359375, -22.333251953125, -21.3095703125, -20.285888671875, -19.26220703125, -18.238525390625, -17.21484375, -16.191162109375, -15.16748046875, -14.143798828125, -13.1201171875, -12.096435546875, -11.07275390625, -10.049072265625, -9.025390625, -8.001708984375, -6.97802734375, -5.954345703125, -4.9306640625, -3.906982421875, -2.88330078125, -1.859619140625, -0.8359375, 0.187744140625, 1.21142578125, 2.235107421875, 3.2587890625, 4.282470703125, 5.30615234375, 6.329833984375, 7.353515625, 8.377197265625, 9.40087890625, 10.424560546875, 11.4482421875, 12.471923828125, 13.49560546875, 14.519287109375, 15.54296875, 16.566650390625, 17.59033203125, 18.614013671875, 19.6376953125, 20.661376953125, 21.68505859375, 22.708740234375, 23.732421875, 24.756103515625, 25.77978515625, 26.803466796875, 27.8271484375, 28.850830078125, 29.87451171875, 30.898193359375, 31.921875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 5.0, 6.0, 15.0, 16.0, 21.0, 31.0, 55.0, 48.0, 68.0, 70.0, 70.0, 101.0, 94.0, 76.0, 70.0, 60.0, 49.0, 34.0, 29.0, 22.0, 12.0, 15.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8515625, -10.5, -10.1484375, -9.796875, -9.4453125, -9.09375, -8.7421875, -8.390625, -8.0390625, -7.6875, -7.3359375, -6.984375, -6.6328125, -6.28125, -5.9296875, -5.578125, -5.2265625, -4.875, -4.5234375, -4.171875, -3.8203125, -3.46875, -3.1171875, -2.765625, -2.4140625, -2.0625, -1.7109375, -1.359375, -1.0078125, -0.65625, -0.3046875, 0.046875, 0.3984375, 0.75, 1.1015625, 1.453125, 1.8046875, 2.15625, 2.5078125, 2.859375, 3.2109375, 3.5625, 3.9140625, 4.265625, 4.6171875, 4.96875, 5.3203125, 5.671875, 6.0234375, 6.375, 6.7265625, 7.078125, 7.4296875, 7.78125, 8.1328125, 8.484375, 8.8359375, 9.1875, 9.5390625, 9.890625, 10.2421875, 10.59375, 10.9453125, 11.296875, 11.6484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 6.0, 9.0, 7.0, 11.0, 18.0, 35.0, 24.0, 42.0, 75.0, 73.0, 108.0, 143.0, 240.0, 324.0, 432.0, 646.0, 964.0, 1633.0, 2774.0, 5326.0, 11254.0, 32047.0, 205504.0, 3782400.0, 107009.0, 23288.0, 8866.0, 4380.0, 2375.0, 1382.0, 919.0, 607.0, 392.0, 272.0, 211.0, 145.0, 105.0, 70.0, 47.0, 35.0, 23.0, 18.0, 14.0, 6.0, 14.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-13.5390625, -13.13330078125, -12.7275390625, -12.32177734375, -11.916015625, -11.51025390625, -11.1044921875, -10.69873046875, -10.29296875, -9.88720703125, -9.4814453125, -9.07568359375, -8.669921875, -8.26416015625, -7.8583984375, -7.45263671875, -7.046875, -6.64111328125, -6.2353515625, -5.82958984375, -5.423828125, -5.01806640625, -4.6123046875, -4.20654296875, -3.80078125, -3.39501953125, -2.9892578125, -2.58349609375, -2.177734375, -1.77197265625, -1.3662109375, -0.96044921875, -0.5546875, -0.14892578125, 0.2568359375, 0.66259765625, 1.068359375, 1.47412109375, 1.8798828125, 2.28564453125, 2.69140625, 3.09716796875, 3.5029296875, 3.90869140625, 4.314453125, 4.72021484375, 5.1259765625, 5.53173828125, 5.9375, 6.34326171875, 6.7490234375, 7.15478515625, 7.560546875, 7.96630859375, 8.3720703125, 8.77783203125, 9.18359375, 9.58935546875, 9.9951171875, 10.40087890625, 10.806640625, 11.21240234375, 11.6181640625, 12.02392578125, 12.4296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 15.0, 11.0, 30.0, 51.0, 142.0, 2015.0, 1520.0, 144.0, 58.0, 25.0, 15.0, 13.0, 9.0, 1.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.0, -12.6485595703125, -12.297119140625, -11.9456787109375, -11.59423828125, -11.2427978515625, -10.891357421875, -10.5399169921875, -10.1884765625, -9.8370361328125, -9.485595703125, -9.1341552734375, -8.78271484375, -8.4312744140625, -8.079833984375, -7.7283935546875, -7.376953125, -7.0255126953125, -6.674072265625, -6.3226318359375, -5.97119140625, -5.6197509765625, -5.268310546875, -4.9168701171875, -4.5654296875, -4.2139892578125, -3.862548828125, -3.5111083984375, -3.15966796875, -2.8082275390625, -2.456787109375, -2.1053466796875, -1.75390625, -1.4024658203125, -1.051025390625, -0.6995849609375, -0.34814453125, 0.0032958984375, 0.354736328125, 0.7061767578125, 1.0576171875, 1.4090576171875, 1.760498046875, 2.1119384765625, 2.46337890625, 2.8148193359375, 3.166259765625, 3.5177001953125, 3.869140625, 4.2205810546875, 4.572021484375, 4.9234619140625, 5.27490234375, 5.6263427734375, 5.977783203125, 6.3292236328125, 6.6806640625, 7.0321044921875, 7.383544921875, 7.7349853515625, 8.08642578125, 8.4378662109375, 8.789306640625, 9.1407470703125, 9.4921875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 8.0, 11.0, 36.0, 61.0, 98.0, 207.0, 243.0, 188.0, 87.0, 31.0, 17.0, 6.0, 9.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.73462677001953, -85.80229187011719, -83.86994934082031, -81.93761444091797, -80.0052719116211, -78.07293701171875, -76.14059448242188, -74.20825958251953, -72.27591705322266, -70.34358215332031, -68.41123962402344, -66.4789047241211, -64.54656219482422, -62.61422348022461, -60.681884765625, -58.749549865722656, -56.81721115112305, -54.88487243652344, -52.95253372192383, -51.02019500732422, -49.08785629272461, -47.155517578125, -45.223182678222656, -43.29084014892578, -41.35850524902344, -39.42616653442383, -37.49382781982422, -35.56148910522461, -33.629150390625, -31.69681167602539, -29.764474868774414, -27.832136154174805, -25.899799346923828, -23.96746063232422, -22.03512191772461, -20.102783203125, -18.17044448852539, -16.23810577392578, -14.305768966674805, -12.373430252075195, -10.441091537475586, -8.508752822875977, -6.576414585113525, -4.644076347351074, -2.711737632751465, -0.7793989181518555, 1.1529388427734375, 3.085277557373047, 5.017616271972656, 6.949954986572266, 8.882293701171875, 10.814631462097168, 12.746970176696777, 14.679308891296387, 16.61164665222168, 18.54398536682129, 20.4763240814209, 22.408662796020508, 24.341001510620117, 26.273338317871094, 28.205677032470703, 30.138015747070312, 32.07035446166992, 34.00269317626953, 35.93503189086914]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 7.0, 12.0, 9.0, 17.0, 22.0, 28.0, 18.0, 20.0, 32.0, 29.0, 29.0, 30.0, 38.0, 34.0, 47.0, 43.0, 41.0, 48.0, 38.0, 47.0, 46.0, 33.0, 38.0, 41.0, 32.0, 28.0, 20.0, 25.0, 29.0, 18.0, 11.0, 21.0, 13.0, 17.0, 6.0, 5.0, 9.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.06989288330078, -16.444284439086914, -15.81867504119873, -15.193066596984863, -14.567458152770996, -13.941848754882812, -13.316240310668945, -12.690631866455078, -12.065023422241211, -11.439414978027344, -10.81380558013916, -10.188197135925293, -9.562588691711426, -8.936979293823242, -8.311370849609375, -7.685762405395508, -7.060153007507324, -6.434544086456299, -5.808935642242432, -5.183326721191406, -4.557718276977539, -3.9321093559265137, -3.3065004348754883, -2.680891990661621, -2.0552830696105957, -1.4296743869781494, -0.8040655851364136, -0.17845678329467773, 0.44715189933776855, 1.0727605819702148, 1.6983695030212402, 2.3239779472351074, 2.949586868286133, 3.575195550918579, 4.200804233551025, 4.826413154602051, 5.452021598815918, 6.077630519866943, 6.703239440917969, 7.328847885131836, 7.954456806182861, 8.580065727233887, 9.205674171447754, 9.831283569335938, 10.456892013549805, 11.082500457763672, 11.708108901977539, 12.333717346191406, 12.95932674407959, 13.584935188293457, 14.21054458618164, 14.836153030395508, 15.461761474609375, 16.087369918823242, 16.71297836303711, 17.33858871459961, 17.964197158813477, 18.589805603027344, 19.21541404724121, 19.841022491455078, 20.466632843017578, 21.092241287231445, 21.717849731445312, 22.34345817565918, 22.969066619873047]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 13.0, 19.0, 25.0, 51.0, 71.0, 127.0, 210.0, 369.0, 754.0, 1672.0, 4143.0, 13445.0, 64770.0, 384804.0, 468387.0, 84628.0, 16574.0, 4760.0, 1868.0, 858.0, 409.0, 234.0, 104.0, 73.0, 52.0, 27.0, 26.0, 12.0, 14.0, 14.0, 4.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-24.953125, -24.24169921875, -23.5302734375, -22.81884765625, -22.107421875, -21.39599609375, -20.6845703125, -19.97314453125, -19.26171875, -18.55029296875, -17.8388671875, -17.12744140625, -16.416015625, -15.70458984375, -14.9931640625, -14.28173828125, -13.5703125, -12.85888671875, -12.1474609375, -11.43603515625, -10.724609375, -10.01318359375, -9.3017578125, -8.59033203125, -7.87890625, -7.16748046875, -6.4560546875, -5.74462890625, -5.033203125, -4.32177734375, -3.6103515625, -2.89892578125, -2.1875, -1.47607421875, -0.7646484375, -0.05322265625, 0.658203125, 1.36962890625, 2.0810546875, 2.79248046875, 3.50390625, 4.21533203125, 4.9267578125, 5.63818359375, 6.349609375, 7.06103515625, 7.7724609375, 8.48388671875, 9.1953125, 9.90673828125, 10.6181640625, 11.32958984375, 12.041015625, 12.75244140625, 13.4638671875, 14.17529296875, 14.88671875, 15.59814453125, 16.3095703125, 17.02099609375, 17.732421875, 18.44384765625, 19.1552734375, 19.86669921875, 20.578125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 12.0, 12.0, 32.0, 27.0, 37.0, 49.0, 58.0, 70.0, 91.0, 64.0, 96.0, 88.0, 65.0, 65.0, 53.0, 38.0, 32.0, 24.0, 16.0, 15.0, 11.0, 11.0, 5.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.015625, -10.662353515625, -10.30908203125, -9.955810546875, -9.6025390625, -9.249267578125, -8.89599609375, -8.542724609375, -8.189453125, -7.836181640625, -7.48291015625, -7.129638671875, -6.7763671875, -6.423095703125, -6.06982421875, -5.716552734375, -5.36328125, -5.010009765625, -4.65673828125, -4.303466796875, -3.9501953125, -3.596923828125, -3.24365234375, -2.890380859375, -2.537109375, -2.183837890625, -1.83056640625, -1.477294921875, -1.1240234375, -0.770751953125, -0.41748046875, -0.064208984375, 0.2890625, 0.642333984375, 0.99560546875, 1.348876953125, 1.7021484375, 2.055419921875, 2.40869140625, 2.761962890625, 3.115234375, 3.468505859375, 3.82177734375, 4.175048828125, 4.5283203125, 4.881591796875, 5.23486328125, 5.588134765625, 5.94140625, 6.294677734375, 6.64794921875, 7.001220703125, 7.3544921875, 7.707763671875, 8.06103515625, 8.414306640625, 8.767578125, 9.120849609375, 9.47412109375, 9.827392578125, 10.1806640625, 10.533935546875, 10.88720703125, 11.240478515625, 11.59375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 7.0, 10.0, 14.0, 14.0, 21.0, 22.0, 36.0, 61.0, 86.0, 117.0, 240.0, 484.0, 992.0, 3148.0, 17617.0, 583967.0, 422229.0, 14665.0, 2848.0, 963.0, 403.0, 229.0, 126.0, 80.0, 40.0, 37.0, 19.0, 28.0, 17.0, 7.0, 9.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.59375, -50.998046875, -49.40234375, -47.806640625, -46.2109375, -44.615234375, -43.01953125, -41.423828125, -39.828125, -38.232421875, -36.63671875, -35.041015625, -33.4453125, -31.849609375, -30.25390625, -28.658203125, -27.0625, -25.466796875, -23.87109375, -22.275390625, -20.6796875, -19.083984375, -17.48828125, -15.892578125, -14.296875, -12.701171875, -11.10546875, -9.509765625, -7.9140625, -6.318359375, -4.72265625, -3.126953125, -1.53125, 0.064453125, 1.66015625, 3.255859375, 4.8515625, 6.447265625, 8.04296875, 9.638671875, 11.234375, 12.830078125, 14.42578125, 16.021484375, 17.6171875, 19.212890625, 20.80859375, 22.404296875, 24.0, 25.595703125, 27.19140625, 28.787109375, 30.3828125, 31.978515625, 33.57421875, 35.169921875, 36.765625, 38.361328125, 39.95703125, 41.552734375, 43.1484375, 44.744140625, 46.33984375, 47.935546875, 49.53125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 4.0, 7.0, 16.0, 11.0, 16.0, 18.0, 45.0, 47.0, 60.0, 60.0, 66.0, 65.0, 74.0, 87.0, 95.0, 61.0, 65.0, 48.0, 46.0, 23.0, 23.0, 12.0, 14.0, 6.0, 7.0, 8.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-67.0, -65.31005859375, -63.6201171875, -61.93017578125, -60.240234375, -58.55029296875, -56.8603515625, -55.17041015625, -53.48046875, -51.79052734375, -50.1005859375, -48.41064453125, -46.720703125, -45.03076171875, -43.3408203125, -41.65087890625, -39.9609375, -38.27099609375, -36.5810546875, -34.89111328125, -33.201171875, -31.51123046875, -29.8212890625, -28.13134765625, -26.44140625, -24.75146484375, -23.0615234375, -21.37158203125, -19.681640625, -17.99169921875, -16.3017578125, -14.61181640625, -12.921875, -11.23193359375, -9.5419921875, -7.85205078125, -6.162109375, -4.47216796875, -2.7822265625, -1.09228515625, 0.59765625, 2.28759765625, 3.9775390625, 5.66748046875, 7.357421875, 9.04736328125, 10.7373046875, 12.42724609375, 14.1171875, 15.80712890625, 17.4970703125, 19.18701171875, 20.876953125, 22.56689453125, 24.2568359375, 25.94677734375, 27.63671875, 29.32666015625, 31.0166015625, 32.70654296875, 34.396484375, 36.08642578125, 37.7763671875, 39.46630859375, 41.15625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 3.0, 10.0, 18.0, 11.0, 24.0, 25.0, 25.0, 24.0, 46.0, 83.0, 117.0, 152.0, 220.0, 416.0, 931.0, 2755.0, 14194.0, 176640.0, 786934.0, 55837.0, 6715.0, 1662.0, 681.0, 349.0, 201.0, 128.0, 92.0, 69.0, 54.0, 41.0, 17.0, 18.0, 12.0, 12.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.53125, -12.130859375, -11.73046875, -11.330078125, -10.9296875, -10.529296875, -10.12890625, -9.728515625, -9.328125, -8.927734375, -8.52734375, -8.126953125, -7.7265625, -7.326171875, -6.92578125, -6.525390625, -6.125, -5.724609375, -5.32421875, -4.923828125, -4.5234375, -4.123046875, -3.72265625, -3.322265625, -2.921875, -2.521484375, -2.12109375, -1.720703125, -1.3203125, -0.919921875, -0.51953125, -0.119140625, 0.28125, 0.681640625, 1.08203125, 1.482421875, 1.8828125, 2.283203125, 2.68359375, 3.083984375, 3.484375, 3.884765625, 4.28515625, 4.685546875, 5.0859375, 5.486328125, 5.88671875, 6.287109375, 6.6875, 7.087890625, 7.48828125, 7.888671875, 8.2890625, 8.689453125, 9.08984375, 9.490234375, 9.890625, 10.291015625, 10.69140625, 11.091796875, 11.4921875, 11.892578125, 12.29296875, 12.693359375, 13.09375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 6.0, 5.0, 12.0, 10.0, 17.0, 28.0, 33.0, 54.0, 67.0, 104.0, 157.0, 156.0, 89.0, 69.0, 48.0, 42.0, 33.0, 15.0, 16.0, 9.0, 12.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014410018920898438, -0.0013854354619979858, -0.001329869031906128, -0.00127430260181427, -0.0012187361717224121, -0.0011631697416305542, -0.0011076033115386963, -0.0010520368814468384, -0.0009964704513549805, -0.0009409040212631226, -0.0008853375911712646, -0.0008297711610794067, -0.0007742047309875488, -0.0007186383008956909, -0.000663071870803833, -0.0006075054407119751, -0.0005519390106201172, -0.0004963725805282593, -0.00044080615043640137, -0.00038523972034454346, -0.00032967329025268555, -0.00027410686016082764, -0.00021854043006896973, -0.00016297399997711182, -0.0001074075698852539, -5.1841139793395996e-05, 3.725290298461914e-06, 5.9291720390319824e-05, 0.00011485815048217773, 0.00017042458057403564, 0.00022599101066589355, 0.00028155744075775146, 0.0003371238708496094, 0.0003926903009414673, 0.0004482567310333252, 0.0005038231611251831, 0.000559389591217041, 0.0006149560213088989, 0.0006705224514007568, 0.0007260888814926147, 0.0007816553115844727, 0.0008372217416763306, 0.0008927881717681885, 0.0009483546018600464, 0.0010039210319519043, 0.0010594874620437622, 0.0011150538921356201, 0.001170620322227478, 0.001226186752319336, 0.0012817531824111938, 0.0013373196125030518, 0.0013928860425949097, 0.0014484524726867676, 0.0015040189027786255, 0.0015595853328704834, 0.0016151517629623413, 0.0016707181930541992, 0.0017262846231460571, 0.001781851053237915, 0.001837417483329773, 0.0018929839134216309, 0.0019485503435134888, 0.0020041167736053467, 0.0020596832036972046, 0.0021152496337890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 1.0, 5.0, 15.0, 10.0, 18.0, 24.0, 25.0, 52.0, 92.0, 153.0, 279.0, 600.0, 1366.0, 4506.0, 22153.0, 408334.0, 576471.0, 26511.0, 5051.0, 1554.0, 587.0, 308.0, 157.0, 85.0, 61.0, 49.0, 18.0, 20.0, 8.0, 12.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.015625, -13.515869140625, -13.01611328125, -12.516357421875, -12.0166015625, -11.516845703125, -11.01708984375, -10.517333984375, -10.017578125, -9.517822265625, -9.01806640625, -8.518310546875, -8.0185546875, -7.518798828125, -7.01904296875, -6.519287109375, -6.01953125, -5.519775390625, -5.02001953125, -4.520263671875, -4.0205078125, -3.520751953125, -3.02099609375, -2.521240234375, -2.021484375, -1.521728515625, -1.02197265625, -0.522216796875, -0.0224609375, 0.477294921875, 0.97705078125, 1.476806640625, 1.9765625, 2.476318359375, 2.97607421875, 3.475830078125, 3.9755859375, 4.475341796875, 4.97509765625, 5.474853515625, 5.974609375, 6.474365234375, 6.97412109375, 7.473876953125, 7.9736328125, 8.473388671875, 8.97314453125, 9.472900390625, 9.97265625, 10.472412109375, 10.97216796875, 11.471923828125, 11.9716796875, 12.471435546875, 12.97119140625, 13.470947265625, 13.970703125, 14.470458984375, 14.97021484375, 15.469970703125, 15.9697265625, 16.469482421875, 16.96923828125, 17.468994140625, 17.96875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 7.0, 2.0, 7.0, 11.0, 12.0, 19.0, 23.0, 26.0, 33.0, 23.0, 41.0, 43.0, 46.0, 65.0, 84.0, 69.0, 71.0, 57.0, 64.0, 52.0, 49.0, 25.0, 29.0, 17.0, 16.0, 16.0, 13.0, 15.0, 9.0, 5.0, 7.0, 5.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-7.8984375, -7.66937255859375, -7.4403076171875, -7.21124267578125, -6.982177734375, -6.75311279296875, -6.5240478515625, -6.29498291015625, -6.06591796875, -5.83685302734375, -5.6077880859375, -5.37872314453125, -5.149658203125, -4.92059326171875, -4.6915283203125, -4.46246337890625, -4.2333984375, -4.00433349609375, -3.7752685546875, -3.54620361328125, -3.317138671875, -3.08807373046875, -2.8590087890625, -2.62994384765625, -2.40087890625, -2.17181396484375, -1.9427490234375, -1.71368408203125, -1.484619140625, -1.25555419921875, -1.0264892578125, -0.79742431640625, -0.568359375, -0.33929443359375, -0.1102294921875, 0.11883544921875, 0.347900390625, 0.57696533203125, 0.8060302734375, 1.03509521484375, 1.26416015625, 1.49322509765625, 1.7222900390625, 1.95135498046875, 2.180419921875, 2.40948486328125, 2.6385498046875, 2.86761474609375, 3.0966796875, 3.32574462890625, 3.5548095703125, 3.78387451171875, 4.012939453125, 4.24200439453125, 4.4710693359375, 4.70013427734375, 4.92919921875, 5.15826416015625, 5.3873291015625, 5.61639404296875, 5.845458984375, 6.07452392578125, 6.3035888671875, 6.53265380859375, 6.76171875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 30.0, 67.0, 258.0, 358.0, 191.0, 61.0, 17.0, 3.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-245.54031372070312, -232.77296447753906, -220.005615234375, -207.23826599121094, -194.47091674804688, -181.7035675048828, -168.93621826171875, -156.1688690185547, -143.40151977539062, -130.63417053222656, -117.8668212890625, -105.09947204589844, -92.33212280273438, -79.56477355957031, -66.79742431640625, -54.03007507324219, -41.262725830078125, -28.495376586914062, -15.72802734375, -2.9606781005859375, 9.806671142578125, 22.574020385742188, 35.34136962890625, 48.10871887207031, 60.876068115234375, 73.64341735839844, 86.4107666015625, 99.17811584472656, 111.94546508789062, 124.71281433105469, 137.48016357421875, 150.2475128173828, 163.014892578125, 175.78224182128906, 188.54959106445312, 201.3169403076172, 214.08428955078125, 226.8516387939453, 239.61898803710938, 252.38633728027344, 265.1536865234375, 277.9210205078125, 290.6883850097656, 303.45574951171875, 316.22308349609375, 328.99041748046875, 341.7577819824219, 354.525146484375, 367.29248046875, 380.059814453125, 392.8271789550781, 405.59454345703125, 418.36187744140625, 431.12921142578125, 443.8965759277344, 456.6639404296875, 469.4312744140625, 482.1986083984375, 494.9659729003906, 507.73333740234375, 520.5006713867188, 533.2680053710938, 546.035400390625, 558.802734375, 571.570068359375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 5.0, 4.0, 7.0, 10.0, 7.0, 10.0, 15.0, 17.0, 18.0, 22.0, 31.0, 44.0, 36.0, 36.0, 48.0, 56.0, 54.0, 55.0, 56.0, 63.0, 48.0, 48.0, 42.0, 41.0, 37.0, 31.0, 30.0, 18.0, 18.0, 14.0, 14.0, 12.0, 15.0, 8.0, 9.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-142.78099060058594, -138.21658325195312, -133.6521759033203, -129.08775329589844, -124.52334594726562, -119.95893859863281, -115.39453125, -110.83012390136719, -106.26570892333984, -101.70130157470703, -97.13688659667969, -92.57247924804688, -88.00807189941406, -83.44365692138672, -78.8792495727539, -74.31483459472656, -69.75042724609375, -65.18601989746094, -60.621604919433594, -56.05719757080078, -51.4927864074707, -46.928375244140625, -42.36396789550781, -37.799556732177734, -33.235145568847656, -28.670734405517578, -24.106325149536133, -19.541915893554688, -14.97750473022461, -10.413093566894531, -5.848684310913086, -1.2842750549316406, 3.280120849609375, 7.844531059265137, 12.408941268920898, 16.973350524902344, 21.537761688232422, 26.1021728515625, 30.666582107543945, 35.23099136352539, 39.79540252685547, 44.35981369018555, 48.924224853515625, 53.48863220214844, 58.053043365478516, 62.617454528808594, 67.1818618774414, 71.74627685546875, 76.31068420410156, 80.87509155273438, 85.43950653076172, 90.00391387939453, 94.56832885742188, 99.13273620605469, 103.6971435546875, 108.26155090332031, 112.82596588134766, 117.39037322998047, 121.95478820800781, 126.51919555664062, 131.08360290527344, 135.64801025390625, 140.21243286132812, 144.77684020996094, 149.34124755859375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 14.0, 20.0, 20.0, 42.0, 47.0, 109.0, 269.0, 627.0, 1659.0, 6481.0, 54112.0, 3959135.0, 156902.0, 10928.0, 2415.0, 768.0, 311.0, 154.0, 88.0, 69.0, 31.0, 19.0, 14.0, 13.0, 7.0, 5.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.6875, -31.716064453125, -30.74462890625, -29.773193359375, -28.8017578125, -27.830322265625, -26.85888671875, -25.887451171875, -24.916015625, -23.944580078125, -22.97314453125, -22.001708984375, -21.0302734375, -20.058837890625, -19.08740234375, -18.115966796875, -17.14453125, -16.173095703125, -15.20166015625, -14.230224609375, -13.2587890625, -12.287353515625, -11.31591796875, -10.344482421875, -9.373046875, -8.401611328125, -7.43017578125, -6.458740234375, -5.4873046875, -4.515869140625, -3.54443359375, -2.572998046875, -1.6015625, -0.630126953125, 0.34130859375, 1.312744140625, 2.2841796875, 3.255615234375, 4.22705078125, 5.198486328125, 6.169921875, 7.141357421875, 8.11279296875, 9.084228515625, 10.0556640625, 11.027099609375, 11.99853515625, 12.969970703125, 13.94140625, 14.912841796875, 15.88427734375, 16.855712890625, 17.8271484375, 18.798583984375, 19.77001953125, 20.741455078125, 21.712890625, 22.684326171875, 23.65576171875, 24.627197265625, 25.5986328125, 26.570068359375, 27.54150390625, 28.512939453125, 29.484375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 10.0, 18.0, 16.0, 17.0, 26.0, 32.0, 60.0, 52.0, 63.0, 75.0, 74.0, 89.0, 89.0, 75.0, 75.0, 45.0, 45.0, 35.0, 25.0, 22.0, 15.0, 11.0, 6.0, 4.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8828125, -10.5255126953125, -10.168212890625, -9.8109130859375, -9.45361328125, -9.0963134765625, -8.739013671875, -8.3817138671875, -8.0244140625, -7.6671142578125, -7.309814453125, -6.9525146484375, -6.59521484375, -6.2379150390625, -5.880615234375, -5.5233154296875, -5.166015625, -4.8087158203125, -4.451416015625, -4.0941162109375, -3.73681640625, -3.3795166015625, -3.022216796875, -2.6649169921875, -2.3076171875, -1.9503173828125, -1.593017578125, -1.2357177734375, -0.87841796875, -0.5211181640625, -0.163818359375, 0.1934814453125, 0.55078125, 0.9080810546875, 1.265380859375, 1.6226806640625, 1.97998046875, 2.3372802734375, 2.694580078125, 3.0518798828125, 3.4091796875, 3.7664794921875, 4.123779296875, 4.4810791015625, 4.83837890625, 5.1956787109375, 5.552978515625, 5.9102783203125, 6.267578125, 6.6248779296875, 6.982177734375, 7.3394775390625, 7.69677734375, 8.0540771484375, 8.411376953125, 8.7686767578125, 9.1259765625, 9.4832763671875, 9.840576171875, 10.1978759765625, 10.55517578125, 10.9124755859375, 11.269775390625, 11.6270751953125, 11.984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 9.0, 12.0, 11.0, 19.0, 31.0, 62.0, 165.0, 359.0, 838.0, 2796.0, 20613.0, 3498188.0, 655633.0, 12654.0, 1905.0, 553.0, 222.0, 96.0, 37.0, 22.0, 11.0, 12.0, 10.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.65625, -23.41796875, -22.1796875, -20.94140625, -19.703125, -18.46484375, -17.2265625, -15.98828125, -14.75, -13.51171875, -12.2734375, -11.03515625, -9.796875, -8.55859375, -7.3203125, -6.08203125, -4.84375, -3.60546875, -2.3671875, -1.12890625, 0.109375, 1.34765625, 2.5859375, 3.82421875, 5.0625, 6.30078125, 7.5390625, 8.77734375, 10.015625, 11.25390625, 12.4921875, 13.73046875, 14.96875, 16.20703125, 17.4453125, 18.68359375, 19.921875, 21.16015625, 22.3984375, 23.63671875, 24.875, 26.11328125, 27.3515625, 28.58984375, 29.828125, 31.06640625, 32.3046875, 33.54296875, 34.78125, 36.01953125, 37.2578125, 38.49609375, 39.734375, 40.97265625, 42.2109375, 43.44921875, 44.6875, 45.92578125, 47.1640625, 48.40234375, 49.640625, 50.87890625, 52.1171875, 53.35546875, 54.59375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 11.0, 12.0, 11.0, 17.0, 19.0, 31.0, 61.0, 93.0, 315.0, 1496.0, 1434.0, 326.0, 97.0, 46.0, 34.0, 17.0, 10.0, 15.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.53125, -36.65966796875, -35.7880859375, -34.91650390625, -34.044921875, -33.17333984375, -32.3017578125, -31.43017578125, -30.55859375, -29.68701171875, -28.8154296875, -27.94384765625, -27.072265625, -26.20068359375, -25.3291015625, -24.45751953125, -23.5859375, -22.71435546875, -21.8427734375, -20.97119140625, -20.099609375, -19.22802734375, -18.3564453125, -17.48486328125, -16.61328125, -15.74169921875, -14.8701171875, -13.99853515625, -13.126953125, -12.25537109375, -11.3837890625, -10.51220703125, -9.640625, -8.76904296875, -7.8974609375, -7.02587890625, -6.154296875, -5.28271484375, -4.4111328125, -3.53955078125, -2.66796875, -1.79638671875, -0.9248046875, -0.05322265625, 0.818359375, 1.68994140625, 2.5615234375, 3.43310546875, 4.3046875, 5.17626953125, 6.0478515625, 6.91943359375, 7.791015625, 8.66259765625, 9.5341796875, 10.40576171875, 11.27734375, 12.14892578125, 13.0205078125, 13.89208984375, 14.763671875, 15.63525390625, 16.5068359375, 17.37841796875, 18.25]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 15.0, 20.0, 43.0, 152.0, 288.0, 263.0, 132.0, 51.0, 12.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-422.85546875, -414.736083984375, -406.61669921875, -398.497314453125, -390.3779296875, -382.258544921875, -374.13916015625, -366.019775390625, -357.900390625, -349.781005859375, -341.66162109375, -333.542236328125, -325.4228515625, -317.303466796875, -309.18408203125, -301.064697265625, -292.9453430175781, -284.8259582519531, -276.7065734863281, -268.5871887207031, -260.4678039550781, -252.34841918945312, -244.2290496826172, -236.1096649169922, -227.9902801513672, -219.8708953857422, -211.7515106201172, -203.6321258544922, -195.51275634765625, -187.39337158203125, -179.27398681640625, -171.15460205078125, -163.03524780273438, -154.91586303710938, -146.79647827148438, -138.67709350585938, -130.55770874023438, -122.4383316040039, -114.31895446777344, -106.19956970214844, -98.0801773071289, -89.9607925415039, -81.84141540527344, -73.72203063964844, -65.60264587402344, -57.48326110839844, -49.3638801574707, -41.24449920654297, -33.12511444091797, -25.0057315826416, -16.886348724365234, -8.766965866088867, -0.6475830078125, 7.4718017578125, 15.591182708740234, 23.71056365966797, 31.82994842529297, 39.94933319091797, 48.0687141418457, 56.18809509277344, 64.30747985839844, 72.42686462402344, 80.54624938964844, 88.6656265258789, 96.7850112915039]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 9.0, 7.0, 13.0, 13.0, 12.0, 20.0, 21.0, 32.0, 35.0, 42.0, 53.0, 52.0, 60.0, 70.0, 58.0, 55.0, 74.0, 65.0, 51.0, 61.0, 53.0, 39.0, 24.0, 27.0, 14.0, 6.0, 8.0, 10.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.60990905761719, -119.7569580078125, -115.90399932861328, -112.0510482788086, -108.1980972290039, -104.34513854980469, -100.4921875, -96.63923645019531, -92.7862777709961, -88.9333267211914, -85.08036804199219, -81.2274169921875, -77.37446594238281, -73.5215072631836, -69.6685562133789, -65.81559753417969, -61.962650299072266, -58.10969543457031, -54.256744384765625, -50.40378952026367, -46.55083465576172, -42.69788360595703, -38.84492874145508, -34.991973876953125, -31.139020919799805, -27.286067962646484, -23.43311309814453, -19.58016014099121, -15.727206230163574, -11.874252319335938, -8.021299362182617, -4.168344497680664, -0.31539154052734375, 3.537562131881714, 7.3905158042907715, 11.24346923828125, 15.096423149108887, 18.949377059936523, 22.802330017089844, 26.655284881591797, 30.508237838745117, 34.36119079589844, 38.21414566040039, 42.067100524902344, 45.92005157470703, 49.773006439208984, 53.62596130371094, 57.478912353515625, 61.33186721801758, 65.18482208251953, 69.03777313232422, 72.89073181152344, 76.74368286132812, 80.59663391113281, 84.4495849609375, 88.30254364013672, 92.1554946899414, 96.0084457397461, 99.86140441894531, 103.71435546875, 107.56730651855469, 111.4202651977539, 115.2732162475586, 119.12617492675781, 122.9791259765625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 10.0, 10.0, 16.0, 17.0, 38.0, 41.0, 62.0, 85.0, 157.0, 252.0, 489.0, 966.0, 1963.0, 4618.0, 13885.0, 51195.0, 229505.0, 534101.0, 156792.0, 36792.0, 10460.0, 3701.0, 1615.0, 727.0, 374.0, 240.0, 128.0, 102.0, 58.0, 41.0, 33.0, 20.0, 18.0, 4.0, 8.0, 6.0, 4.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-19.375, -18.776611328125, -18.17822265625, -17.579833984375, -16.9814453125, -16.383056640625, -15.78466796875, -15.186279296875, -14.587890625, -13.989501953125, -13.39111328125, -12.792724609375, -12.1943359375, -11.595947265625, -10.99755859375, -10.399169921875, -9.80078125, -9.202392578125, -8.60400390625, -8.005615234375, -7.4072265625, -6.808837890625, -6.21044921875, -5.612060546875, -5.013671875, -4.415283203125, -3.81689453125, -3.218505859375, -2.6201171875, -2.021728515625, -1.42333984375, -0.824951171875, -0.2265625, 0.371826171875, 0.97021484375, 1.568603515625, 2.1669921875, 2.765380859375, 3.36376953125, 3.962158203125, 4.560546875, 5.158935546875, 5.75732421875, 6.355712890625, 6.9541015625, 7.552490234375, 8.15087890625, 8.749267578125, 9.34765625, 9.946044921875, 10.54443359375, 11.142822265625, 11.7412109375, 12.339599609375, 12.93798828125, 13.536376953125, 14.134765625, 14.733154296875, 15.33154296875, 15.929931640625, 16.5283203125, 17.126708984375, 17.72509765625, 18.323486328125, 18.921875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 12.0, 9.0, 17.0, 15.0, 23.0, 36.0, 36.0, 49.0, 66.0, 92.0, 79.0, 70.0, 93.0, 70.0, 68.0, 59.0, 52.0, 36.0, 32.0, 17.0, 24.0, 13.0, 11.0, 2.0, 7.0, 4.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.984375, -10.6287841796875, -10.273193359375, -9.9176025390625, -9.56201171875, -9.2064208984375, -8.850830078125, -8.4952392578125, -8.1396484375, -7.7840576171875, -7.428466796875, -7.0728759765625, -6.71728515625, -6.3616943359375, -6.006103515625, -5.6505126953125, -5.294921875, -4.9393310546875, -4.583740234375, -4.2281494140625, -3.87255859375, -3.5169677734375, -3.161376953125, -2.8057861328125, -2.4501953125, -2.0946044921875, -1.739013671875, -1.3834228515625, -1.02783203125, -0.6722412109375, -0.316650390625, 0.0389404296875, 0.39453125, 0.7501220703125, 1.105712890625, 1.4613037109375, 1.81689453125, 2.1724853515625, 2.528076171875, 2.8836669921875, 3.2392578125, 3.5948486328125, 3.950439453125, 4.3060302734375, 4.66162109375, 5.0172119140625, 5.372802734375, 5.7283935546875, 6.083984375, 6.4395751953125, 6.795166015625, 7.1507568359375, 7.50634765625, 7.8619384765625, 8.217529296875, 8.5731201171875, 8.9287109375, 9.2843017578125, 9.639892578125, 9.9954833984375, 10.35107421875, 10.7066650390625, 11.062255859375, 11.4178466796875, 11.7734375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 6.0, 4.0, 5.0, 11.0, 16.0, 13.0, 12.0, 25.0, 36.0, 52.0, 72.0, 81.0, 138.0, 224.0, 388.0, 973.0, 2751.0, 11607.0, 192386.0, 806583.0, 25788.0, 4604.0, 1385.0, 553.0, 288.0, 166.0, 99.0, 59.0, 56.0, 42.0, 27.0, 19.0, 20.0, 15.0, 15.0, 5.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.40625, -46.80322265625, -45.2001953125, -43.59716796875, -41.994140625, -40.39111328125, -38.7880859375, -37.18505859375, -35.58203125, -33.97900390625, -32.3759765625, -30.77294921875, -29.169921875, -27.56689453125, -25.9638671875, -24.36083984375, -22.7578125, -21.15478515625, -19.5517578125, -17.94873046875, -16.345703125, -14.74267578125, -13.1396484375, -11.53662109375, -9.93359375, -8.33056640625, -6.7275390625, -5.12451171875, -3.521484375, -1.91845703125, -0.3154296875, 1.28759765625, 2.890625, 4.49365234375, 6.0966796875, 7.69970703125, 9.302734375, 10.90576171875, 12.5087890625, 14.11181640625, 15.71484375, 17.31787109375, 18.9208984375, 20.52392578125, 22.126953125, 23.72998046875, 25.3330078125, 26.93603515625, 28.5390625, 30.14208984375, 31.7451171875, 33.34814453125, 34.951171875, 36.55419921875, 38.1572265625, 39.76025390625, 41.36328125, 42.96630859375, 44.5693359375, 46.17236328125, 47.775390625, 49.37841796875, 50.9814453125, 52.58447265625, 54.1875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 10.0, 10.0, 10.0, 19.0, 27.0, 31.0, 48.0, 48.0, 46.0, 90.0, 67.0, 80.0, 67.0, 78.0, 86.0, 56.0, 50.0, 46.0, 37.0, 20.0, 21.0, 10.0, 12.0, 10.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.03125, -61.3447265625, -59.658203125, -57.9716796875, -56.28515625, -54.5986328125, -52.912109375, -51.2255859375, -49.5390625, -47.8525390625, -46.166015625, -44.4794921875, -42.79296875, -41.1064453125, -39.419921875, -37.7333984375, -36.046875, -34.3603515625, -32.673828125, -30.9873046875, -29.30078125, -27.6142578125, -25.927734375, -24.2412109375, -22.5546875, -20.8681640625, -19.181640625, -17.4951171875, -15.80859375, -14.1220703125, -12.435546875, -10.7490234375, -9.0625, -7.3759765625, -5.689453125, -4.0029296875, -2.31640625, -0.6298828125, 1.056640625, 2.7431640625, 4.4296875, 6.1162109375, 7.802734375, 9.4892578125, 11.17578125, 12.8623046875, 14.548828125, 16.2353515625, 17.921875, 19.6083984375, 21.294921875, 22.9814453125, 24.66796875, 26.3544921875, 28.041015625, 29.7275390625, 31.4140625, 33.1005859375, 34.787109375, 36.4736328125, 38.16015625, 39.8466796875, 41.533203125, 43.2197265625, 44.90625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 2.0, 13.0, 13.0, 21.0, 30.0, 34.0, 35.0, 75.0, 130.0, 268.0, 744.0, 3502.0, 92574.0, 937135.0, 11594.0, 1441.0, 412.0, 191.0, 100.0, 73.0, 41.0, 24.0, 17.0, 18.0, 15.0, 8.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.34375, -31.475341796875, -30.60693359375, -29.738525390625, -28.8701171875, -28.001708984375, -27.13330078125, -26.264892578125, -25.396484375, -24.528076171875, -23.65966796875, -22.791259765625, -21.9228515625, -21.054443359375, -20.18603515625, -19.317626953125, -18.44921875, -17.580810546875, -16.71240234375, -15.843994140625, -14.9755859375, -14.107177734375, -13.23876953125, -12.370361328125, -11.501953125, -10.633544921875, -9.76513671875, -8.896728515625, -8.0283203125, -7.159912109375, -6.29150390625, -5.423095703125, -4.5546875, -3.686279296875, -2.81787109375, -1.949462890625, -1.0810546875, -0.212646484375, 0.65576171875, 1.524169921875, 2.392578125, 3.260986328125, 4.12939453125, 4.997802734375, 5.8662109375, 6.734619140625, 7.60302734375, 8.471435546875, 9.33984375, 10.208251953125, 11.07666015625, 11.945068359375, 12.8134765625, 13.681884765625, 14.55029296875, 15.418701171875, 16.287109375, 17.155517578125, 18.02392578125, 18.892333984375, 19.7607421875, 20.629150390625, 21.49755859375, 22.365966796875, 23.234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 6.0, 5.0, 4.0, 7.0, 8.0, 9.0, 11.0, 24.0, 20.0, 25.0, 31.0, 52.0, 88.0, 111.0, 185.0, 117.0, 78.0, 52.0, 38.0, 30.0, 19.0, 18.0, 10.0, 16.0, 10.0, 8.0, 2.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016574859619140625, -0.001604720950126648, -0.0015519559383392334, -0.0014991909265518188, -0.0014464259147644043, -0.0013936609029769897, -0.0013408958911895752, -0.0012881308794021606, -0.001235365867614746, -0.0011826008558273315, -0.001129835844039917, -0.0010770708322525024, -0.0010243058204650879, -0.0009715408086776733, -0.0009187757968902588, -0.0008660107851028442, -0.0008132457733154297, -0.0007604807615280151, -0.0007077157497406006, -0.000654950737953186, -0.0006021857261657715, -0.0005494207143783569, -0.0004966557025909424, -0.00044389069080352783, -0.0003911256790161133, -0.00033836066722869873, -0.0002855956554412842, -0.00023283064365386963, -0.00018006563186645508, -0.00012730062007904053, -7.453560829162598e-05, -2.1770596504211426e-05, 3.0994415283203125e-05, 8.375942707061768e-05, 0.00013652443885803223, 0.00018928945064544678, 0.00024205446243286133, 0.0002948194742202759, 0.00034758448600769043, 0.000400349497795105, 0.00045311450958251953, 0.0005058795213699341, 0.0005586445331573486, 0.0006114095449447632, 0.0006641745567321777, 0.0007169395685195923, 0.0007697045803070068, 0.0008224695920944214, 0.0008752346038818359, 0.0009279996156692505, 0.000980764627456665, 0.0010335296392440796, 0.0010862946510314941, 0.0011390596628189087, 0.0011918246746063232, 0.0012445896863937378, 0.0012973546981811523, 0.001350119709968567, 0.0014028847217559814, 0.001455649733543396, 0.0015084147453308105, 0.001561179757118225, 0.0016139447689056396, 0.0016667097806930542, 0.0017194747924804688]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 12.0, 26.0, 42.0, 82.0, 130.0, 239.0, 532.0, 1652.0, 11125.0, 591426.0, 430310.0, 10296.0, 1635.0, 530.0, 223.0, 112.0, 70.0, 37.0, 24.0, 13.0, 5.0, 5.0, 2.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.0, -27.176025390625, -26.35205078125, -25.528076171875, -24.7041015625, -23.880126953125, -23.05615234375, -22.232177734375, -21.408203125, -20.584228515625, -19.76025390625, -18.936279296875, -18.1123046875, -17.288330078125, -16.46435546875, -15.640380859375, -14.81640625, -13.992431640625, -13.16845703125, -12.344482421875, -11.5205078125, -10.696533203125, -9.87255859375, -9.048583984375, -8.224609375, -7.400634765625, -6.57666015625, -5.752685546875, -4.9287109375, -4.104736328125, -3.28076171875, -2.456787109375, -1.6328125, -0.808837890625, 0.01513671875, 0.839111328125, 1.6630859375, 2.487060546875, 3.31103515625, 4.135009765625, 4.958984375, 5.782958984375, 6.60693359375, 7.430908203125, 8.2548828125, 9.078857421875, 9.90283203125, 10.726806640625, 11.55078125, 12.374755859375, 13.19873046875, 14.022705078125, 14.8466796875, 15.670654296875, 16.49462890625, 17.318603515625, 18.142578125, 18.966552734375, 19.79052734375, 20.614501953125, 21.4384765625, 22.262451171875, 23.08642578125, 23.910400390625, 24.734375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 5.0, 7.0, 12.0, 20.0, 32.0, 41.0, 43.0, 80.0, 103.0, 127.0, 135.0, 118.0, 84.0, 42.0, 39.0, 32.0, 15.0, 12.0, 6.0, 3.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.4609375, -14.048583984375, -13.63623046875, -13.223876953125, -12.8115234375, -12.399169921875, -11.98681640625, -11.574462890625, -11.162109375, -10.749755859375, -10.33740234375, -9.925048828125, -9.5126953125, -9.100341796875, -8.68798828125, -8.275634765625, -7.86328125, -7.450927734375, -7.03857421875, -6.626220703125, -6.2138671875, -5.801513671875, -5.38916015625, -4.976806640625, -4.564453125, -4.152099609375, -3.73974609375, -3.327392578125, -2.9150390625, -2.502685546875, -2.09033203125, -1.677978515625, -1.265625, -0.853271484375, -0.44091796875, -0.028564453125, 0.3837890625, 0.796142578125, 1.20849609375, 1.620849609375, 2.033203125, 2.445556640625, 2.85791015625, 3.270263671875, 3.6826171875, 4.094970703125, 4.50732421875, 4.919677734375, 5.33203125, 5.744384765625, 6.15673828125, 6.569091796875, 6.9814453125, 7.393798828125, 7.80615234375, 8.218505859375, 8.630859375, 9.043212890625, 9.45556640625, 9.867919921875, 10.2802734375, 10.692626953125, 11.10498046875, 11.517333984375, 11.9296875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 12.0, 29.0, 91.0, 201.0, 333.0, 189.0, 83.0, 32.0, 14.0, 5.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-450.59918212890625, -440.44879150390625, -430.29840087890625, -420.14801025390625, -409.99761962890625, -399.84722900390625, -389.69683837890625, -379.54644775390625, -369.39605712890625, -359.24566650390625, -349.09527587890625, -338.94488525390625, -328.79449462890625, -318.64410400390625, -308.49371337890625, -298.34332275390625, -288.19293212890625, -278.04254150390625, -267.89215087890625, -257.74176025390625, -247.59136962890625, -237.44097900390625, -227.29058837890625, -217.14019775390625, -206.98980712890625, -196.83941650390625, -186.68902587890625, -176.53863525390625, -166.38824462890625, -156.23785400390625, -146.08746337890625, -135.93707275390625, -125.78671264648438, -115.63632202148438, -105.48593139648438, -95.33554077148438, -85.18515014648438, -75.03475952148438, -64.88436889648438, -54.733978271484375, -44.583587646484375, -34.433197021484375, -24.282806396484375, -14.132415771484375, -3.982025146484375, 6.168365478515625, 16.318756103515625, 26.469146728515625, 36.619537353515625, 46.769927978515625, 56.920318603515625, 67.07070922851562, 77.22109985351562, 87.37149047851562, 97.52188110351562, 107.67227172851562, 117.82266235351562, 127.97305297851562, 138.12344360351562, 148.27383422851562, 158.42422485351562, 168.57461547851562, 178.72500610351562, 188.87539672851562, 199.02578735351562]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 9.0, 4.0, 14.0, 15.0, 9.0, 30.0, 25.0, 16.0, 29.0, 38.0, 30.0, 41.0, 36.0, 61.0, 47.0, 60.0, 57.0, 60.0, 54.0, 46.0, 47.0, 37.0, 42.0, 33.0, 27.0, 19.0, 23.0, 19.0, 10.0, 5.0, 16.0, 11.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-167.07421875, -162.71084594726562, -158.34747314453125, -153.98410034179688, -149.6207275390625, -145.25735473632812, -140.89398193359375, -136.53060913085938, -132.167236328125, -127.80386352539062, -123.44049072265625, -119.07711791992188, -114.7137451171875, -110.35037231445312, -105.98699188232422, -101.62361907958984, -97.26023864746094, -92.89686584472656, -88.53349304199219, -84.17012023925781, -79.80674743652344, -75.44337463378906, -71.07999420166016, -66.71662139892578, -62.353248596191406, -57.98987579345703, -53.626502990722656, -49.263126373291016, -44.89975357055664, -40.536380767822266, -36.173004150390625, -31.80963134765625, -27.446273803710938, -23.082901000976562, -18.719526290893555, -14.356152534484863, -9.992778778076172, -5.629405975341797, -1.266031265258789, 3.0973434448242188, 7.460716247558594, 11.824090003967285, 16.187463760375977, 20.550838470458984, 24.91421127319336, 29.277584075927734, 33.640960693359375, 38.00433349609375, 42.367706298828125, 46.7310791015625, 51.094451904296875, 55.457828521728516, 59.82120132446289, 64.1845703125, 68.5479507446289, 72.91132354736328, 77.27469635009766, 81.63806915283203, 86.0014419555664, 90.36481475830078, 94.72819519042969, 99.09156799316406, 103.45494079589844, 107.81831359863281, 112.18168640136719]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 11.0, 9.0, 17.0, 19.0, 19.0, 26.0, 22.0, 46.0, 77.0, 95.0, 177.0, 306.0, 536.0, 1038.0, 2189.0, 5551.0, 18305.0, 120270.0, 3236855.0, 742829.0, 48928.0, 10385.0, 3474.0, 1475.0, 712.0, 364.0, 198.0, 125.0, 90.0, 48.0, 28.0, 19.0, 17.0, 7.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.9609375, -15.501953125, -15.04296875, -14.583984375, -14.125, -13.666015625, -13.20703125, -12.748046875, -12.2890625, -11.830078125, -11.37109375, -10.912109375, -10.453125, -9.994140625, -9.53515625, -9.076171875, -8.6171875, -8.158203125, -7.69921875, -7.240234375, -6.78125, -6.322265625, -5.86328125, -5.404296875, -4.9453125, -4.486328125, -4.02734375, -3.568359375, -3.109375, -2.650390625, -2.19140625, -1.732421875, -1.2734375, -0.814453125, -0.35546875, 0.103515625, 0.5625, 1.021484375, 1.48046875, 1.939453125, 2.3984375, 2.857421875, 3.31640625, 3.775390625, 4.234375, 4.693359375, 5.15234375, 5.611328125, 6.0703125, 6.529296875, 6.98828125, 7.447265625, 7.90625, 8.365234375, 8.82421875, 9.283203125, 9.7421875, 10.201171875, 10.66015625, 11.119140625, 11.578125, 12.037109375, 12.49609375, 12.955078125, 13.4140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 6.0, 14.0, 12.0, 37.0, 23.0, 34.0, 44.0, 67.0, 56.0, 67.0, 74.0, 66.0, 70.0, 71.0, 71.0, 60.0, 47.0, 43.0, 34.0, 24.0, 23.0, 7.0, 7.0, 5.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.828125, -11.5030517578125, -11.177978515625, -10.8529052734375, -10.52783203125, -10.2027587890625, -9.877685546875, -9.5526123046875, -9.2275390625, -8.9024658203125, -8.577392578125, -8.2523193359375, -7.92724609375, -7.6021728515625, -7.277099609375, -6.9520263671875, -6.626953125, -6.3018798828125, -5.976806640625, -5.6517333984375, -5.32666015625, -5.0015869140625, -4.676513671875, -4.3514404296875, -4.0263671875, -3.7012939453125, -3.376220703125, -3.0511474609375, -2.72607421875, -2.4010009765625, -2.075927734375, -1.7508544921875, -1.42578125, -1.1007080078125, -0.775634765625, -0.4505615234375, -0.12548828125, 0.1995849609375, 0.524658203125, 0.8497314453125, 1.1748046875, 1.4998779296875, 1.824951171875, 2.1500244140625, 2.47509765625, 2.8001708984375, 3.125244140625, 3.4503173828125, 3.775390625, 4.1004638671875, 4.425537109375, 4.7506103515625, 5.07568359375, 5.4007568359375, 5.725830078125, 6.0509033203125, 6.3759765625, 6.7010498046875, 7.026123046875, 7.3511962890625, 7.67626953125, 8.0013427734375, 8.326416015625, 8.6514892578125, 8.9765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 8.0, 8.0, 14.0, 22.0, 40.0, 88.0, 147.0, 322.0, 738.0, 1970.0, 5706.0, 21474.0, 184888.0, 3753484.0, 194658.0, 21697.0, 5701.0, 1898.0, 693.0, 352.0, 179.0, 84.0, 40.0, 20.0, 21.0, 15.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.8125, -25.190673828125, -24.56884765625, -23.947021484375, -23.3251953125, -22.703369140625, -22.08154296875, -21.459716796875, -20.837890625, -20.216064453125, -19.59423828125, -18.972412109375, -18.3505859375, -17.728759765625, -17.10693359375, -16.485107421875, -15.86328125, -15.241455078125, -14.61962890625, -13.997802734375, -13.3759765625, -12.754150390625, -12.13232421875, -11.510498046875, -10.888671875, -10.266845703125, -9.64501953125, -9.023193359375, -8.4013671875, -7.779541015625, -7.15771484375, -6.535888671875, -5.9140625, -5.292236328125, -4.67041015625, -4.048583984375, -3.4267578125, -2.804931640625, -2.18310546875, -1.561279296875, -0.939453125, -0.317626953125, 0.30419921875, 0.926025390625, 1.5478515625, 2.169677734375, 2.79150390625, 3.413330078125, 4.03515625, 4.656982421875, 5.27880859375, 5.900634765625, 6.5224609375, 7.144287109375, 7.76611328125, 8.387939453125, 9.009765625, 9.631591796875, 10.25341796875, 10.875244140625, 11.4970703125, 12.118896484375, 12.74072265625, 13.362548828125, 13.984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 3.0, 7.0, 3.0, 9.0, 12.0, 17.0, 22.0, 55.0, 119.0, 234.0, 704.0, 1490.0, 848.0, 291.0, 113.0, 49.0, 24.0, 19.0, 16.0, 6.0, 6.0, 6.0, 8.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.65625, -18.992919921875, -18.32958984375, -17.666259765625, -17.0029296875, -16.339599609375, -15.67626953125, -15.012939453125, -14.349609375, -13.686279296875, -13.02294921875, -12.359619140625, -11.6962890625, -11.032958984375, -10.36962890625, -9.706298828125, -9.04296875, -8.379638671875, -7.71630859375, -7.052978515625, -6.3896484375, -5.726318359375, -5.06298828125, -4.399658203125, -3.736328125, -3.072998046875, -2.40966796875, -1.746337890625, -1.0830078125, -0.419677734375, 0.24365234375, 0.906982421875, 1.5703125, 2.233642578125, 2.89697265625, 3.560302734375, 4.2236328125, 4.886962890625, 5.55029296875, 6.213623046875, 6.876953125, 7.540283203125, 8.20361328125, 8.866943359375, 9.5302734375, 10.193603515625, 10.85693359375, 11.520263671875, 12.18359375, 12.846923828125, 13.51025390625, 14.173583984375, 14.8369140625, 15.500244140625, 16.16357421875, 16.826904296875, 17.490234375, 18.153564453125, 18.81689453125, 19.480224609375, 20.1435546875, 20.806884765625, 21.47021484375, 22.133544921875, 22.796875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 8.0, 2.0, 3.0, 9.0, 25.0, 52.0, 96.0, 200.0, 250.0, 196.0, 84.0, 42.0, 19.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-212.85833740234375, -207.51768493652344, -202.1770477294922, -196.83639526367188, -191.49575805664062, -186.1551055908203, -180.81446838378906, -175.47381591796875, -170.1331787109375, -164.7925262451172, -159.45188903808594, -154.11123657226562, -148.77059936523438, -143.42994689941406, -138.0893096923828, -132.7486572265625, -127.40801239013672, -122.06736755371094, -116.72672271728516, -111.38607788085938, -106.0454330444336, -100.70478820800781, -95.3641357421875, -90.02349853515625, -84.68284606933594, -79.34220123291016, -74.00155639648438, -68.6609115600586, -63.32026672363281, -57.97962188720703, -52.638973236083984, -47.2983283996582, -41.95768737792969, -36.617042541503906, -31.276397705078125, -25.93575096130371, -20.59510612487793, -15.254461288452148, -9.913814544677734, -4.573169708251953, 0.7674751281738281, 6.108120441436768, 11.448765754699707, 16.789411544799805, 22.130056381225586, 27.470701217651367, 32.81134796142578, 38.15199279785156, 43.492637634277344, 48.833282470703125, 54.173927307128906, 59.51457214355469, 64.85521697998047, 70.19586181640625, 75.53651428222656, 80.87715148925781, 86.21780395507812, 91.5584487915039, 96.89909362792969, 102.23973846435547, 107.58038330078125, 112.92102813720703, 118.26167297363281, 123.60232543945312, 128.94296264648438]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 4.0, 15.0, 11.0, 22.0, 24.0, 25.0, 26.0, 29.0, 45.0, 40.0, 31.0, 58.0, 50.0, 60.0, 65.0, 49.0, 55.0, 46.0, 56.0, 40.0, 38.0, 24.0, 38.0, 28.0, 21.0, 15.0, 19.0, 7.0, 7.0, 9.0, 11.0, 2.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.05650329589844, -67.6324462890625, -65.2083969116211, -62.78434371948242, -60.36029052734375, -57.93623733520508, -55.512184143066406, -53.08812713623047, -50.66407775878906, -48.24002456665039, -45.81597137451172, -43.39191818237305, -40.967864990234375, -38.5438117980957, -36.11975860595703, -33.695701599121094, -31.271648406982422, -28.84759521484375, -26.423542022705078, -23.999488830566406, -21.575435638427734, -19.151382446289062, -16.727327346801758, -14.303274154663086, -11.879220962524414, -9.455167770385742, -7.031114101409912, -4.607060432434082, -2.18300724029541, 0.24104595184326172, 2.66510009765625, 5.089153289794922, 7.513206481933594, 9.937259674072266, 12.361312866210938, 14.785367012023926, 17.20941925048828, 19.633472442626953, 22.057527542114258, 24.48158073425293, 26.9056339263916, 29.329687118530273, 31.753740310668945, 34.17779541015625, 36.60184860229492, 39.025901794433594, 41.449954986572266, 43.87400817871094, 46.29806137084961, 48.72211456298828, 51.14616775512695, 53.570220947265625, 55.9942741394043, 58.41832733154297, 60.842384338378906, 63.26643371582031, 65.69049072265625, 68.11454772949219, 70.5385971069336, 72.96265411376953, 75.38670349121094, 77.81076049804688, 80.23480987548828, 82.65886688232422, 85.08291625976562]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 12.0, 24.0, 65.0, 94.0, 172.0, 406.0, 885.0, 2438.0, 8076.0, 32936.0, 165954.0, 581530.0, 202727.0, 39102.0, 9606.0, 2713.0, 995.0, 379.0, 185.0, 94.0, 50.0, 24.0, 26.0, 13.0, 11.0, 5.0, 4.0, 2.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.03125, -19.434326171875, -18.83740234375, -18.240478515625, -17.6435546875, -17.046630859375, -16.44970703125, -15.852783203125, -15.255859375, -14.658935546875, -14.06201171875, -13.465087890625, -12.8681640625, -12.271240234375, -11.67431640625, -11.077392578125, -10.48046875, -9.883544921875, -9.28662109375, -8.689697265625, -8.0927734375, -7.495849609375, -6.89892578125, -6.302001953125, -5.705078125, -5.108154296875, -4.51123046875, -3.914306640625, -3.3173828125, -2.720458984375, -2.12353515625, -1.526611328125, -0.9296875, -0.332763671875, 0.26416015625, 0.861083984375, 1.4580078125, 2.054931640625, 2.65185546875, 3.248779296875, 3.845703125, 4.442626953125, 5.03955078125, 5.636474609375, 6.2333984375, 6.830322265625, 7.42724609375, 8.024169921875, 8.62109375, 9.218017578125, 9.81494140625, 10.411865234375, 11.0087890625, 11.605712890625, 12.20263671875, 12.799560546875, 13.396484375, 13.993408203125, 14.59033203125, 15.187255859375, 15.7841796875, 16.381103515625, 16.97802734375, 17.574951171875, 18.171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 8.0, 18.0, 24.0, 25.0, 32.0, 27.0, 38.0, 56.0, 62.0, 57.0, 62.0, 61.0, 63.0, 56.0, 71.0, 57.0, 51.0, 41.0, 39.0, 28.0, 25.0, 22.0, 17.0, 11.0, 4.0, 11.0, 9.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1171875, -10.8388671875, -10.560546875, -10.2822265625, -10.00390625, -9.7255859375, -9.447265625, -9.1689453125, -8.890625, -8.6123046875, -8.333984375, -8.0556640625, -7.77734375, -7.4990234375, -7.220703125, -6.9423828125, -6.6640625, -6.3857421875, -6.107421875, -5.8291015625, -5.55078125, -5.2724609375, -4.994140625, -4.7158203125, -4.4375, -4.1591796875, -3.880859375, -3.6025390625, -3.32421875, -3.0458984375, -2.767578125, -2.4892578125, -2.2109375, -1.9326171875, -1.654296875, -1.3759765625, -1.09765625, -0.8193359375, -0.541015625, -0.2626953125, 0.015625, 0.2939453125, 0.572265625, 0.8505859375, 1.12890625, 1.4072265625, 1.685546875, 1.9638671875, 2.2421875, 2.5205078125, 2.798828125, 3.0771484375, 3.35546875, 3.6337890625, 3.912109375, 4.1904296875, 4.46875, 4.7470703125, 5.025390625, 5.3037109375, 5.58203125, 5.8603515625, 6.138671875, 6.4169921875, 6.6953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 3.0, 6.0, 5.0, 17.0, 21.0, 34.0, 49.0, 68.0, 98.0, 188.0, 293.0, 631.0, 1510.0, 6423.0, 50855.0, 737955.0, 227184.0, 17954.0, 3104.0, 1005.0, 455.0, 255.0, 134.0, 86.0, 65.0, 45.0, 20.0, 19.0, 18.0, 9.0, 4.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-33.46875, -32.477783203125, -31.48681640625, -30.495849609375, -29.5048828125, -28.513916015625, -27.52294921875, -26.531982421875, -25.541015625, -24.550048828125, -23.55908203125, -22.568115234375, -21.5771484375, -20.586181640625, -19.59521484375, -18.604248046875, -17.61328125, -16.622314453125, -15.63134765625, -14.640380859375, -13.6494140625, -12.658447265625, -11.66748046875, -10.676513671875, -9.685546875, -8.694580078125, -7.70361328125, -6.712646484375, -5.7216796875, -4.730712890625, -3.73974609375, -2.748779296875, -1.7578125, -0.766845703125, 0.22412109375, 1.215087890625, 2.2060546875, 3.197021484375, 4.18798828125, 5.178955078125, 6.169921875, 7.160888671875, 8.15185546875, 9.142822265625, 10.1337890625, 11.124755859375, 12.11572265625, 13.106689453125, 14.09765625, 15.088623046875, 16.07958984375, 17.070556640625, 18.0615234375, 19.052490234375, 20.04345703125, 21.034423828125, 22.025390625, 23.016357421875, 24.00732421875, 24.998291015625, 25.9892578125, 26.980224609375, 27.97119140625, 28.962158203125, 29.953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 5.0, 8.0, 6.0, 13.0, 15.0, 14.0, 27.0, 17.0, 29.0, 32.0, 30.0, 39.0, 43.0, 51.0, 46.0, 43.0, 36.0, 49.0, 63.0, 60.0, 60.0, 45.0, 29.0, 43.0, 30.0, 33.0, 30.0, 15.0, 24.0, 12.0, 11.0, 9.0, 4.0, 5.0, 10.0, 3.0, 2.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.328125, -24.46923828125, -23.6103515625, -22.75146484375, -21.892578125, -21.03369140625, -20.1748046875, -19.31591796875, -18.45703125, -17.59814453125, -16.7392578125, -15.88037109375, -15.021484375, -14.16259765625, -13.3037109375, -12.44482421875, -11.5859375, -10.72705078125, -9.8681640625, -9.00927734375, -8.150390625, -7.29150390625, -6.4326171875, -5.57373046875, -4.71484375, -3.85595703125, -2.9970703125, -2.13818359375, -1.279296875, -0.42041015625, 0.4384765625, 1.29736328125, 2.15625, 3.01513671875, 3.8740234375, 4.73291015625, 5.591796875, 6.45068359375, 7.3095703125, 8.16845703125, 9.02734375, 9.88623046875, 10.7451171875, 11.60400390625, 12.462890625, 13.32177734375, 14.1806640625, 15.03955078125, 15.8984375, 16.75732421875, 17.6162109375, 18.47509765625, 19.333984375, 20.19287109375, 21.0517578125, 21.91064453125, 22.76953125, 23.62841796875, 24.4873046875, 25.34619140625, 26.205078125, 27.06396484375, 27.9228515625, 28.78173828125, 29.640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 18.0, 29.0, 50.0, 83.0, 227.0, 792.0, 5403.0, 927803.0, 110574.0, 2650.0, 540.0, 164.0, 80.0, 27.0, 28.0, 18.0, 12.0, 8.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-45.40625, -44.2666015625, -43.126953125, -41.9873046875, -40.84765625, -39.7080078125, -38.568359375, -37.4287109375, -36.2890625, -35.1494140625, -34.009765625, -32.8701171875, -31.73046875, -30.5908203125, -29.451171875, -28.3115234375, -27.171875, -26.0322265625, -24.892578125, -23.7529296875, -22.61328125, -21.4736328125, -20.333984375, -19.1943359375, -18.0546875, -16.9150390625, -15.775390625, -14.6357421875, -13.49609375, -12.3564453125, -11.216796875, -10.0771484375, -8.9375, -7.7978515625, -6.658203125, -5.5185546875, -4.37890625, -3.2392578125, -2.099609375, -0.9599609375, 0.1796875, 1.3193359375, 2.458984375, 3.5986328125, 4.73828125, 5.8779296875, 7.017578125, 8.1572265625, 9.296875, 10.4365234375, 11.576171875, 12.7158203125, 13.85546875, 14.9951171875, 16.134765625, 17.2744140625, 18.4140625, 19.5537109375, 20.693359375, 21.8330078125, 22.97265625, 24.1123046875, 25.251953125, 26.3916015625, 27.53125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 6.0, 11.0, 11.0, 12.0, 32.0, 33.0, 37.0, 89.0, 129.0, 206.0, 153.0, 78.0, 60.0, 40.0, 26.0, 19.0, 16.0, 2.0, 12.0, 5.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019989013671875, -0.0019355416297912598, -0.0018721818923950195, -0.0018088221549987793, -0.001745462417602539, -0.0016821026802062988, -0.0016187429428100586, -0.0015553832054138184, -0.0014920234680175781, -0.0014286637306213379, -0.0013653039932250977, -0.0013019442558288574, -0.0012385845184326172, -0.001175224781036377, -0.0011118650436401367, -0.0010485053062438965, -0.0009851455688476562, -0.000921785831451416, -0.0008584260940551758, -0.0007950663566589355, -0.0007317066192626953, -0.0006683468818664551, -0.0006049871444702148, -0.0005416274070739746, -0.0004782676696777344, -0.00041490793228149414, -0.0003515481948852539, -0.00028818845748901367, -0.00022482872009277344, -0.0001614689826965332, -9.810924530029297e-05, -3.4749507904052734e-05, 2.86102294921875e-05, 9.196996688842773e-05, 0.00015532970428466797, 0.0002186894416809082, 0.00028204917907714844, 0.00034540891647338867, 0.0004087686538696289, 0.00047212839126586914, 0.0005354881286621094, 0.0005988478660583496, 0.0006622076034545898, 0.0007255673408508301, 0.0007889270782470703, 0.0008522868156433105, 0.0009156465530395508, 0.000979006290435791, 0.0010423660278320312, 0.0011057257652282715, 0.0011690855026245117, 0.001232445240020752, 0.0012958049774169922, 0.0013591647148132324, 0.0014225244522094727, 0.0014858841896057129, 0.0015492439270019531, 0.0016126036643981934, 0.0016759634017944336, 0.0017393231391906738, 0.001802682876586914, 0.0018660426139831543, 0.0019294023513793945, 0.0019927620887756348, 0.002056121826171875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 7.0, 7.0, 14.0, 29.0, 30.0, 26.0, 46.0, 80.0, 125.0, 226.0, 521.0, 1337.0, 4020.0, 17242.0, 167503.0, 785682.0, 57751.0, 9412.0, 2640.0, 958.0, 350.0, 192.0, 119.0, 72.0, 42.0, 27.0, 17.0, 17.0, 14.0, 10.0, 8.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-16.28125, -15.8870849609375, -15.492919921875, -15.0987548828125, -14.70458984375, -14.3104248046875, -13.916259765625, -13.5220947265625, -13.1279296875, -12.7337646484375, -12.339599609375, -11.9454345703125, -11.55126953125, -11.1571044921875, -10.762939453125, -10.3687744140625, -9.974609375, -9.5804443359375, -9.186279296875, -8.7921142578125, -8.39794921875, -8.0037841796875, -7.609619140625, -7.2154541015625, -6.8212890625, -6.4271240234375, -6.032958984375, -5.6387939453125, -5.24462890625, -4.8504638671875, -4.456298828125, -4.0621337890625, -3.66796875, -3.2738037109375, -2.879638671875, -2.4854736328125, -2.09130859375, -1.6971435546875, -1.302978515625, -0.9088134765625, -0.5146484375, -0.1204833984375, 0.273681640625, 0.6678466796875, 1.06201171875, 1.4561767578125, 1.850341796875, 2.2445068359375, 2.638671875, 3.0328369140625, 3.427001953125, 3.8211669921875, 4.21533203125, 4.6094970703125, 5.003662109375, 5.3978271484375, 5.7919921875, 6.1861572265625, 6.580322265625, 6.9744873046875, 7.36865234375, 7.7628173828125, 8.156982421875, 8.5511474609375, 8.9453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 7.0, 2.0, 6.0, 20.0, 11.0, 25.0, 31.0, 69.0, 73.0, 125.0, 148.0, 144.0, 97.0, 79.0, 47.0, 35.0, 15.0, 19.0, 10.0, 8.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.5703125, -12.2216796875, -11.873046875, -11.5244140625, -11.17578125, -10.8271484375, -10.478515625, -10.1298828125, -9.78125, -9.4326171875, -9.083984375, -8.7353515625, -8.38671875, -8.0380859375, -7.689453125, -7.3408203125, -6.9921875, -6.6435546875, -6.294921875, -5.9462890625, -5.59765625, -5.2490234375, -4.900390625, -4.5517578125, -4.203125, -3.8544921875, -3.505859375, -3.1572265625, -2.80859375, -2.4599609375, -2.111328125, -1.7626953125, -1.4140625, -1.0654296875, -0.716796875, -0.3681640625, -0.01953125, 0.3291015625, 0.677734375, 1.0263671875, 1.375, 1.7236328125, 2.072265625, 2.4208984375, 2.76953125, 3.1181640625, 3.466796875, 3.8154296875, 4.1640625, 4.5126953125, 4.861328125, 5.2099609375, 5.55859375, 5.9072265625, 6.255859375, 6.6044921875, 6.953125, 7.3017578125, 7.650390625, 7.9990234375, 8.34765625, 8.6962890625, 9.044921875, 9.3935546875, 9.7421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 15.0, 63.0, 385.0, 419.0, 94.0, 16.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-684.6006469726562, -668.6945190429688, -652.7883911132812, -636.88232421875, -620.9761962890625, -605.070068359375, -589.1639404296875, -573.2578735351562, -557.3517456054688, -541.4456176757812, -525.5394897460938, -509.6333923339844, -493.727294921875, -477.8211669921875, -461.9150695800781, -446.0089416503906, -430.10284423828125, -414.19671630859375, -398.2906188964844, -382.3844909667969, -366.4783935546875, -350.572265625, -334.6661682128906, -318.7600402832031, -302.8539123535156, -286.9477844238281, -271.04168701171875, -255.1355743408203, -239.22946166992188, -223.32333374023438, -207.417236328125, -191.5111083984375, -175.60501098632812, -159.6988983154297, -143.79278564453125, -127.88667297363281, -111.98056030273438, -96.0744400024414, -80.16832733154297, -64.26221466064453, -48.356101989746094, -32.449989318847656, -16.543874740600586, -0.6377601623535156, 15.268352508544922, 31.174468994140625, 47.08058166503906, 62.9866943359375, 78.89280700683594, 94.79891967773438, 110.70503234863281, 126.61114501953125, 142.5172576904297, 158.42337036132812, 174.32949829101562, 190.235595703125, 206.1417236328125, 222.04783630371094, 237.95394897460938, 253.8600616455078, 269.76617431640625, 285.67230224609375, 301.5783996582031, 317.4845275878906, 333.390625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 3.0, 10.0, 11.0, 11.0, 11.0, 18.0, 17.0, 27.0, 18.0, 21.0, 23.0, 48.0, 33.0, 35.0, 43.0, 55.0, 52.0, 65.0, 70.0, 52.0, 47.0, 34.0, 35.0, 38.0, 21.0, 30.0, 27.0, 23.0, 22.0, 18.0, 11.0, 15.0, 14.0, 3.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.42628479003906, -88.99701690673828, -85.5677490234375, -82.13848876953125, -78.70922088623047, -75.27995300292969, -71.8506851196289, -68.42141723632812, -64.99215698242188, -61.562889099121094, -58.13362503051758, -54.7043571472168, -51.27509307861328, -47.8458251953125, -44.41655731201172, -40.98728942871094, -37.558021545410156, -34.128753662109375, -30.69948959350586, -27.270221710205078, -23.84095573425293, -20.41168975830078, -16.982421875, -13.553155899047852, -10.123889923095703, -6.6946234703063965, -3.26535701751709, 0.163909912109375, 3.5931758880615234, 7.022441864013672, 10.451709747314453, 13.880975723266602, 17.31024169921875, 20.7395076751709, 24.168773651123047, 27.598041534423828, 31.027307510375977, 34.456573486328125, 37.885841369628906, 41.31510925292969, 44.7443733215332, 48.173641204833984, 51.6029052734375, 55.03217315673828, 58.46144104003906, 61.89070510864258, 65.31997680664062, 68.74923706054688, 72.17850494384766, 75.60777282714844, 79.03704071044922, 82.46630859375, 85.89556884765625, 89.32483673095703, 92.75410461425781, 96.1833724975586, 99.61264038085938, 103.04190826416016, 106.47117614746094, 109.90043640136719, 113.32970428466797, 116.75897216796875, 120.18824005126953, 123.61750793457031, 127.04676818847656]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 11.0, 14.0, 26.0, 29.0, 57.0, 93.0, 132.0, 268.0, 530.0, 1037.0, 2577.0, 7247.0, 26377.0, 151674.0, 2370465.0, 1496385.0, 106417.0, 20737.0, 6028.0, 2159.0, 960.0, 448.0, 239.0, 131.0, 83.0, 47.0, 33.0, 26.0, 14.0, 11.0, 8.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.0625, -13.6708984375, -13.279296875, -12.8876953125, -12.49609375, -12.1044921875, -11.712890625, -11.3212890625, -10.9296875, -10.5380859375, -10.146484375, -9.7548828125, -9.36328125, -8.9716796875, -8.580078125, -8.1884765625, -7.796875, -7.4052734375, -7.013671875, -6.6220703125, -6.23046875, -5.8388671875, -5.447265625, -5.0556640625, -4.6640625, -4.2724609375, -3.880859375, -3.4892578125, -3.09765625, -2.7060546875, -2.314453125, -1.9228515625, -1.53125, -1.1396484375, -0.748046875, -0.3564453125, 0.03515625, 0.4267578125, 0.818359375, 1.2099609375, 1.6015625, 1.9931640625, 2.384765625, 2.7763671875, 3.16796875, 3.5595703125, 3.951171875, 4.3427734375, 4.734375, 5.1259765625, 5.517578125, 5.9091796875, 6.30078125, 6.6923828125, 7.083984375, 7.4755859375, 7.8671875, 8.2587890625, 8.650390625, 9.0419921875, 9.43359375, 9.8251953125, 10.216796875, 10.6083984375, 11.0]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 5.0, 20.0, 20.0, 23.0, 36.0, 31.0, 40.0, 60.0, 70.0, 65.0, 74.0, 68.0, 72.0, 67.0, 85.0, 50.0, 46.0, 37.0, 13.0, 33.0, 22.0, 15.0, 11.0, 13.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.015625, -10.737060546875, -10.45849609375, -10.179931640625, -9.9013671875, -9.622802734375, -9.34423828125, -9.065673828125, -8.787109375, -8.508544921875, -8.22998046875, -7.951416015625, -7.6728515625, -7.394287109375, -7.11572265625, -6.837158203125, -6.55859375, -6.280029296875, -6.00146484375, -5.722900390625, -5.4443359375, -5.165771484375, -4.88720703125, -4.608642578125, -4.330078125, -4.051513671875, -3.77294921875, -3.494384765625, -3.2158203125, -2.937255859375, -2.65869140625, -2.380126953125, -2.1015625, -1.822998046875, -1.54443359375, -1.265869140625, -0.9873046875, -0.708740234375, -0.43017578125, -0.151611328125, 0.126953125, 0.405517578125, 0.68408203125, 0.962646484375, 1.2412109375, 1.519775390625, 1.79833984375, 2.076904296875, 2.35546875, 2.634033203125, 2.91259765625, 3.191162109375, 3.4697265625, 3.748291015625, 4.02685546875, 4.305419921875, 4.583984375, 4.862548828125, 5.14111328125, 5.419677734375, 5.6982421875, 5.976806640625, 6.25537109375, 6.533935546875, 6.8125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 10.0, 10.0, 18.0, 29.0, 47.0, 60.0, 126.0, 203.0, 383.0, 849.0, 2153.0, 7195.0, 33720.0, 340310.0, 3542102.0, 230004.0, 27945.0, 6012.0, 1792.0, 634.0, 275.0, 147.0, 91.0, 57.0, 33.0, 17.0, 17.0, 11.0, 12.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.875, -20.331787109375, -19.78857421875, -19.245361328125, -18.7021484375, -18.158935546875, -17.61572265625, -17.072509765625, -16.529296875, -15.986083984375, -15.44287109375, -14.899658203125, -14.3564453125, -13.813232421875, -13.27001953125, -12.726806640625, -12.18359375, -11.640380859375, -11.09716796875, -10.553955078125, -10.0107421875, -9.467529296875, -8.92431640625, -8.381103515625, -7.837890625, -7.294677734375, -6.75146484375, -6.208251953125, -5.6650390625, -5.121826171875, -4.57861328125, -4.035400390625, -3.4921875, -2.948974609375, -2.40576171875, -1.862548828125, -1.3193359375, -0.776123046875, -0.23291015625, 0.310302734375, 0.853515625, 1.396728515625, 1.93994140625, 2.483154296875, 3.0263671875, 3.569580078125, 4.11279296875, 4.656005859375, 5.19921875, 5.742431640625, 6.28564453125, 6.828857421875, 7.3720703125, 7.915283203125, 8.45849609375, 9.001708984375, 9.544921875, 10.088134765625, 10.63134765625, 11.174560546875, 11.7177734375, 12.260986328125, 12.80419921875, 13.347412109375, 13.890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 9.0, 11.0, 8.0, 26.0, 35.0, 51.0, 75.0, 130.0, 293.0, 612.0, 980.0, 867.0, 398.0, 216.0, 100.0, 74.0, 58.0, 36.0, 17.0, 27.0, 7.0, 9.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.640625, -23.061279296875, -22.48193359375, -21.902587890625, -21.3232421875, -20.743896484375, -20.16455078125, -19.585205078125, -19.005859375, -18.426513671875, -17.84716796875, -17.267822265625, -16.6884765625, -16.109130859375, -15.52978515625, -14.950439453125, -14.37109375, -13.791748046875, -13.21240234375, -12.633056640625, -12.0537109375, -11.474365234375, -10.89501953125, -10.315673828125, -9.736328125, -9.156982421875, -8.57763671875, -7.998291015625, -7.4189453125, -6.839599609375, -6.26025390625, -5.680908203125, -5.1015625, -4.522216796875, -3.94287109375, -3.363525390625, -2.7841796875, -2.204833984375, -1.62548828125, -1.046142578125, -0.466796875, 0.112548828125, 0.69189453125, 1.271240234375, 1.8505859375, 2.429931640625, 3.00927734375, 3.588623046875, 4.16796875, 4.747314453125, 5.32666015625, 5.906005859375, 6.4853515625, 7.064697265625, 7.64404296875, 8.223388671875, 8.802734375, 9.382080078125, 9.96142578125, 10.540771484375, 11.1201171875, 11.699462890625, 12.27880859375, 12.858154296875, 13.4375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 11.0, 20.0, 33.0, 91.0, 161.0, 190.0, 219.0, 135.0, 64.0, 25.0, 16.0, 7.0, 8.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.79360961914062, -111.59861755371094, -106.40362548828125, -101.20863342285156, -96.01364135742188, -90.81864929199219, -85.6236572265625, -80.42866516113281, -75.23367309570312, -70.03868103027344, -64.84368896484375, -59.64869689941406, -54.453704833984375, -49.25871276855469, -44.063720703125, -38.86872863769531, -33.673736572265625, -28.478744506835938, -23.28375244140625, -18.088760375976562, -12.893768310546875, -7.6987762451171875, -2.5037841796875, 2.6912078857421875, 7.886199951171875, 13.081192016601562, 18.27618408203125, 23.471176147460938, 28.666168212890625, 33.86116027832031, 39.05615234375, 44.25114440917969, 49.44612121582031, 54.64111328125, 59.83610534667969, 65.03109741210938, 70.22608947753906, 75.42108154296875, 80.61607360839844, 85.81106567382812, 91.00605773925781, 96.2010498046875, 101.39604187011719, 106.59103393554688, 111.78602600097656, 116.98101806640625, 122.17601013183594, 127.37100219726562, 132.5659942626953, 137.760986328125, 142.9559783935547, 148.15097045898438, 153.34596252441406, 158.54095458984375, 163.73594665527344, 168.93093872070312, 174.1259307861328, 179.3209228515625, 184.5159149169922, 189.71090698242188, 194.90589904785156, 200.10089111328125, 205.29588317871094, 210.49087524414062, 215.6858673095703]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 9.0, 9.0, 5.0, 19.0, 20.0, 24.0, 26.0, 27.0, 35.0, 59.0, 51.0, 44.0, 63.0, 67.0, 52.0, 59.0, 53.0, 47.0, 58.0, 44.0, 31.0, 32.0, 35.0, 22.0, 21.0, 19.0, 16.0, 12.0, 14.0, 6.0, 5.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.03072357177734, -87.42643737792969, -84.82215881347656, -82.21788024902344, -79.61359405517578, -77.00930786132812, -74.405029296875, -71.80075073242188, -69.19646453857422, -66.59217834472656, -63.98789978027344, -61.38361740112305, -58.779335021972656, -56.175052642822266, -53.570770263671875, -50.966487884521484, -48.362205505371094, -45.7579231262207, -43.15364074707031, -40.54935836791992, -37.94507598876953, -35.34079360961914, -32.73651123046875, -30.13222885131836, -27.52794647216797, -24.923664093017578, -22.319381713867188, -19.715099334716797, -17.110816955566406, -14.506534576416016, -11.902252197265625, -9.297969818115234, -6.6936798095703125, -4.089397430419922, -1.4851150512695312, 1.1191673278808594, 3.72344970703125, 6.327732086181641, 8.932014465332031, 11.536296844482422, 14.140579223632812, 16.744861602783203, 19.349143981933594, 21.953426361083984, 24.557708740234375, 27.161991119384766, 29.766273498535156, 32.37055587768555, 34.97483825683594, 37.57912063598633, 40.18340301513672, 42.78768539428711, 45.3919677734375, 47.99625015258789, 50.60053253173828, 53.20481491088867, 55.80909729003906, 58.41337966918945, 61.017662048339844, 63.621944427490234, 66.22622680664062, 68.83050537109375, 71.4347915649414, 74.03907775878906, 76.64335632324219]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 7.0, 16.0, 21.0, 25.0, 38.0, 77.0, 107.0, 168.0, 287.0, 594.0, 1186.0, 2958.0, 8559.0, 29351.0, 113490.0, 403797.0, 355797.0, 95097.0, 24556.0, 7446.0, 2621.0, 1154.0, 494.0, 257.0, 157.0, 102.0, 65.0, 37.0, 25.0, 19.0, 11.0, 4.0, 9.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1015625, -14.6134033203125, -14.125244140625, -13.6370849609375, -13.14892578125, -12.6607666015625, -12.172607421875, -11.6844482421875, -11.1962890625, -10.7081298828125, -10.219970703125, -9.7318115234375, -9.24365234375, -8.7554931640625, -8.267333984375, -7.7791748046875, -7.291015625, -6.8028564453125, -6.314697265625, -5.8265380859375, -5.33837890625, -4.8502197265625, -4.362060546875, -3.8739013671875, -3.3857421875, -2.8975830078125, -2.409423828125, -1.9212646484375, -1.43310546875, -0.9449462890625, -0.456787109375, 0.0313720703125, 0.51953125, 1.0076904296875, 1.495849609375, 1.9840087890625, 2.47216796875, 2.9603271484375, 3.448486328125, 3.9366455078125, 4.4248046875, 4.9129638671875, 5.401123046875, 5.8892822265625, 6.37744140625, 6.8656005859375, 7.353759765625, 7.8419189453125, 8.330078125, 8.8182373046875, 9.306396484375, 9.7945556640625, 10.28271484375, 10.7708740234375, 11.259033203125, 11.7471923828125, 12.2353515625, 12.7235107421875, 13.211669921875, 13.6998291015625, 14.18798828125, 14.6761474609375, 15.164306640625, 15.6524658203125, 16.140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 11.0, 12.0, 16.0, 25.0, 31.0, 50.0, 54.0, 61.0, 58.0, 89.0, 63.0, 96.0, 76.0, 66.0, 56.0, 46.0, 56.0, 30.0, 30.0, 20.0, 10.0, 14.0, 13.0, 3.0, 5.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.515625, -11.2216796875, -10.927734375, -10.6337890625, -10.33984375, -10.0458984375, -9.751953125, -9.4580078125, -9.1640625, -8.8701171875, -8.576171875, -8.2822265625, -7.98828125, -7.6943359375, -7.400390625, -7.1064453125, -6.8125, -6.5185546875, -6.224609375, -5.9306640625, -5.63671875, -5.3427734375, -5.048828125, -4.7548828125, -4.4609375, -4.1669921875, -3.873046875, -3.5791015625, -3.28515625, -2.9912109375, -2.697265625, -2.4033203125, -2.109375, -1.8154296875, -1.521484375, -1.2275390625, -0.93359375, -0.6396484375, -0.345703125, -0.0517578125, 0.2421875, 0.5361328125, 0.830078125, 1.1240234375, 1.41796875, 1.7119140625, 2.005859375, 2.2998046875, 2.59375, 2.8876953125, 3.181640625, 3.4755859375, 3.76953125, 4.0634765625, 4.357421875, 4.6513671875, 4.9453125, 5.2392578125, 5.533203125, 5.8271484375, 6.12109375, 6.4150390625, 6.708984375, 7.0029296875, 7.296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 9.0, 5.0, 8.0, 14.0, 16.0, 23.0, 31.0, 43.0, 77.0, 131.0, 202.0, 336.0, 699.0, 1373.0, 3964.0, 28745.0, 786519.0, 210371.0, 11127.0, 2497.0, 1061.0, 555.0, 289.0, 177.0, 94.0, 52.0, 48.0, 18.0, 17.0, 13.0, 11.0, 5.0, 6.0, 4.0, 3.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.5, -40.23486328125, -38.9697265625, -37.70458984375, -36.439453125, -35.17431640625, -33.9091796875, -32.64404296875, -31.37890625, -30.11376953125, -28.8486328125, -27.58349609375, -26.318359375, -25.05322265625, -23.7880859375, -22.52294921875, -21.2578125, -19.99267578125, -18.7275390625, -17.46240234375, -16.197265625, -14.93212890625, -13.6669921875, -12.40185546875, -11.13671875, -9.87158203125, -8.6064453125, -7.34130859375, -6.076171875, -4.81103515625, -3.5458984375, -2.28076171875, -1.015625, 0.24951171875, 1.5146484375, 2.77978515625, 4.044921875, 5.31005859375, 6.5751953125, 7.84033203125, 9.10546875, 10.37060546875, 11.6357421875, 12.90087890625, 14.166015625, 15.43115234375, 16.6962890625, 17.96142578125, 19.2265625, 20.49169921875, 21.7568359375, 23.02197265625, 24.287109375, 25.55224609375, 26.8173828125, 28.08251953125, 29.34765625, 30.61279296875, 31.8779296875, 33.14306640625, 34.408203125, 35.67333984375, 36.9384765625, 38.20361328125, 39.46875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 2.0, 3.0, 10.0, 8.0, 6.0, 7.0, 16.0, 24.0, 26.0, 29.0, 45.0, 47.0, 37.0, 57.0, 45.0, 51.0, 54.0, 67.0, 44.0, 53.0, 54.0, 55.0, 41.0, 45.0, 37.0, 28.0, 20.0, 24.0, 15.0, 17.0, 11.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.328125, -30.39013671875, -29.4521484375, -28.51416015625, -27.576171875, -26.63818359375, -25.7001953125, -24.76220703125, -23.82421875, -22.88623046875, -21.9482421875, -21.01025390625, -20.072265625, -19.13427734375, -18.1962890625, -17.25830078125, -16.3203125, -15.38232421875, -14.4443359375, -13.50634765625, -12.568359375, -11.63037109375, -10.6923828125, -9.75439453125, -8.81640625, -7.87841796875, -6.9404296875, -6.00244140625, -5.064453125, -4.12646484375, -3.1884765625, -2.25048828125, -1.3125, -0.37451171875, 0.5634765625, 1.50146484375, 2.439453125, 3.37744140625, 4.3154296875, 5.25341796875, 6.19140625, 7.12939453125, 8.0673828125, 9.00537109375, 9.943359375, 10.88134765625, 11.8193359375, 12.75732421875, 13.6953125, 14.63330078125, 15.5712890625, 16.50927734375, 17.447265625, 18.38525390625, 19.3232421875, 20.26123046875, 21.19921875, 22.13720703125, 23.0751953125, 24.01318359375, 24.951171875, 25.88916015625, 26.8271484375, 27.76513671875, 28.703125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 0.0, 2.0, 4.0, 5.0, 8.0, 6.0, 19.0, 12.0, 27.0, 28.0, 41.0, 57.0, 92.0, 179.0, 398.0, 1227.0, 8314.0, 232663.0, 785353.0, 17166.0, 1863.0, 517.0, 220.0, 106.0, 68.0, 43.0, 32.0, 24.0, 16.0, 15.0, 5.0, 7.0, 8.0, 12.0, 7.0, 3.0, 0.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-18.359375, -17.8902587890625, -17.421142578125, -16.9520263671875, -16.48291015625, -16.0137939453125, -15.544677734375, -15.0755615234375, -14.6064453125, -14.1373291015625, -13.668212890625, -13.1990966796875, -12.72998046875, -12.2608642578125, -11.791748046875, -11.3226318359375, -10.853515625, -10.3843994140625, -9.915283203125, -9.4461669921875, -8.97705078125, -8.5079345703125, -8.038818359375, -7.5697021484375, -7.1005859375, -6.6314697265625, -6.162353515625, -5.6932373046875, -5.22412109375, -4.7550048828125, -4.285888671875, -3.8167724609375, -3.34765625, -2.8785400390625, -2.409423828125, -1.9403076171875, -1.47119140625, -1.0020751953125, -0.532958984375, -0.0638427734375, 0.4052734375, 0.8743896484375, 1.343505859375, 1.8126220703125, 2.28173828125, 2.7508544921875, 3.219970703125, 3.6890869140625, 4.158203125, 4.6273193359375, 5.096435546875, 5.5655517578125, 6.03466796875, 6.5037841796875, 6.972900390625, 7.4420166015625, 7.9111328125, 8.3802490234375, 8.849365234375, 9.3184814453125, 9.78759765625, 10.2567138671875, 10.725830078125, 11.1949462890625, 11.6640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 3.0, 10.0, 12.0, 13.0, 9.0, 19.0, 18.0, 30.0, 39.0, 45.0, 56.0, 112.0, 167.0, 114.0, 78.0, 60.0, 40.0, 37.0, 16.0, 22.0, 25.0, 14.0, 13.0, 3.0, 13.0, 4.0, 3.0, 5.0, 3.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001667022705078125, -0.001614406704902649, -0.0015617907047271729, -0.0015091747045516968, -0.0014565587043762207, -0.0014039427042007446, -0.0013513267040252686, -0.0012987107038497925, -0.0012460947036743164, -0.0011934787034988403, -0.0011408627033233643, -0.0010882467031478882, -0.0010356307029724121, -0.000983014702796936, -0.00093039870262146, -0.0008777827024459839, -0.0008251667022705078, -0.0007725507020950317, -0.0007199347019195557, -0.0006673187017440796, -0.0006147027015686035, -0.0005620867013931274, -0.0005094707012176514, -0.0004568547010421753, -0.0004042387008666992, -0.00035162270069122314, -0.00029900670051574707, -0.000246390700340271, -0.00019377470016479492, -0.00014115869998931885, -8.854269981384277e-05, -3.59266996383667e-05, 1.6689300537109375e-05, 6.930530071258545e-05, 0.00012192130088806152, 0.0001745373010635376, 0.00022715330123901367, 0.00027976930141448975, 0.0003323853015899658, 0.0003850013017654419, 0.00043761730194091797, 0.000490233302116394, 0.0005428493022918701, 0.0005954653024673462, 0.0006480813026428223, 0.0007006973028182983, 0.0007533133029937744, 0.0008059293031692505, 0.0008585453033447266, 0.0009111613035202026, 0.0009637773036956787, 0.0010163933038711548, 0.0010690093040466309, 0.001121625304222107, 0.001174241304397583, 0.001226857304573059, 0.0012794733047485352, 0.0013320893049240112, 0.0013847053050994873, 0.0014373213052749634, 0.0014899373054504395, 0.0015425533056259155, 0.0015951693058013916, 0.0016477853059768677, 0.0017004013061523438]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 5.0, 9.0, 11.0, 16.0, 19.0, 25.0, 30.0, 38.0, 79.0, 141.0, 234.0, 449.0, 1036.0, 2752.0, 9661.0, 58743.0, 859608.0, 97296.0, 12693.0, 3421.0, 1182.0, 469.0, 231.0, 150.0, 62.0, 46.0, 36.0, 20.0, 21.0, 18.0, 10.0, 15.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.8515625, -13.439208984375, -13.02685546875, -12.614501953125, -12.2021484375, -11.789794921875, -11.37744140625, -10.965087890625, -10.552734375, -10.140380859375, -9.72802734375, -9.315673828125, -8.9033203125, -8.490966796875, -8.07861328125, -7.666259765625, -7.25390625, -6.841552734375, -6.42919921875, -6.016845703125, -5.6044921875, -5.192138671875, -4.77978515625, -4.367431640625, -3.955078125, -3.542724609375, -3.13037109375, -2.718017578125, -2.3056640625, -1.893310546875, -1.48095703125, -1.068603515625, -0.65625, -0.243896484375, 0.16845703125, 0.580810546875, 0.9931640625, 1.405517578125, 1.81787109375, 2.230224609375, 2.642578125, 3.054931640625, 3.46728515625, 3.879638671875, 4.2919921875, 4.704345703125, 5.11669921875, 5.529052734375, 5.94140625, 6.353759765625, 6.76611328125, 7.178466796875, 7.5908203125, 8.003173828125, 8.41552734375, 8.827880859375, 9.240234375, 9.652587890625, 10.06494140625, 10.477294921875, 10.8896484375, 11.302001953125, 11.71435546875, 12.126708984375, 12.5390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 6.0, 5.0, 11.0, 16.0, 19.0, 41.0, 54.0, 108.0, 167.0, 218.0, 156.0, 82.0, 49.0, 25.0, 6.0, 10.0, 12.0, 4.0, 1.0, 4.0, 4.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.9375, -17.4146728515625, -16.891845703125, -16.3690185546875, -15.84619140625, -15.3233642578125, -14.800537109375, -14.2777099609375, -13.7548828125, -13.2320556640625, -12.709228515625, -12.1864013671875, -11.66357421875, -11.1407470703125, -10.617919921875, -10.0950927734375, -9.572265625, -9.0494384765625, -8.526611328125, -8.0037841796875, -7.48095703125, -6.9581298828125, -6.435302734375, -5.9124755859375, -5.3896484375, -4.8668212890625, -4.343994140625, -3.8211669921875, -3.29833984375, -2.7755126953125, -2.252685546875, -1.7298583984375, -1.20703125, -0.6842041015625, -0.161376953125, 0.3614501953125, 0.88427734375, 1.4071044921875, 1.929931640625, 2.4527587890625, 2.9755859375, 3.4984130859375, 4.021240234375, 4.5440673828125, 5.06689453125, 5.5897216796875, 6.112548828125, 6.6353759765625, 7.158203125, 7.6810302734375, 8.203857421875, 8.7266845703125, 9.24951171875, 9.7723388671875, 10.295166015625, 10.8179931640625, 11.3408203125, 11.8636474609375, 12.386474609375, 12.9093017578125, 13.43212890625, 13.9549560546875, 14.477783203125, 15.0006103515625, 15.5234375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 22.0, 69.0, 265.0, 378.0, 149.0, 61.0, 16.0, 11.0, 5.0, 10.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-307.82684326171875, -298.22369384765625, -288.62054443359375, -279.01739501953125, -269.4142761230469, -259.8111267089844, -250.20797729492188, -240.60482788085938, -231.00167846679688, -221.39852905273438, -211.79539489746094, -202.19224548339844, -192.58909606933594, -182.9859619140625, -173.3828125, -163.7796630859375, -154.17652893066406, -144.57337951660156, -134.97024536132812, -125.36709594726562, -115.76394653320312, -106.16080474853516, -96.55766296386719, -86.95451354980469, -77.35137176513672, -67.74822998046875, -58.14508056640625, -48.54193878173828, -38.93879318237305, -29.335647583007812, -19.732505798339844, -10.129356384277344, -0.526214599609375, 9.076930046081543, 18.68007469177246, 28.283218383789062, 37.8863639831543, 47.48950958251953, 57.0926513671875, 66.69580078125, 76.29894256591797, 85.90208435058594, 95.50523376464844, 105.1083755493164, 114.71151733398438, 124.31466674804688, 133.91781616210938, 143.52096557617188, 153.1240997314453, 162.7272491455078, 172.33038330078125, 181.93353271484375, 191.53668212890625, 201.13983154296875, 210.7429656982422, 220.3461151123047, 229.94924926757812, 239.55239868164062, 249.15553283691406, 258.7586669921875, 268.36181640625, 277.9649658203125, 287.568115234375, 297.1712646484375, 306.7744140625]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 2.0, 5.0, 2.0, 9.0, 7.0, 8.0, 9.0, 12.0, 13.0, 12.0, 25.0, 13.0, 27.0, 23.0, 39.0, 32.0, 40.0, 35.0, 53.0, 60.0, 67.0, 75.0, 51.0, 52.0, 36.0, 42.0, 32.0, 36.0, 19.0, 24.0, 30.0, 17.0, 17.0, 12.0, 14.0, 14.0, 10.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-97.66230773925781, -94.61557006835938, -91.5688247680664, -88.52208709716797, -85.475341796875, -82.42860412597656, -79.38186645507812, -76.33512878417969, -73.28838348388672, -70.24164581298828, -67.19490051269531, -64.14816284179688, -61.10142135620117, -58.05467987060547, -55.00794219970703, -51.96120071411133, -48.914459228515625, -45.86771774291992, -42.82097625732422, -39.77423858642578, -36.72749710083008, -33.680755615234375, -30.634016036987305, -27.587276458740234, -24.54053497314453, -21.493793487548828, -18.447053909301758, -15.400313377380371, -12.353572845458984, -9.306832313537598, -6.260091781616211, -3.2133522033691406, -0.16660308837890625, 2.8801374435424805, 5.926877975463867, 8.973618507385254, 12.02035903930664, 15.067099571228027, 18.113840103149414, 21.160579681396484, 24.207321166992188, 27.25406265258789, 30.30080223083496, 33.34754180908203, 36.394283294677734, 39.44102478027344, 42.487762451171875, 45.53450393676758, 48.58124542236328, 51.627986907958984, 54.67472839355469, 57.721466064453125, 60.76820755004883, 63.81494903564453, 66.86168670654297, 69.90843200683594, 72.95516967773438, 76.00190734863281, 79.04865264892578, 82.09539031982422, 85.14213562011719, 88.18887329101562, 91.23561096191406, 94.2823486328125, 97.32909393310547]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 6.0, 8.0, 11.0, 11.0, 18.0, 23.0, 38.0, 60.0, 73.0, 125.0, 231.0, 429.0, 918.0, 2305.0, 6587.0, 26513.0, 175340.0, 2714911.0, 1158520.0, 83365.0, 16433.0, 4837.0, 1772.0, 796.0, 385.0, 218.0, 120.0, 88.0, 46.0, 28.0, 24.0, 12.0, 2.0, 5.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-14.765625, -14.3948974609375, -14.024169921875, -13.6534423828125, -13.28271484375, -12.9119873046875, -12.541259765625, -12.1705322265625, -11.7998046875, -11.4290771484375, -11.058349609375, -10.6876220703125, -10.31689453125, -9.9461669921875, -9.575439453125, -9.2047119140625, -8.833984375, -8.4632568359375, -8.092529296875, -7.7218017578125, -7.35107421875, -6.9803466796875, -6.609619140625, -6.2388916015625, -5.8681640625, -5.4974365234375, -5.126708984375, -4.7559814453125, -4.38525390625, -4.0145263671875, -3.643798828125, -3.2730712890625, -2.90234375, -2.5316162109375, -2.160888671875, -1.7901611328125, -1.41943359375, -1.0487060546875, -0.677978515625, -0.3072509765625, 0.0634765625, 0.4342041015625, 0.804931640625, 1.1756591796875, 1.54638671875, 1.9171142578125, 2.287841796875, 2.6585693359375, 3.029296875, 3.4000244140625, 3.770751953125, 4.1414794921875, 4.51220703125, 4.8829345703125, 5.253662109375, 5.6243896484375, 5.9951171875, 6.3658447265625, 6.736572265625, 7.1072998046875, 7.47802734375, 7.8487548828125, 8.219482421875, 8.5902099609375, 8.9609375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 6.0, 8.0, 12.0, 18.0, 32.0, 31.0, 48.0, 55.0, 53.0, 70.0, 78.0, 83.0, 84.0, 62.0, 82.0, 68.0, 49.0, 30.0, 41.0, 21.0, 16.0, 15.0, 11.0, 7.0, 5.0, 5.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.9769287109375, -10.688232421875, -10.3995361328125, -10.11083984375, -9.8221435546875, -9.533447265625, -9.2447509765625, -8.9560546875, -8.6673583984375, -8.378662109375, -8.0899658203125, -7.80126953125, -7.5125732421875, -7.223876953125, -6.9351806640625, -6.646484375, -6.3577880859375, -6.069091796875, -5.7803955078125, -5.49169921875, -5.2030029296875, -4.914306640625, -4.6256103515625, -4.3369140625, -4.0482177734375, -3.759521484375, -3.4708251953125, -3.18212890625, -2.8934326171875, -2.604736328125, -2.3160400390625, -2.02734375, -1.7386474609375, -1.449951171875, -1.1612548828125, -0.87255859375, -0.5838623046875, -0.295166015625, -0.0064697265625, 0.2822265625, 0.5709228515625, 0.859619140625, 1.1483154296875, 1.43701171875, 1.7257080078125, 2.014404296875, 2.3031005859375, 2.591796875, 2.8804931640625, 3.169189453125, 3.4578857421875, 3.74658203125, 4.0352783203125, 4.323974609375, 4.6126708984375, 4.9013671875, 5.1900634765625, 5.478759765625, 5.7674560546875, 6.05615234375, 6.3448486328125, 6.633544921875, 6.9222412109375, 7.2109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 3.0, 9.0, 12.0, 22.0, 35.0, 40.0, 62.0, 91.0, 136.0, 210.0, 317.0, 482.0, 940.0, 2239.0, 9611.0, 111826.0, 3865079.0, 190250.0, 9545.0, 1745.0, 730.0, 400.0, 212.0, 129.0, 60.0, 33.0, 22.0, 16.0, 12.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.484375, -30.66845703125, -29.8525390625, -29.03662109375, -28.220703125, -27.40478515625, -26.5888671875, -25.77294921875, -24.95703125, -24.14111328125, -23.3251953125, -22.50927734375, -21.693359375, -20.87744140625, -20.0615234375, -19.24560546875, -18.4296875, -17.61376953125, -16.7978515625, -15.98193359375, -15.166015625, -14.35009765625, -13.5341796875, -12.71826171875, -11.90234375, -11.08642578125, -10.2705078125, -9.45458984375, -8.638671875, -7.82275390625, -7.0068359375, -6.19091796875, -5.375, -4.55908203125, -3.7431640625, -2.92724609375, -2.111328125, -1.29541015625, -0.4794921875, 0.33642578125, 1.15234375, 1.96826171875, 2.7841796875, 3.60009765625, 4.416015625, 5.23193359375, 6.0478515625, 6.86376953125, 7.6796875, 8.49560546875, 9.3115234375, 10.12744140625, 10.943359375, 11.75927734375, 12.5751953125, 13.39111328125, 14.20703125, 15.02294921875, 15.8388671875, 16.65478515625, 17.470703125, 18.28662109375, 19.1025390625, 19.91845703125, 20.734375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 9.0, 7.0, 25.0, 32.0, 48.0, 110.0, 205.0, 713.0, 1815.0, 761.0, 198.0, 90.0, 37.0, 18.0, 8.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.3125, -39.265625, -38.21875, -37.171875, -36.125, -35.078125, -34.03125, -32.984375, -31.9375, -30.890625, -29.84375, -28.796875, -27.75, -26.703125, -25.65625, -24.609375, -23.5625, -22.515625, -21.46875, -20.421875, -19.375, -18.328125, -17.28125, -16.234375, -15.1875, -14.140625, -13.09375, -12.046875, -11.0, -9.953125, -8.90625, -7.859375, -6.8125, -5.765625, -4.71875, -3.671875, -2.625, -1.578125, -0.53125, 0.515625, 1.5625, 2.609375, 3.65625, 4.703125, 5.75, 6.796875, 7.84375, 8.890625, 9.9375, 10.984375, 12.03125, 13.078125, 14.125, 15.171875, 16.21875, 17.265625, 18.3125, 19.359375, 20.40625, 21.453125, 22.5, 23.546875, 24.59375, 25.640625, 26.6875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 13.0, 35.0, 135.0, 380.0, 312.0, 78.0, 18.0, 8.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-345.60614013671875, -335.3943176269531, -325.1825256347656, -314.970703125, -304.7588806152344, -294.54705810546875, -284.33526611328125, -274.1234436035156, -263.91162109375, -253.69981384277344, -243.4879913330078, -233.27618408203125, -223.06436157226562, -212.85255432128906, -202.6407470703125, -192.42892456054688, -182.2171173095703, -172.00531005859375, -161.79348754882812, -151.58168029785156, -141.36985778808594, -131.15805053710938, -120.94623565673828, -110.73442077636719, -100.5226058959961, -90.310791015625, -80.0989761352539, -69.88716125488281, -59.675350189208984, -49.46353530883789, -39.25172424316406, -29.03990936279297, -18.828094482421875, -8.616280555725098, 1.5955333709716797, 11.80734634399414, 22.019161224365234, 32.23097610473633, 42.442787170410156, 52.65460205078125, 62.866416931152344, 73.07823181152344, 83.29004669189453, 93.50186157226562, 103.71366882324219, 113.92549133300781, 124.13729858398438, 134.34912109375, 144.56092834472656, 154.77273559570312, 164.98455810546875, 175.1963653564453, 185.40818786621094, 195.6199951171875, 205.83181762695312, 216.0436248779297, 226.25543212890625, 236.4672393798828, 246.67906188964844, 256.890869140625, 267.1026916503906, 277.31451416015625, 287.52630615234375, 297.7381286621094, 307.949951171875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 11.0, 26.0, 28.0, 48.0, 73.0, 91.0, 102.0, 147.0, 121.0, 94.0, 99.0, 57.0, 47.0, 27.0, 12.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.5036849975586, -86.66848754882812, -80.83329010009766, -74.99809265136719, -69.16288757324219, -63.32769012451172, -57.49249267578125, -51.657291412353516, -45.82209396362305, -39.98689651489258, -34.151695251464844, -28.316497802734375, -22.481298446655273, -16.646099090576172, -10.810901641845703, -4.975700378417969, 0.8594970703125, 6.694695949554443, 12.529894828796387, 18.365093231201172, 24.200292587280273, 30.035491943359375, 35.870689392089844, 41.70589065551758, 47.54108810424805, 53.376285552978516, 59.21148681640625, 65.04668426513672, 70.88188171386719, 76.71708679199219, 82.55227661132812, 88.38748168945312, 94.22267150878906, 100.05786895751953, 105.89306640625, 111.728271484375, 117.56346893310547, 123.39866638183594, 129.23385620117188, 135.06906127929688, 140.90426635742188, 146.73947143554688, 152.5746612548828, 158.4098663330078, 164.24505615234375, 170.08026123046875, 175.91546630859375, 181.7506561279297, 187.58584594726562, 193.42105102539062, 199.25624084472656, 205.09144592285156, 210.9266357421875, 216.7618408203125, 222.5970458984375, 228.43223571777344, 234.26744079589844, 240.10264587402344, 245.93783569335938, 251.77304077148438, 257.6082458496094, 263.44342041015625, 269.27862548828125, 275.11383056640625, 280.94903564453125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 9.0, 6.0, 13.0, 13.0, 8.0, 28.0, 35.0, 50.0, 77.0, 133.0, 182.0, 324.0, 725.0, 1403.0, 3300.0, 8990.0, 28838.0, 104530.0, 390267.0, 370296.0, 97501.0, 27267.0, 8574.0, 3145.0, 1328.0, 602.0, 325.0, 198.0, 114.0, 76.0, 52.0, 34.0, 22.0, 17.0, 11.0, 11.0, 6.0, 9.0, 6.0, 3.0, 3.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-14.828125, -14.3643798828125, -13.900634765625, -13.4368896484375, -12.97314453125, -12.5093994140625, -12.045654296875, -11.5819091796875, -11.1181640625, -10.6544189453125, -10.190673828125, -9.7269287109375, -9.26318359375, -8.7994384765625, -8.335693359375, -7.8719482421875, -7.408203125, -6.9444580078125, -6.480712890625, -6.0169677734375, -5.55322265625, -5.0894775390625, -4.625732421875, -4.1619873046875, -3.6982421875, -3.2344970703125, -2.770751953125, -2.3070068359375, -1.84326171875, -1.3795166015625, -0.915771484375, -0.4520263671875, 0.01171875, 0.4754638671875, 0.939208984375, 1.4029541015625, 1.86669921875, 2.3304443359375, 2.794189453125, 3.2579345703125, 3.7216796875, 4.1854248046875, 4.649169921875, 5.1129150390625, 5.57666015625, 6.0404052734375, 6.504150390625, 6.9678955078125, 7.431640625, 7.8953857421875, 8.359130859375, 8.8228759765625, 9.28662109375, 9.7503662109375, 10.214111328125, 10.6778564453125, 11.1416015625, 11.6053466796875, 12.069091796875, 12.5328369140625, 12.99658203125, 13.4603271484375, 13.924072265625, 14.3878173828125, 14.8515625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 13.0, 16.0, 27.0, 24.0, 43.0, 63.0, 67.0, 59.0, 67.0, 60.0, 91.0, 86.0, 75.0, 70.0, 62.0, 49.0, 32.0, 21.0, 17.0, 20.0, 11.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.546875, -11.2467041015625, -10.946533203125, -10.6463623046875, -10.34619140625, -10.0460205078125, -9.745849609375, -9.4456787109375, -9.1455078125, -8.8453369140625, -8.545166015625, -8.2449951171875, -7.94482421875, -7.6446533203125, -7.344482421875, -7.0443115234375, -6.744140625, -6.4439697265625, -6.143798828125, -5.8436279296875, -5.54345703125, -5.2432861328125, -4.943115234375, -4.6429443359375, -4.3427734375, -4.0426025390625, -3.742431640625, -3.4422607421875, -3.14208984375, -2.8419189453125, -2.541748046875, -2.2415771484375, -1.94140625, -1.6412353515625, -1.341064453125, -1.0408935546875, -0.74072265625, -0.4405517578125, -0.140380859375, 0.1597900390625, 0.4599609375, 0.7601318359375, 1.060302734375, 1.3604736328125, 1.66064453125, 1.9608154296875, 2.260986328125, 2.5611572265625, 2.861328125, 3.1614990234375, 3.461669921875, 3.7618408203125, 4.06201171875, 4.3621826171875, 4.662353515625, 4.9625244140625, 5.2626953125, 5.5628662109375, 5.863037109375, 6.1632080078125, 6.46337890625, 6.7635498046875, 7.063720703125, 7.3638916015625, 7.6640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 8.0, 5.0, 9.0, 16.0, 14.0, 21.0, 26.0, 22.0, 43.0, 65.0, 93.0, 150.0, 233.0, 358.0, 628.0, 1193.0, 2769.0, 8976.0, 59380.0, 783727.0, 166358.0, 16576.0, 4174.0, 1634.0, 762.0, 473.0, 264.0, 193.0, 106.0, 63.0, 62.0, 30.0, 32.0, 27.0, 6.0, 15.0, 8.0, 5.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.734375, -30.763671875, -29.79296875, -28.822265625, -27.8515625, -26.880859375, -25.91015625, -24.939453125, -23.96875, -22.998046875, -22.02734375, -21.056640625, -20.0859375, -19.115234375, -18.14453125, -17.173828125, -16.203125, -15.232421875, -14.26171875, -13.291015625, -12.3203125, -11.349609375, -10.37890625, -9.408203125, -8.4375, -7.466796875, -6.49609375, -5.525390625, -4.5546875, -3.583984375, -2.61328125, -1.642578125, -0.671875, 0.298828125, 1.26953125, 2.240234375, 3.2109375, 4.181640625, 5.15234375, 6.123046875, 7.09375, 8.064453125, 9.03515625, 10.005859375, 10.9765625, 11.947265625, 12.91796875, 13.888671875, 14.859375, 15.830078125, 16.80078125, 17.771484375, 18.7421875, 19.712890625, 20.68359375, 21.654296875, 22.625, 23.595703125, 24.56640625, 25.537109375, 26.5078125, 27.478515625, 28.44921875, 29.419921875, 30.390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 8.0, 8.0, 8.0, 13.0, 17.0, 20.0, 19.0, 22.0, 24.0, 34.0, 39.0, 29.0, 47.0, 34.0, 54.0, 47.0, 65.0, 48.0, 46.0, 37.0, 51.0, 37.0, 39.0, 43.0, 32.0, 36.0, 25.0, 23.0, 9.0, 18.0, 21.0, 6.0, 5.0, 8.0, 3.0, 6.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.671875, -20.950439453125, -20.22900390625, -19.507568359375, -18.7861328125, -18.064697265625, -17.34326171875, -16.621826171875, -15.900390625, -15.178955078125, -14.45751953125, -13.736083984375, -13.0146484375, -12.293212890625, -11.57177734375, -10.850341796875, -10.12890625, -9.407470703125, -8.68603515625, -7.964599609375, -7.2431640625, -6.521728515625, -5.80029296875, -5.078857421875, -4.357421875, -3.635986328125, -2.91455078125, -2.193115234375, -1.4716796875, -0.750244140625, -0.02880859375, 0.692626953125, 1.4140625, 2.135498046875, 2.85693359375, 3.578369140625, 4.2998046875, 5.021240234375, 5.74267578125, 6.464111328125, 7.185546875, 7.906982421875, 8.62841796875, 9.349853515625, 10.0712890625, 10.792724609375, 11.51416015625, 12.235595703125, 12.95703125, 13.678466796875, 14.39990234375, 15.121337890625, 15.8427734375, 16.564208984375, 17.28564453125, 18.007080078125, 18.728515625, 19.449951171875, 20.17138671875, 20.892822265625, 21.6142578125, 22.335693359375, 23.05712890625, 23.778564453125, 24.5]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 10.0, 7.0, 11.0, 10.0, 19.0, 23.0, 38.0, 62.0, 136.0, 321.0, 1218.0, 12446.0, 954617.0, 75750.0, 2894.0, 572.0, 171.0, 98.0, 51.0, 26.0, 22.0, 11.0, 11.0, 6.0, 7.0, 3.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.6552734375, -18.919921875, -18.1845703125, -17.44921875, -16.7138671875, -15.978515625, -15.2431640625, -14.5078125, -13.7724609375, -13.037109375, -12.3017578125, -11.56640625, -10.8310546875, -10.095703125, -9.3603515625, -8.625, -7.8896484375, -7.154296875, -6.4189453125, -5.68359375, -4.9482421875, -4.212890625, -3.4775390625, -2.7421875, -2.0068359375, -1.271484375, -0.5361328125, 0.19921875, 0.9345703125, 1.669921875, 2.4052734375, 3.140625, 3.8759765625, 4.611328125, 5.3466796875, 6.08203125, 6.8173828125, 7.552734375, 8.2880859375, 9.0234375, 9.7587890625, 10.494140625, 11.2294921875, 11.96484375, 12.7001953125, 13.435546875, 14.1708984375, 14.90625, 15.6416015625, 16.376953125, 17.1123046875, 17.84765625, 18.5830078125, 19.318359375, 20.0537109375, 20.7890625, 21.5244140625, 22.259765625, 22.9951171875, 23.73046875, 24.4658203125, 25.201171875, 25.9365234375, 26.671875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 6.0, 5.0, 6.0, 9.0, 5.0, 11.0, 17.0, 14.0, 33.0, 44.0, 71.0, 129.0, 223.0, 168.0, 96.0, 47.0, 26.0, 20.0, 17.0, 19.0, 8.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002285003662109375, -0.0022079050540924072, -0.0021308064460754395, -0.0020537078380584717, -0.001976609230041504, -0.0018995106220245361, -0.0018224120140075684, -0.0017453134059906006, -0.0016682147979736328, -0.001591116189956665, -0.0015140175819396973, -0.0014369189739227295, -0.0013598203659057617, -0.001282721757888794, -0.0012056231498718262, -0.0011285245418548584, -0.0010514259338378906, -0.0009743273258209229, -0.0008972287178039551, -0.0008201301097869873, -0.0007430315017700195, -0.0006659328937530518, -0.000588834285736084, -0.0005117356777191162, -0.00043463706970214844, -0.00035753846168518066, -0.0002804398536682129, -0.00020334124565124512, -0.00012624263763427734, -4.914402961730957e-05, 2.7954578399658203e-05, 0.00010505318641662598, 0.00018215179443359375, 0.0002592504024505615, 0.0003363490104675293, 0.00041344761848449707, 0.0004905462265014648, 0.0005676448345184326, 0.0006447434425354004, 0.0007218420505523682, 0.0007989406585693359, 0.0008760392665863037, 0.0009531378746032715, 0.0010302364826202393, 0.001107335090637207, 0.0011844336986541748, 0.0012615323066711426, 0.0013386309146881104, 0.0014157295227050781, 0.001492828130722046, 0.0015699267387390137, 0.0016470253467559814, 0.0017241239547729492, 0.001801222562789917, 0.0018783211708068848, 0.0019554197788238525, 0.0020325183868408203, 0.002109616994857788, 0.002186715602874756, 0.0022638142108917236, 0.0023409128189086914, 0.002418011426925659, 0.002495110034942627, 0.0025722086429595947, 0.0026493072509765625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 5.0, 6.0, 9.0, 9.0, 11.0, 14.0, 21.0, 48.0, 70.0, 75.0, 135.0, 229.0, 404.0, 837.0, 2101.0, 6479.0, 29214.0, 299825.0, 652685.0, 42768.0, 8716.0, 2627.0, 1029.0, 510.0, 248.0, 162.0, 99.0, 67.0, 39.0, 24.0, 18.0, 17.0, 14.0, 12.0, 2.0, 8.0, 3.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.328125, -8.0419921875, -7.755859375, -7.4697265625, -7.18359375, -6.8974609375, -6.611328125, -6.3251953125, -6.0390625, -5.7529296875, -5.466796875, -5.1806640625, -4.89453125, -4.6083984375, -4.322265625, -4.0361328125, -3.75, -3.4638671875, -3.177734375, -2.8916015625, -2.60546875, -2.3193359375, -2.033203125, -1.7470703125, -1.4609375, -1.1748046875, -0.888671875, -0.6025390625, -0.31640625, -0.0302734375, 0.255859375, 0.5419921875, 0.828125, 1.1142578125, 1.400390625, 1.6865234375, 1.97265625, 2.2587890625, 2.544921875, 2.8310546875, 3.1171875, 3.4033203125, 3.689453125, 3.9755859375, 4.26171875, 4.5478515625, 4.833984375, 5.1201171875, 5.40625, 5.6923828125, 5.978515625, 6.2646484375, 6.55078125, 6.8369140625, 7.123046875, 7.4091796875, 7.6953125, 7.9814453125, 8.267578125, 8.5537109375, 8.83984375, 9.1259765625, 9.412109375, 9.6982421875, 9.984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 11.0, 8.0, 14.0, 16.0, 18.0, 44.0, 65.0, 112.0, 175.0, 180.0, 118.0, 85.0, 46.0, 36.0, 25.0, 12.0, 12.0, 3.0, 10.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7265625, -12.384033203125, -12.04150390625, -11.698974609375, -11.3564453125, -11.013916015625, -10.67138671875, -10.328857421875, -9.986328125, -9.643798828125, -9.30126953125, -8.958740234375, -8.6162109375, -8.273681640625, -7.93115234375, -7.588623046875, -7.24609375, -6.903564453125, -6.56103515625, -6.218505859375, -5.8759765625, -5.533447265625, -5.19091796875, -4.848388671875, -4.505859375, -4.163330078125, -3.82080078125, -3.478271484375, -3.1357421875, -2.793212890625, -2.45068359375, -2.108154296875, -1.765625, -1.423095703125, -1.08056640625, -0.738037109375, -0.3955078125, -0.052978515625, 0.28955078125, 0.632080078125, 0.974609375, 1.317138671875, 1.65966796875, 2.002197265625, 2.3447265625, 2.687255859375, 3.02978515625, 3.372314453125, 3.71484375, 4.057373046875, 4.39990234375, 4.742431640625, 5.0849609375, 5.427490234375, 5.77001953125, 6.112548828125, 6.455078125, 6.797607421875, 7.14013671875, 7.482666015625, 7.8251953125, 8.167724609375, 8.51025390625, 8.852783203125, 9.1953125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 14.0, 33.0, 128.0, 407.0, 259.0, 98.0, 29.0, 8.0, 6.0, 12.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.00241088867188, -179.41204833984375, -169.8217010498047, -160.23133850097656, -150.6409912109375, -141.05062866210938, -131.46026611328125, -121.86991119384766, -112.27955627441406, -102.68920135498047, -93.09884643554688, -83.50848388671875, -73.91812896728516, -64.32777404785156, -54.7374153137207, -45.147056579589844, -35.55670166015625, -25.966344833374023, -16.375988006591797, -6.78563117980957, 2.8047256469726562, 12.39508056640625, 21.98543930053711, 31.57579803466797, 41.16615295410156, 50.756507873535156, 60.346866607666016, 69.93722534179688, 79.52758026123047, 89.11793518066406, 98.70829772949219, 108.29865264892578, 117.8890380859375, 127.4793930053711, 137.0697479248047, 146.6601104736328, 156.25045776367188, 165.8408203125, 175.43118286132812, 185.02154541015625, 194.6118927001953, 204.20225524902344, 213.7926025390625, 223.38296508789062, 232.97332763671875, 242.5636749267578, 252.15403747558594, 261.744384765625, 271.3347473144531, 280.92510986328125, 290.5154724121094, 300.1058044433594, 309.6961669921875, 319.2865295410156, 328.87689208984375, 338.4672546386719, 348.0576171875, 357.6479797363281, 367.23834228515625, 376.82867431640625, 386.4190368652344, 396.0093994140625, 405.5997619628906, 415.19012451171875, 424.78045654296875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 8.0, 9.0, 6.0, 9.0, 16.0, 12.0, 24.0, 17.0, 23.0, 30.0, 31.0, 28.0, 28.0, 35.0, 42.0, 54.0, 66.0, 81.0, 64.0, 67.0, 52.0, 44.0, 32.0, 28.0, 25.0, 25.0, 23.0, 31.0, 13.0, 16.0, 12.0, 12.0, 9.0, 3.0, 6.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-103.44284057617188, -100.45379638671875, -97.46475219726562, -94.47571563720703, -91.4866714477539, -88.49762725830078, -85.50858306884766, -82.51954650878906, -79.53050231933594, -76.54145812988281, -73.55241394042969, -70.5633773803711, -67.57433319091797, -64.58528900146484, -61.59624481201172, -58.60720443725586, -55.618160247802734, -52.62911605834961, -49.64007568359375, -46.651031494140625, -43.661991119384766, -40.67294692993164, -37.68390655517578, -34.694862365722656, -31.705820083618164, -28.716777801513672, -25.72773551940918, -22.738693237304688, -19.749649047851562, -16.760608673095703, -13.771564483642578, -10.782522201538086, -7.793479919433594, -4.804437637329102, -1.8153948783874512, 1.1736478805541992, 4.162690162658691, 7.151732444763184, 10.140775680541992, 13.129817962646484, 16.118860244750977, 19.10790252685547, 22.09694480895996, 25.085987091064453, 28.075031280517578, 31.064071655273438, 34.05311584472656, 37.04216003417969, 40.03120040893555, 43.02024459838867, 46.00928497314453, 48.998329162597656, 51.987369537353516, 54.97641372680664, 57.9654541015625, 60.954498291015625, 63.94354248046875, 66.93258666992188, 69.921630859375, 72.9106674194336, 75.89971160888672, 78.88875579833984, 81.87779998779297, 84.86683654785156, 87.85588073730469]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 3.0, 7.0, 18.0, 25.0, 30.0, 64.0, 98.0, 204.0, 440.0, 1086.0, 3553.0, 16309.0, 239188.0, 3745005.0, 168166.0, 14963.0, 3243.0, 996.0, 392.0, 190.0, 113.0, 60.0, 43.0, 21.0, 14.0, 14.0, 10.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.71875, -16.187255859375, -15.65576171875, -15.124267578125, -14.5927734375, -14.061279296875, -13.52978515625, -12.998291015625, -12.466796875, -11.935302734375, -11.40380859375, -10.872314453125, -10.3408203125, -9.809326171875, -9.27783203125, -8.746337890625, -8.21484375, -7.683349609375, -7.15185546875, -6.620361328125, -6.0888671875, -5.557373046875, -5.02587890625, -4.494384765625, -3.962890625, -3.431396484375, -2.89990234375, -2.368408203125, -1.8369140625, -1.305419921875, -0.77392578125, -0.242431640625, 0.2890625, 0.820556640625, 1.35205078125, 1.883544921875, 2.4150390625, 2.946533203125, 3.47802734375, 4.009521484375, 4.541015625, 5.072509765625, 5.60400390625, 6.135498046875, 6.6669921875, 7.198486328125, 7.72998046875, 8.261474609375, 8.79296875, 9.324462890625, 9.85595703125, 10.387451171875, 10.9189453125, 11.450439453125, 11.98193359375, 12.513427734375, 13.044921875, 13.576416015625, 14.10791015625, 14.639404296875, 15.1708984375, 15.702392578125, 16.23388671875, 16.765380859375, 17.296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 7.0, 10.0, 30.0, 33.0, 36.0, 54.0, 67.0, 63.0, 63.0, 70.0, 87.0, 68.0, 75.0, 75.0, 56.0, 51.0, 43.0, 26.0, 23.0, 25.0, 12.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.15625, -10.86688232421875, -10.5775146484375, -10.28814697265625, -9.998779296875, -9.70941162109375, -9.4200439453125, -9.13067626953125, -8.84130859375, -8.55194091796875, -8.2625732421875, -7.97320556640625, -7.683837890625, -7.39447021484375, -7.1051025390625, -6.81573486328125, -6.5263671875, -6.23699951171875, -5.9476318359375, -5.65826416015625, -5.368896484375, -5.07952880859375, -4.7901611328125, -4.50079345703125, -4.21142578125, -3.92205810546875, -3.6326904296875, -3.34332275390625, -3.053955078125, -2.76458740234375, -2.4752197265625, -2.18585205078125, -1.896484375, -1.60711669921875, -1.3177490234375, -1.02838134765625, -0.739013671875, -0.44964599609375, -0.1602783203125, 0.12908935546875, 0.41845703125, 0.70782470703125, 0.9971923828125, 1.28656005859375, 1.575927734375, 1.86529541015625, 2.1546630859375, 2.44403076171875, 2.7333984375, 3.02276611328125, 3.3121337890625, 3.60150146484375, 3.890869140625, 4.18023681640625, 4.4696044921875, 4.75897216796875, 5.04833984375, 5.33770751953125, 5.6270751953125, 5.91644287109375, 6.205810546875, 6.49517822265625, 6.7845458984375, 7.07391357421875, 7.36328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 11.0, 9.0, 19.0, 31.0, 44.0, 58.0, 99.0, 174.0, 301.0, 599.0, 1182.0, 2213.0, 4798.0, 17942.0, 244846.0, 3815909.0, 89713.0, 9999.0, 3168.0, 1408.0, 744.0, 403.0, 217.0, 135.0, 84.0, 54.0, 32.0, 18.0, 12.0, 13.0, 9.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.125, -22.47119140625, -21.8173828125, -21.16357421875, -20.509765625, -19.85595703125, -19.2021484375, -18.54833984375, -17.89453125, -17.24072265625, -16.5869140625, -15.93310546875, -15.279296875, -14.62548828125, -13.9716796875, -13.31787109375, -12.6640625, -12.01025390625, -11.3564453125, -10.70263671875, -10.048828125, -9.39501953125, -8.7412109375, -8.08740234375, -7.43359375, -6.77978515625, -6.1259765625, -5.47216796875, -4.818359375, -4.16455078125, -3.5107421875, -2.85693359375, -2.203125, -1.54931640625, -0.8955078125, -0.24169921875, 0.412109375, 1.06591796875, 1.7197265625, 2.37353515625, 3.02734375, 3.68115234375, 4.3349609375, 4.98876953125, 5.642578125, 6.29638671875, 6.9501953125, 7.60400390625, 8.2578125, 8.91162109375, 9.5654296875, 10.21923828125, 10.873046875, 11.52685546875, 12.1806640625, 12.83447265625, 13.48828125, 14.14208984375, 14.7958984375, 15.44970703125, 16.103515625, 16.75732421875, 17.4111328125, 18.06494140625, 18.71875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 11.0, 6.0, 13.0, 17.0, 28.0, 53.0, 127.0, 286.0, 948.0, 1508.0, 695.0, 213.0, 85.0, 43.0, 16.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.03125, -20.28955078125, -19.5478515625, -18.80615234375, -18.064453125, -17.32275390625, -16.5810546875, -15.83935546875, -15.09765625, -14.35595703125, -13.6142578125, -12.87255859375, -12.130859375, -11.38916015625, -10.6474609375, -9.90576171875, -9.1640625, -8.42236328125, -7.6806640625, -6.93896484375, -6.197265625, -5.45556640625, -4.7138671875, -3.97216796875, -3.23046875, -2.48876953125, -1.7470703125, -1.00537109375, -0.263671875, 0.47802734375, 1.2197265625, 1.96142578125, 2.703125, 3.44482421875, 4.1865234375, 4.92822265625, 5.669921875, 6.41162109375, 7.1533203125, 7.89501953125, 8.63671875, 9.37841796875, 10.1201171875, 10.86181640625, 11.603515625, 12.34521484375, 13.0869140625, 13.82861328125, 14.5703125, 15.31201171875, 16.0537109375, 16.79541015625, 17.537109375, 18.27880859375, 19.0205078125, 19.76220703125, 20.50390625, 21.24560546875, 21.9873046875, 22.72900390625, 23.470703125, 24.21240234375, 24.9541015625, 25.69580078125, 26.4375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 9.0, 24.0, 29.0, 137.0, 394.0, 316.0, 63.0, 12.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-495.2306213378906, -485.6850891113281, -476.13958740234375, -466.59405517578125, -457.0485534667969, -447.5030212402344, -437.95751953125, -428.4119873046875, -418.866455078125, -409.3209228515625, -399.7754211425781, -390.2298889160156, -380.68438720703125, -371.13885498046875, -361.5933532714844, -352.0478210449219, -342.5023193359375, -332.956787109375, -323.4112854003906, -313.8657531738281, -304.32025146484375, -294.77471923828125, -285.2292175292969, -275.6836853027344, -266.13818359375, -256.5926513671875, -247.04714965820312, -237.5016326904297, -227.95611572265625, -218.41058349609375, -208.8650665283203, -199.31954956054688, -189.7740478515625, -180.22853088378906, -170.68301391601562, -161.1374969482422, -151.59197998046875, -142.04644775390625, -132.5009307861328, -122.95541381835938, -113.40989685058594, -103.8643798828125, -94.31886291503906, -84.7733383178711, -75.22782135009766, -65.68230438232422, -56.136783599853516, -46.59126281738281, -37.045745849609375, -27.500226974487305, -17.954708099365234, -8.409189224243164, 1.1363296508789062, 10.681846618652344, 20.227367401123047, 29.77288818359375, 39.31840515136719, 48.863922119140625, 58.40944290161133, 67.95496368408203, 77.50048065185547, 87.0459976196289, 96.59152221679688, 106.13703918457031, 115.68255615234375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 20.0, 23.0, 80.0, 134.0, 167.0, 178.0, 151.0, 123.0, 66.0, 30.0, 12.0, 9.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-222.01504516601562, -215.07904052734375, -208.1430206298828, -201.20701599121094, -194.27101135253906, -187.33499145507812, -180.39898681640625, -173.46298217773438, -166.5269775390625, -159.59097290039062, -152.6549530029297, -145.7189483642578, -138.78294372558594, -131.846923828125, -124.91091918945312, -117.97491455078125, -111.03890228271484, -104.10289001464844, -97.16688537597656, -90.23087310791016, -83.29486846923828, -76.35885620117188, -69.4228515625, -62.486839294433594, -55.55083084106445, -48.61482238769531, -41.67881393432617, -34.74280548095703, -27.806795120239258, -20.870784759521484, -13.934776306152344, -6.998767852783203, -0.0627593994140625, 6.873249530792236, 13.809258460998535, 20.745267868041992, 27.681276321411133, 34.617286682128906, 41.55329513549805, 48.48930358886719, 55.42531204223633, 62.36132049560547, 69.29733276367188, 76.23333740234375, 83.16934967041016, 90.10536193847656, 97.04136657714844, 103.97737121582031, 110.91338348388672, 117.84939575195312, 124.785400390625, 131.72140502929688, 138.6574249267578, 145.5934295654297, 152.52943420410156, 159.4654541015625, 166.40145874023438, 173.33746337890625, 180.2734832763672, 187.20948791503906, 194.14549255371094, 201.08151245117188, 208.01751708984375, 214.95352172851562, 221.8895263671875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 6.0, 8.0, 21.0, 29.0, 30.0, 60.0, 65.0, 116.0, 205.0, 311.0, 601.0, 1242.0, 3083.0, 9673.0, 39161.0, 208137.0, 553017.0, 183619.0, 34966.0, 8750.0, 2818.0, 1205.0, 592.0, 309.0, 169.0, 124.0, 73.0, 46.0, 35.0, 26.0, 18.0, 6.0, 10.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.296875, -17.8084716796875, -17.320068359375, -16.8316650390625, -16.34326171875, -15.8548583984375, -15.366455078125, -14.8780517578125, -14.3896484375, -13.9012451171875, -13.412841796875, -12.9244384765625, -12.43603515625, -11.9476318359375, -11.459228515625, -10.9708251953125, -10.482421875, -9.9940185546875, -9.505615234375, -9.0172119140625, -8.52880859375, -8.0404052734375, -7.552001953125, -7.0635986328125, -6.5751953125, -6.0867919921875, -5.598388671875, -5.1099853515625, -4.62158203125, -4.1331787109375, -3.644775390625, -3.1563720703125, -2.66796875, -2.1795654296875, -1.691162109375, -1.2027587890625, -0.71435546875, -0.2259521484375, 0.262451171875, 0.7508544921875, 1.2392578125, 1.7276611328125, 2.216064453125, 2.7044677734375, 3.19287109375, 3.6812744140625, 4.169677734375, 4.6580810546875, 5.146484375, 5.6348876953125, 6.123291015625, 6.6116943359375, 7.10009765625, 7.5885009765625, 8.076904296875, 8.5653076171875, 9.0537109375, 9.5421142578125, 10.030517578125, 10.5189208984375, 11.00732421875, 11.4957275390625, 11.984130859375, 12.4725341796875, 12.9609375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 13.0, 16.0, 23.0, 43.0, 65.0, 64.0, 88.0, 116.0, 115.0, 71.0, 103.0, 76.0, 71.0, 50.0, 39.0, 16.0, 14.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.28125, -10.888671875, -10.49609375, -10.103515625, -9.7109375, -9.318359375, -8.92578125, -8.533203125, -8.140625, -7.748046875, -7.35546875, -6.962890625, -6.5703125, -6.177734375, -5.78515625, -5.392578125, -5.0, -4.607421875, -4.21484375, -3.822265625, -3.4296875, -3.037109375, -2.64453125, -2.251953125, -1.859375, -1.466796875, -1.07421875, -0.681640625, -0.2890625, 0.103515625, 0.49609375, 0.888671875, 1.28125, 1.673828125, 2.06640625, 2.458984375, 2.8515625, 3.244140625, 3.63671875, 4.029296875, 4.421875, 4.814453125, 5.20703125, 5.599609375, 5.9921875, 6.384765625, 6.77734375, 7.169921875, 7.5625, 7.955078125, 8.34765625, 8.740234375, 9.1328125, 9.525390625, 9.91796875, 10.310546875, 10.703125, 11.095703125, 11.48828125, 11.880859375, 12.2734375, 12.666015625, 13.05859375, 13.451171875, 13.84375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 8.0, 11.0, 16.0, 26.0, 22.0, 32.0, 40.0, 71.0, 88.0, 153.0, 260.0, 408.0, 730.0, 1507.0, 3385.0, 8093.0, 22978.0, 78342.0, 318335.0, 484471.0, 88297.0, 25045.0, 8855.0, 3678.0, 1640.0, 821.0, 440.0, 264.0, 130.0, 131.0, 85.0, 47.0, 45.0, 22.0, 16.0, 10.0, 14.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.7421875, -11.337890625, -10.93359375, -10.529296875, -10.125, -9.720703125, -9.31640625, -8.912109375, -8.5078125, -8.103515625, -7.69921875, -7.294921875, -6.890625, -6.486328125, -6.08203125, -5.677734375, -5.2734375, -4.869140625, -4.46484375, -4.060546875, -3.65625, -3.251953125, -2.84765625, -2.443359375, -2.0390625, -1.634765625, -1.23046875, -0.826171875, -0.421875, -0.017578125, 0.38671875, 0.791015625, 1.1953125, 1.599609375, 2.00390625, 2.408203125, 2.8125, 3.216796875, 3.62109375, 4.025390625, 4.4296875, 4.833984375, 5.23828125, 5.642578125, 6.046875, 6.451171875, 6.85546875, 7.259765625, 7.6640625, 8.068359375, 8.47265625, 8.876953125, 9.28125, 9.685546875, 10.08984375, 10.494140625, 10.8984375, 11.302734375, 11.70703125, 12.111328125, 12.515625, 12.919921875, 13.32421875, 13.728515625, 14.1328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 7.0, 12.0, 11.0, 18.0, 26.0, 19.0, 24.0, 32.0, 40.0, 41.0, 49.0, 42.0, 48.0, 60.0, 43.0, 49.0, 53.0, 47.0, 46.0, 40.0, 45.0, 36.0, 34.0, 24.0, 38.0, 17.0, 10.0, 19.0, 13.0, 8.0, 9.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-26.640625, -25.88623046875, -25.1318359375, -24.37744140625, -23.623046875, -22.86865234375, -22.1142578125, -21.35986328125, -20.60546875, -19.85107421875, -19.0966796875, -18.34228515625, -17.587890625, -16.83349609375, -16.0791015625, -15.32470703125, -14.5703125, -13.81591796875, -13.0615234375, -12.30712890625, -11.552734375, -10.79833984375, -10.0439453125, -9.28955078125, -8.53515625, -7.78076171875, -7.0263671875, -6.27197265625, -5.517578125, -4.76318359375, -4.0087890625, -3.25439453125, -2.5, -1.74560546875, -0.9912109375, -0.23681640625, 0.517578125, 1.27197265625, 2.0263671875, 2.78076171875, 3.53515625, 4.28955078125, 5.0439453125, 5.79833984375, 6.552734375, 7.30712890625, 8.0615234375, 8.81591796875, 9.5703125, 10.32470703125, 11.0791015625, 11.83349609375, 12.587890625, 13.34228515625, 14.0966796875, 14.85107421875, 15.60546875, 16.35986328125, 17.1142578125, 17.86865234375, 18.623046875, 19.37744140625, 20.1318359375, 20.88623046875, 21.640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 5.0, 8.0, 10.0, 35.0, 44.0, 76.0, 112.0, 257.0, 504.0, 1249.0, 3785.0, 13672.0, 64986.0, 624276.0, 282924.0, 42184.0, 9792.0, 2769.0, 990.0, 418.0, 187.0, 93.0, 61.0, 28.0, 26.0, 15.0, 9.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.10211181640625, -4.9190673828125, -4.73602294921875, -4.552978515625, -4.36993408203125, -4.1868896484375, -4.00384521484375, -3.82080078125, -3.63775634765625, -3.4547119140625, -3.27166748046875, -3.088623046875, -2.90557861328125, -2.7225341796875, -2.53948974609375, -2.3564453125, -2.17340087890625, -1.9903564453125, -1.80731201171875, -1.624267578125, -1.44122314453125, -1.2581787109375, -1.07513427734375, -0.89208984375, -0.70904541015625, -0.5260009765625, -0.34295654296875, -0.159912109375, 0.02313232421875, 0.2061767578125, 0.38922119140625, 0.572265625, 0.75531005859375, 0.9383544921875, 1.12139892578125, 1.304443359375, 1.48748779296875, 1.6705322265625, 1.85357666015625, 2.03662109375, 2.21966552734375, 2.4027099609375, 2.58575439453125, 2.768798828125, 2.95184326171875, 3.1348876953125, 3.31793212890625, 3.5009765625, 3.68402099609375, 3.8670654296875, 4.05010986328125, 4.233154296875, 4.41619873046875, 4.5992431640625, 4.78228759765625, 4.96533203125, 5.14837646484375, 5.3314208984375, 5.51446533203125, 5.697509765625, 5.88055419921875, 6.0635986328125, 6.24664306640625, 6.4296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 10.0, 10.0, 14.0, 19.0, 22.0, 34.0, 42.0, 64.0, 77.0, 94.0, 115.0, 108.0, 87.0, 60.0, 53.0, 32.0, 31.0, 28.0, 13.0, 14.0, 12.0, 10.0, 11.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0011930465698242188, -0.0011605098843574524, -0.001127973198890686, -0.0010954365134239197, -0.0010628998279571533, -0.001030363142490387, -0.0009978264570236206, -0.0009652897715568542, -0.0009327530860900879, -0.0009002164006233215, -0.0008676797151565552, -0.0008351430296897888, -0.0008026063442230225, -0.0007700696587562561, -0.0007375329732894897, -0.0007049962878227234, -0.000672459602355957, -0.0006399229168891907, -0.0006073862314224243, -0.000574849545955658, -0.0005423128604888916, -0.0005097761750221252, -0.0004772394895553589, -0.00044470280408859253, -0.00041216611862182617, -0.0003796294331550598, -0.00034709274768829346, -0.0003145560622215271, -0.00028201937675476074, -0.0002494826912879944, -0.00021694600582122803, -0.00018440932035446167, -0.0001518726348876953, -0.00011933594942092896, -8.67992639541626e-05, -5.426257848739624e-05, -2.1725893020629883e-05, 1.0810792446136475e-05, 4.334747791290283e-05, 7.588416337966919e-05, 0.00010842084884643555, 0.0001409575343132019, 0.00017349421977996826, 0.00020603090524673462, 0.00023856759071350098, 0.00027110427618026733, 0.0003036409616470337, 0.00033617764711380005, 0.0003687143325805664, 0.00040125101804733276, 0.0004337877035140991, 0.0004663243889808655, 0.0004988610744476318, 0.0005313977599143982, 0.0005639344453811646, 0.0005964711308479309, 0.0006290078163146973, 0.0006615445017814636, 0.00069408118724823, 0.0007266178727149963, 0.0007591545581817627, 0.000791691243648529, 0.0008242279291152954, 0.0008567646145820618, 0.0008893013000488281]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 13.0, 6.0, 14.0, 32.0, 64.0, 104.0, 207.0, 343.0, 658.0, 1579.0, 3876.0, 10958.0, 37166.0, 179200.0, 649352.0, 122816.0, 27967.0, 8604.0, 3134.0, 1225.0, 581.0, 276.0, 141.0, 101.0, 53.0, 28.0, 17.0, 13.0, 7.0, 5.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.203125, -5.04248046875, -4.8818359375, -4.72119140625, -4.560546875, -4.39990234375, -4.2392578125, -4.07861328125, -3.91796875, -3.75732421875, -3.5966796875, -3.43603515625, -3.275390625, -3.11474609375, -2.9541015625, -2.79345703125, -2.6328125, -2.47216796875, -2.3115234375, -2.15087890625, -1.990234375, -1.82958984375, -1.6689453125, -1.50830078125, -1.34765625, -1.18701171875, -1.0263671875, -0.86572265625, -0.705078125, -0.54443359375, -0.3837890625, -0.22314453125, -0.0625, 0.09814453125, 0.2587890625, 0.41943359375, 0.580078125, 0.74072265625, 0.9013671875, 1.06201171875, 1.22265625, 1.38330078125, 1.5439453125, 1.70458984375, 1.865234375, 2.02587890625, 2.1865234375, 2.34716796875, 2.5078125, 2.66845703125, 2.8291015625, 2.98974609375, 3.150390625, 3.31103515625, 3.4716796875, 3.63232421875, 3.79296875, 3.95361328125, 4.1142578125, 4.27490234375, 4.435546875, 4.59619140625, 4.7568359375, 4.91748046875, 5.078125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 10.0, 4.0, 4.0, 21.0, 32.0, 32.0, 43.0, 48.0, 74.0, 108.0, 134.0, 125.0, 106.0, 86.0, 47.0, 35.0, 33.0, 14.0, 10.0, 15.0, 4.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30859375, -5.09661865234375, -4.8846435546875, -4.67266845703125, -4.460693359375, -4.24871826171875, -4.0367431640625, -3.82476806640625, -3.61279296875, -3.40081787109375, -3.1888427734375, -2.97686767578125, -2.764892578125, -2.55291748046875, -2.3409423828125, -2.12896728515625, -1.9169921875, -1.70501708984375, -1.4930419921875, -1.28106689453125, -1.069091796875, -0.85711669921875, -0.6451416015625, -0.43316650390625, -0.22119140625, -0.00921630859375, 0.2027587890625, 0.41473388671875, 0.626708984375, 0.83868408203125, 1.0506591796875, 1.26263427734375, 1.474609375, 1.68658447265625, 1.8985595703125, 2.11053466796875, 2.322509765625, 2.53448486328125, 2.7464599609375, 2.95843505859375, 3.17041015625, 3.38238525390625, 3.5943603515625, 3.80633544921875, 4.018310546875, 4.23028564453125, 4.4422607421875, 4.65423583984375, 4.8662109375, 5.07818603515625, 5.2901611328125, 5.50213623046875, 5.714111328125, 5.92608642578125, 6.1380615234375, 6.35003662109375, 6.56201171875, 6.77398681640625, 6.9859619140625, 7.19793701171875, 7.409912109375, 7.62188720703125, 7.8338623046875, 8.04583740234375, 8.2578125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 2.0, 0.0, 2.0, 9.0, 9.0, 24.0, 60.0, 124.0, 263.0, 260.0, 140.0, 61.0, 21.0, 11.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-151.759033203125, -146.1371307373047, -140.51522827148438, -134.89332580566406, -129.27142333984375, -123.64952850341797, -118.02763366699219, -112.40573120117188, -106.78382873535156, -101.16192626953125, -95.54002380371094, -89.91812896728516, -84.29622650146484, -78.67432403564453, -73.05242919921875, -67.43052673339844, -61.808624267578125, -56.18672180175781, -50.564823150634766, -44.94292449951172, -39.321022033691406, -33.699119567871094, -28.077220916748047, -22.455322265625, -16.833419799804688, -11.211519241333008, -5.589618682861328, 0.03228187561035156, 5.654182434082031, 11.276082992553711, 16.89798355102539, 22.519882202148438, 28.141769409179688, 33.763671875, 39.38557052612305, 45.007469177246094, 50.629371643066406, 56.25127410888672, 61.873172760009766, 67.49507141113281, 73.11697387695312, 78.73887634277344, 84.36077880859375, 89.98267364501953, 95.60457611083984, 101.22647857666016, 106.84837341308594, 112.47027587890625, 118.09217834472656, 123.71408081054688, 129.3359832763672, 134.9578857421875, 140.57977294921875, 146.20167541503906, 151.82357788085938, 157.4454803466797, 163.0673828125, 168.6892852783203, 174.31118774414062, 179.93309020996094, 185.55499267578125, 191.1768798828125, 196.7987823486328, 202.42068481445312, 208.04258728027344]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 16.0, 10.0, 11.0, 10.0, 20.0, 20.0, 25.0, 29.0, 27.0, 31.0, 42.0, 34.0, 60.0, 59.0, 78.0, 83.0, 73.0, 59.0, 43.0, 45.0, 39.0, 22.0, 24.0, 25.0, 19.0, 26.0, 18.0, 11.0, 7.0, 8.0, 12.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-103.9564437866211, -100.84193420410156, -97.72743225097656, -94.61293029785156, -91.49842071533203, -88.3839111328125, -85.2694091796875, -82.1549072265625, -79.04039764404297, -75.92588806152344, -72.81138610839844, -69.69688415527344, -66.5823745727539, -63.46786880493164, -60.353363037109375, -57.23885726928711, -54.124351501464844, -51.00984573364258, -47.89533996582031, -44.78083419799805, -41.66632843017578, -38.551822662353516, -35.43731689453125, -32.322811126708984, -29.20830535888672, -26.093799591064453, -22.979293823242188, -19.864788055419922, -16.750282287597656, -13.63577651977539, -10.521270751953125, -7.406764984130859, -4.292266845703125, -1.1777610778808594, 1.9367446899414062, 5.051250457763672, 8.165756225585938, 11.280261993408203, 14.394767761230469, 17.509273529052734, 20.623779296875, 23.738285064697266, 26.85279083251953, 29.967296600341797, 33.08180236816406, 36.19630813598633, 39.310813903808594, 42.42531967163086, 45.539825439453125, 48.65433120727539, 51.768836975097656, 54.88334274291992, 57.99784851074219, 61.11235427856445, 64.22686004638672, 67.34136962890625, 70.45587158203125, 73.57037353515625, 76.68488311767578, 79.79939270019531, 82.91389465332031, 86.02839660644531, 89.14290618896484, 92.25741577148438, 95.37191772460938]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 9.0, 13.0, 13.0, 24.0, 25.0, 58.0, 112.0, 188.0, 439.0, 1043.0, 2801.0, 9185.0, 57951.0, 1964138.0, 2082285.0, 61467.0, 9897.0, 2665.0, 1031.0, 480.0, 191.0, 116.0, 62.0, 30.0, 16.0, 11.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.875, -17.42822265625, -16.9814453125, -16.53466796875, -16.087890625, -15.64111328125, -15.1943359375, -14.74755859375, -14.30078125, -13.85400390625, -13.4072265625, -12.96044921875, -12.513671875, -12.06689453125, -11.6201171875, -11.17333984375, -10.7265625, -10.27978515625, -9.8330078125, -9.38623046875, -8.939453125, -8.49267578125, -8.0458984375, -7.59912109375, -7.15234375, -6.70556640625, -6.2587890625, -5.81201171875, -5.365234375, -4.91845703125, -4.4716796875, -4.02490234375, -3.578125, -3.13134765625, -2.6845703125, -2.23779296875, -1.791015625, -1.34423828125, -0.8974609375, -0.45068359375, -0.00390625, 0.44287109375, 0.8896484375, 1.33642578125, 1.783203125, 2.22998046875, 2.6767578125, 3.12353515625, 3.5703125, 4.01708984375, 4.4638671875, 4.91064453125, 5.357421875, 5.80419921875, 6.2509765625, 6.69775390625, 7.14453125, 7.59130859375, 8.0380859375, 8.48486328125, 8.931640625, 9.37841796875, 9.8251953125, 10.27197265625, 10.71875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 16.0, 10.0, 20.0, 29.0, 42.0, 52.0, 73.0, 76.0, 78.0, 104.0, 92.0, 90.0, 72.0, 62.0, 56.0, 43.0, 28.0, 18.0, 15.0, 9.0, 7.0, 3.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.735107421875, -10.39990234375, -10.064697265625, -9.7294921875, -9.394287109375, -9.05908203125, -8.723876953125, -8.388671875, -8.053466796875, -7.71826171875, -7.383056640625, -7.0478515625, -6.712646484375, -6.37744140625, -6.042236328125, -5.70703125, -5.371826171875, -5.03662109375, -4.701416015625, -4.3662109375, -4.031005859375, -3.69580078125, -3.360595703125, -3.025390625, -2.690185546875, -2.35498046875, -2.019775390625, -1.6845703125, -1.349365234375, -1.01416015625, -0.678955078125, -0.34375, -0.008544921875, 0.32666015625, 0.661865234375, 0.9970703125, 1.332275390625, 1.66748046875, 2.002685546875, 2.337890625, 2.673095703125, 3.00830078125, 3.343505859375, 3.6787109375, 4.013916015625, 4.34912109375, 4.684326171875, 5.01953125, 5.354736328125, 5.68994140625, 6.025146484375, 6.3603515625, 6.695556640625, 7.03076171875, 7.365966796875, 7.701171875, 8.036376953125, 8.37158203125, 8.706787109375, 9.0419921875, 9.377197265625, 9.71240234375, 10.047607421875, 10.3828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 10.0, 12.0, 13.0, 32.0, 46.0, 91.0, 145.0, 326.0, 707.0, 2222.0, 14249.0, 817005.0, 3328022.0, 26574.0, 3290.0, 845.0, 355.0, 152.0, 80.0, 36.0, 26.0, 14.0, 8.0, 10.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.96875, -24.19140625, -23.4140625, -22.63671875, -21.859375, -21.08203125, -20.3046875, -19.52734375, -18.75, -17.97265625, -17.1953125, -16.41796875, -15.640625, -14.86328125, -14.0859375, -13.30859375, -12.53125, -11.75390625, -10.9765625, -10.19921875, -9.421875, -8.64453125, -7.8671875, -7.08984375, -6.3125, -5.53515625, -4.7578125, -3.98046875, -3.203125, -2.42578125, -1.6484375, -0.87109375, -0.09375, 0.68359375, 1.4609375, 2.23828125, 3.015625, 3.79296875, 4.5703125, 5.34765625, 6.125, 6.90234375, 7.6796875, 8.45703125, 9.234375, 10.01171875, 10.7890625, 11.56640625, 12.34375, 13.12109375, 13.8984375, 14.67578125, 15.453125, 16.23046875, 17.0078125, 17.78515625, 18.5625, 19.33984375, 20.1171875, 20.89453125, 21.671875, 22.44921875, 23.2265625, 24.00390625, 24.78125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 10.0, 5.0, 32.0, 31.0, 34.0, 66.0, 146.0, 350.0, 769.0, 1116.0, 765.0, 373.0, 167.0, 87.0, 48.0, 33.0, 11.0, 13.0, 4.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.921875, -17.3876953125, -16.853515625, -16.3193359375, -15.78515625, -15.2509765625, -14.716796875, -14.1826171875, -13.6484375, -13.1142578125, -12.580078125, -12.0458984375, -11.51171875, -10.9775390625, -10.443359375, -9.9091796875, -9.375, -8.8408203125, -8.306640625, -7.7724609375, -7.23828125, -6.7041015625, -6.169921875, -5.6357421875, -5.1015625, -4.5673828125, -4.033203125, -3.4990234375, -2.96484375, -2.4306640625, -1.896484375, -1.3623046875, -0.828125, -0.2939453125, 0.240234375, 0.7744140625, 1.30859375, 1.8427734375, 2.376953125, 2.9111328125, 3.4453125, 3.9794921875, 4.513671875, 5.0478515625, 5.58203125, 6.1162109375, 6.650390625, 7.1845703125, 7.71875, 8.2529296875, 8.787109375, 9.3212890625, 9.85546875, 10.3896484375, 10.923828125, 11.4580078125, 11.9921875, 12.5263671875, 13.060546875, 13.5947265625, 14.12890625, 14.6630859375, 15.197265625, 15.7314453125, 16.265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 0.0, 4.0, 6.0, 9.0, 21.0, 39.0, 58.0, 134.0, 186.0, 226.0, 158.0, 82.0, 36.0, 19.0, 11.0, 9.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.17530822753906, -132.91171264648438, -128.64810180664062, -124.3844985961914, -120.12089538574219, -115.8572998046875, -111.59369659423828, -107.33009338378906, -103.06649017333984, -98.80288696289062, -94.5392837524414, -90.27568054199219, -86.0120849609375, -81.74847412109375, -77.48487854003906, -73.22127532958984, -68.95767211914062, -64.6940689086914, -60.43046569824219, -56.166866302490234, -51.903263092041016, -47.6396598815918, -43.376060485839844, -39.112457275390625, -34.848854064941406, -30.585250854492188, -26.3216495513916, -22.058048248291016, -17.794445037841797, -13.530841827392578, -9.267240524291992, -5.003639221191406, -0.7400360107421875, 3.523566246032715, 7.787168502807617, 12.05077075958252, 16.314373016357422, 20.57797622680664, 24.841577529907227, 29.105178833007812, 33.36878204345703, 37.63238525390625, 41.89598846435547, 46.15958786010742, 50.42319107055664, 54.68679428100586, 58.95039367675781, 63.21399688720703, 67.47760009765625, 71.74120330810547, 76.00480651855469, 80.2684097290039, 84.53201293945312, 88.79560852050781, 93.05921173095703, 97.32281494140625, 101.58641815185547, 105.85002136230469, 110.1136245727539, 114.37722778320312, 118.64082336425781, 122.90443420410156, 127.16802978515625, 131.431640625, 135.6952362060547]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 8.0, 12.0, 19.0, 24.0, 17.0, 24.0, 27.0, 40.0, 32.0, 45.0, 50.0, 60.0, 37.0, 44.0, 49.0, 59.0, 48.0, 67.0, 49.0, 48.0, 43.0, 30.0, 32.0, 30.0, 20.0, 20.0, 11.0, 11.0, 5.0, 10.0, 5.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.948997497558594, -61.10185623168945, -59.25471878051758, -57.40757751464844, -55.56044006347656, -53.71329879760742, -51.86615753173828, -50.019020080566406, -48.171878814697266, -46.324737548828125, -44.47760009765625, -42.63045883178711, -40.78331756591797, -38.936180114746094, -37.08903884887695, -35.24189758300781, -33.39476013183594, -31.54762077331543, -29.700481414794922, -27.85334014892578, -26.006200790405273, -24.159061431884766, -22.311920166015625, -20.464780807495117, -18.61764144897461, -16.7705020904541, -14.923361778259277, -13.076221466064453, -11.229082107543945, -9.381942749023438, -7.534802436828613, -5.687662124633789, -3.8405227661132812, -1.9933829307556152, -0.14624309539794922, 1.7008967399597168, 3.548036575317383, 5.395175933837891, 7.242316246032715, 9.089456558227539, 10.936595916748047, 12.783735275268555, 14.630875587463379, 16.478015899658203, 18.32515525817871, 20.17229461669922, 22.01943588256836, 23.866575241088867, 25.713714599609375, 27.560853958129883, 29.40799331665039, 31.25513458251953, 33.102272033691406, 34.94941329956055, 36.79655456542969, 38.64369201660156, 40.4908332824707, 42.337974548339844, 44.18511199951172, 46.03225326538086, 47.87939453125, 49.726531982421875, 51.573673248291016, 53.420814514160156, 55.26795196533203]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 10.0, 16.0, 15.0, 37.0, 29.0, 48.0, 92.0, 139.0, 211.0, 359.0, 609.0, 1159.0, 2534.0, 5590.0, 15180.0, 48288.0, 176382.0, 459863.0, 240771.0, 64592.0, 19381.0, 7073.0, 2941.0, 1421.0, 729.0, 409.0, 220.0, 136.0, 82.0, 61.0, 55.0, 30.0, 25.0, 11.0, 9.0, 10.0, 9.0, 5.0, 3.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.1268310546875, -9.784912109375, -9.4429931640625, -9.10107421875, -8.7591552734375, -8.417236328125, -8.0753173828125, -7.7333984375, -7.3914794921875, -7.049560546875, -6.7076416015625, -6.36572265625, -6.0238037109375, -5.681884765625, -5.3399658203125, -4.998046875, -4.6561279296875, -4.314208984375, -3.9722900390625, -3.63037109375, -3.2884521484375, -2.946533203125, -2.6046142578125, -2.2626953125, -1.9207763671875, -1.578857421875, -1.2369384765625, -0.89501953125, -0.5531005859375, -0.211181640625, 0.1307373046875, 0.47265625, 0.8145751953125, 1.156494140625, 1.4984130859375, 1.84033203125, 2.1822509765625, 2.524169921875, 2.8660888671875, 3.2080078125, 3.5499267578125, 3.891845703125, 4.2337646484375, 4.57568359375, 4.9176025390625, 5.259521484375, 5.6014404296875, 5.943359375, 6.2852783203125, 6.627197265625, 6.9691162109375, 7.31103515625, 7.6529541015625, 7.994873046875, 8.3367919921875, 8.6787109375, 9.0206298828125, 9.362548828125, 9.7044677734375, 10.04638671875, 10.3883056640625, 10.730224609375, 11.0721435546875, 11.4140625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 9.0, 14.0, 31.0, 35.0, 50.0, 56.0, 45.0, 86.0, 71.0, 86.0, 84.0, 94.0, 83.0, 70.0, 41.0, 44.0, 30.0, 27.0, 13.0, 12.0, 2.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.03125, -10.69677734375, -10.3623046875, -10.02783203125, -9.693359375, -9.35888671875, -9.0244140625, -8.68994140625, -8.35546875, -8.02099609375, -7.6865234375, -7.35205078125, -7.017578125, -6.68310546875, -6.3486328125, -6.01416015625, -5.6796875, -5.34521484375, -5.0107421875, -4.67626953125, -4.341796875, -4.00732421875, -3.6728515625, -3.33837890625, -3.00390625, -2.66943359375, -2.3349609375, -2.00048828125, -1.666015625, -1.33154296875, -0.9970703125, -0.66259765625, -0.328125, 0.00634765625, 0.3408203125, 0.67529296875, 1.009765625, 1.34423828125, 1.6787109375, 2.01318359375, 2.34765625, 2.68212890625, 3.0166015625, 3.35107421875, 3.685546875, 4.02001953125, 4.3544921875, 4.68896484375, 5.0234375, 5.35791015625, 5.6923828125, 6.02685546875, 6.361328125, 6.69580078125, 7.0302734375, 7.36474609375, 7.69921875, 8.03369140625, 8.3681640625, 8.70263671875, 9.037109375, 9.37158203125, 9.7060546875, 10.04052734375, 10.375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 4.0, 11.0, 7.0, 10.0, 22.0, 17.0, 26.0, 30.0, 51.0, 85.0, 113.0, 154.0, 238.0, 397.0, 616.0, 1267.0, 3389.0, 14239.0, 108305.0, 781648.0, 116271.0, 15063.0, 3503.0, 1259.0, 642.0, 397.0, 234.0, 149.0, 103.0, 102.0, 47.0, 35.0, 33.0, 18.0, 18.0, 11.0, 8.0, 6.0, 3.0, 4.0, 4.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-20.21875, -19.615478515625, -19.01220703125, -18.408935546875, -17.8056640625, -17.202392578125, -16.59912109375, -15.995849609375, -15.392578125, -14.789306640625, -14.18603515625, -13.582763671875, -12.9794921875, -12.376220703125, -11.77294921875, -11.169677734375, -10.56640625, -9.963134765625, -9.35986328125, -8.756591796875, -8.1533203125, -7.550048828125, -6.94677734375, -6.343505859375, -5.740234375, -5.136962890625, -4.53369140625, -3.930419921875, -3.3271484375, -2.723876953125, -2.12060546875, -1.517333984375, -0.9140625, -0.310791015625, 0.29248046875, 0.895751953125, 1.4990234375, 2.102294921875, 2.70556640625, 3.308837890625, 3.912109375, 4.515380859375, 5.11865234375, 5.721923828125, 6.3251953125, 6.928466796875, 7.53173828125, 8.135009765625, 8.73828125, 9.341552734375, 9.94482421875, 10.548095703125, 11.1513671875, 11.754638671875, 12.35791015625, 12.961181640625, 13.564453125, 14.167724609375, 14.77099609375, 15.374267578125, 15.9775390625, 16.580810546875, 17.18408203125, 17.787353515625, 18.390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 17.0, 8.0, 14.0, 18.0, 13.0, 27.0, 31.0, 32.0, 26.0, 35.0, 45.0, 36.0, 54.0, 45.0, 52.0, 40.0, 45.0, 59.0, 39.0, 56.0, 44.0, 39.0, 42.0, 32.0, 33.0, 15.0, 19.0, 11.0, 9.0, 9.0, 7.0, 11.0, 6.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.734375, -18.013916015625, -17.29345703125, -16.572998046875, -15.8525390625, -15.132080078125, -14.41162109375, -13.691162109375, -12.970703125, -12.250244140625, -11.52978515625, -10.809326171875, -10.0888671875, -9.368408203125, -8.64794921875, -7.927490234375, -7.20703125, -6.486572265625, -5.76611328125, -5.045654296875, -4.3251953125, -3.604736328125, -2.88427734375, -2.163818359375, -1.443359375, -0.722900390625, -0.00244140625, 0.718017578125, 1.4384765625, 2.158935546875, 2.87939453125, 3.599853515625, 4.3203125, 5.040771484375, 5.76123046875, 6.481689453125, 7.2021484375, 7.922607421875, 8.64306640625, 9.363525390625, 10.083984375, 10.804443359375, 11.52490234375, 12.245361328125, 12.9658203125, 13.686279296875, 14.40673828125, 15.127197265625, 15.84765625, 16.568115234375, 17.28857421875, 18.009033203125, 18.7294921875, 19.449951171875, 20.17041015625, 20.890869140625, 21.611328125, 22.331787109375, 23.05224609375, 23.772705078125, 24.4931640625, 25.213623046875, 25.93408203125, 26.654541015625, 27.375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 8.0, 7.0, 9.0, 15.0, 17.0, 22.0, 29.0, 58.0, 105.0, 162.0, 315.0, 623.0, 1589.0, 4531.0, 17281.0, 89827.0, 811079.0, 97058.0, 17921.0, 4803.0, 1661.0, 677.0, 300.0, 163.0, 113.0, 53.0, 41.0, 21.0, 21.0, 19.0, 9.0, 7.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01953125, -6.79681396484375, -6.5740966796875, -6.35137939453125, -6.128662109375, -5.90594482421875, -5.6832275390625, -5.46051025390625, -5.23779296875, -5.01507568359375, -4.7923583984375, -4.56964111328125, -4.346923828125, -4.12420654296875, -3.9014892578125, -3.67877197265625, -3.4560546875, -3.23333740234375, -3.0106201171875, -2.78790283203125, -2.565185546875, -2.34246826171875, -2.1197509765625, -1.89703369140625, -1.67431640625, -1.45159912109375, -1.2288818359375, -1.00616455078125, -0.783447265625, -0.56072998046875, -0.3380126953125, -0.11529541015625, 0.107421875, 0.33013916015625, 0.5528564453125, 0.77557373046875, 0.998291015625, 1.22100830078125, 1.4437255859375, 1.66644287109375, 1.88916015625, 2.11187744140625, 2.3345947265625, 2.55731201171875, 2.780029296875, 3.00274658203125, 3.2254638671875, 3.44818115234375, 3.6708984375, 3.89361572265625, 4.1163330078125, 4.33905029296875, 4.561767578125, 4.78448486328125, 5.0072021484375, 5.22991943359375, 5.45263671875, 5.67535400390625, 5.8980712890625, 6.12078857421875, 6.343505859375, 6.56622314453125, 6.7889404296875, 7.01165771484375, 7.234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 7.0, 1.0, 7.0, 9.0, 11.0, 9.0, 8.0, 15.0, 28.0, 29.0, 49.0, 74.0, 144.0, 174.0, 135.0, 79.0, 54.0, 47.0, 25.0, 16.0, 16.0, 14.0, 12.0, 8.0, 7.0, 7.0, 5.0, 1.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0015573501586914062, -0.0015123635530471802, -0.001467376947402954, -0.001422390341758728, -0.001377403736114502, -0.0013324171304702759, -0.0012874305248260498, -0.0012424439191818237, -0.0011974573135375977, -0.0011524707078933716, -0.0011074841022491455, -0.0010624974966049194, -0.0010175108909606934, -0.0009725242853164673, -0.0009275376796722412, -0.0008825510740280151, -0.0008375644683837891, -0.000792577862739563, -0.0007475912570953369, -0.0007026046514511108, -0.0006576180458068848, -0.0006126314401626587, -0.0005676448345184326, -0.0005226582288742065, -0.00047767162322998047, -0.0004326850175857544, -0.0003876984119415283, -0.00034271180629730225, -0.00029772520065307617, -0.0002527385950088501, -0.00020775198936462402, -0.00016276538372039795, -0.00011777877807617188, -7.27921724319458e-05, -2.7805566787719727e-05, 1.7181038856506348e-05, 6.216764450073242e-05, 0.0001071542501449585, 0.00015214085578918457, 0.00019712746143341064, 0.00024211406707763672, 0.0002871006727218628, 0.00033208727836608887, 0.00037707388401031494, 0.000422060489654541, 0.0004670470952987671, 0.0005120337009429932, 0.0005570203065872192, 0.0006020069122314453, 0.0006469935178756714, 0.0006919801235198975, 0.0007369667291641235, 0.0007819533348083496, 0.0008269399404525757, 0.0008719265460968018, 0.0009169131517410278, 0.0009618997573852539, 0.00100688636302948, 0.001051872968673706, 0.0010968595743179321, 0.0011418461799621582, 0.0011868327856063843, 0.0012318193912506104, 0.0012768059968948364, 0.0013217926025390625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 1.0, 9.0, 7.0, 7.0, 7.0, 28.0, 16.0, 31.0, 68.0, 110.0, 172.0, 368.0, 724.0, 1846.0, 5878.0, 25173.0, 194394.0, 752768.0, 51898.0, 10178.0, 2781.0, 1036.0, 480.0, 230.0, 116.0, 61.0, 43.0, 28.0, 22.0, 14.0, 12.0, 11.0, 6.0, 6.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69140625, -7.45257568359375, -7.2137451171875, -6.97491455078125, -6.736083984375, -6.49725341796875, -6.2584228515625, -6.01959228515625, -5.78076171875, -5.54193115234375, -5.3031005859375, -5.06427001953125, -4.825439453125, -4.58660888671875, -4.3477783203125, -4.10894775390625, -3.8701171875, -3.63128662109375, -3.3924560546875, -3.15362548828125, -2.914794921875, -2.67596435546875, -2.4371337890625, -2.19830322265625, -1.95947265625, -1.72064208984375, -1.4818115234375, -1.24298095703125, -1.004150390625, -0.76531982421875, -0.5264892578125, -0.28765869140625, -0.048828125, 0.19000244140625, 0.4288330078125, 0.66766357421875, 0.906494140625, 1.14532470703125, 1.3841552734375, 1.62298583984375, 1.86181640625, 2.10064697265625, 2.3394775390625, 2.57830810546875, 2.817138671875, 3.05596923828125, 3.2947998046875, 3.53363037109375, 3.7724609375, 4.01129150390625, 4.2501220703125, 4.48895263671875, 4.727783203125, 4.96661376953125, 5.2054443359375, 5.44427490234375, 5.68310546875, 5.92193603515625, 6.1607666015625, 6.39959716796875, 6.638427734375, 6.87725830078125, 7.1160888671875, 7.35491943359375, 7.59375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 2.0, 13.0, 17.0, 20.0, 27.0, 37.0, 56.0, 84.0, 116.0, 154.0, 134.0, 98.0, 53.0, 46.0, 37.0, 24.0, 18.0, 11.0, 11.0, 9.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0390625, -4.8349609375, -4.630859375, -4.4267578125, -4.22265625, -4.0185546875, -3.814453125, -3.6103515625, -3.40625, -3.2021484375, -2.998046875, -2.7939453125, -2.58984375, -2.3857421875, -2.181640625, -1.9775390625, -1.7734375, -1.5693359375, -1.365234375, -1.1611328125, -0.95703125, -0.7529296875, -0.548828125, -0.3447265625, -0.140625, 0.0634765625, 0.267578125, 0.4716796875, 0.67578125, 0.8798828125, 1.083984375, 1.2880859375, 1.4921875, 1.6962890625, 1.900390625, 2.1044921875, 2.30859375, 2.5126953125, 2.716796875, 2.9208984375, 3.125, 3.3291015625, 3.533203125, 3.7373046875, 3.94140625, 4.1455078125, 4.349609375, 4.5537109375, 4.7578125, 4.9619140625, 5.166015625, 5.3701171875, 5.57421875, 5.7783203125, 5.982421875, 6.1865234375, 6.390625, 6.5947265625, 6.798828125, 7.0029296875, 7.20703125, 7.4111328125, 7.615234375, 7.8193359375, 8.0234375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 23.0, 68.0, 227.0, 456.0, 133.0, 45.0, 19.0, 4.0, 13.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-249.66421508789062, -241.41119384765625, -233.15817260742188, -224.90513610839844, -216.65211486816406, -208.3990936279297, -200.14605712890625, -191.89303588867188, -183.6400146484375, -175.38699340820312, -167.13397216796875, -158.8809356689453, -150.62791442871094, -142.37489318847656, -134.12185668945312, -125.86883544921875, -117.61581420898438, -109.36279296875, -101.1097640991211, -92.85673522949219, -84.60371398925781, -76.35069274902344, -68.09766387939453, -59.84463882446289, -51.59161376953125, -43.33858871459961, -35.08556365966797, -26.832538604736328, -18.579513549804688, -10.326488494873047, -2.0734634399414062, 6.179561614990234, 14.432586669921875, 22.685611724853516, 30.938636779785156, 39.1916618347168, 47.44468688964844, 55.69771194458008, 63.95073699951172, 72.20376586914062, 80.456787109375, 88.70980834960938, 96.96283721923828, 105.21586608886719, 113.46888732910156, 121.72190856933594, 129.97494506835938, 138.22796630859375, 146.48098754882812, 154.7340087890625, 162.98703002929688, 171.2400665283203, 179.4930877685547, 187.74610900878906, 195.9991455078125, 204.25216674804688, 212.50518798828125, 220.75820922851562, 229.01123046875, 237.26426696777344, 245.5172882080078, 253.7703094482422, 262.0233459472656, 270.2763671875, 278.5293884277344]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 6.0, 6.0, 8.0, 8.0, 12.0, 10.0, 11.0, 16.0, 11.0, 16.0, 15.0, 27.0, 32.0, 32.0, 33.0, 24.0, 33.0, 40.0, 56.0, 86.0, 97.0, 59.0, 52.0, 41.0, 35.0, 27.0, 32.0, 21.0, 25.0, 21.0, 18.0, 18.0, 17.0, 7.0, 7.0, 11.0, 9.0, 8.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-81.42921447753906, -78.80274963378906, -76.17628479003906, -73.54981231689453, -70.92334747314453, -68.29688262939453, -65.67041778564453, -63.04395294189453, -60.417484283447266, -57.791019439697266, -55.16455078125, -52.5380859375, -49.91162109375, -47.285152435302734, -44.658687591552734, -42.03221893310547, -39.40575408935547, -36.77928924560547, -34.1528205871582, -31.526355743408203, -28.89988899230957, -26.273422241210938, -23.646957397460938, -21.020490646362305, -18.394023895263672, -15.767557144165039, -13.141091346740723, -10.514625549316406, -7.888158798217773, -5.261692047119141, -2.635226249694824, -0.008760452270507812, 2.617706298828125, 5.2441725730896, 7.870638847351074, 10.49710464477539, 13.123571395874023, 15.750038146972656, 18.376502990722656, 21.00296974182129, 23.629436492919922, 26.255903244018555, 28.882369995117188, 31.508834838867188, 34.13529968261719, 36.76176834106445, 39.38823318481445, 42.01470184326172, 44.64116668701172, 47.26763153076172, 49.894100189208984, 52.520565032958984, 55.14703369140625, 57.77349853515625, 60.39996337890625, 63.02642822265625, 65.65289306640625, 68.27935791015625, 70.90582275390625, 73.53229522705078, 76.15876007080078, 78.78522491455078, 81.41168975830078, 84.03815460205078, 86.66462707519531]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 13.0, 14.0, 25.0, 32.0, 52.0, 90.0, 180.0, 339.0, 715.0, 1765.0, 5551.0, 24913.0, 311656.0, 3310606.0, 495172.0, 32936.0, 6607.0, 1987.0, 777.0, 382.0, 184.0, 119.0, 57.0, 53.0, 17.0, 13.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.5390625, -15.1141357421875, -14.689208984375, -14.2642822265625, -13.83935546875, -13.4144287109375, -12.989501953125, -12.5645751953125, -12.1396484375, -11.7147216796875, -11.289794921875, -10.8648681640625, -10.43994140625, -10.0150146484375, -9.590087890625, -9.1651611328125, -8.740234375, -8.3153076171875, -7.890380859375, -7.4654541015625, -7.04052734375, -6.6156005859375, -6.190673828125, -5.7657470703125, -5.3408203125, -4.9158935546875, -4.490966796875, -4.0660400390625, -3.64111328125, -3.2161865234375, -2.791259765625, -2.3663330078125, -1.94140625, -1.5164794921875, -1.091552734375, -0.6666259765625, -0.24169921875, 0.1832275390625, 0.608154296875, 1.0330810546875, 1.4580078125, 1.8829345703125, 2.307861328125, 2.7327880859375, 3.15771484375, 3.5826416015625, 4.007568359375, 4.4324951171875, 4.857421875, 5.2823486328125, 5.707275390625, 6.1322021484375, 6.55712890625, 6.9820556640625, 7.406982421875, 7.8319091796875, 8.2568359375, 8.6817626953125, 9.106689453125, 9.5316162109375, 9.95654296875, 10.3814697265625, 10.806396484375, 11.2313232421875, 11.65625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 9.0, 8.0, 15.0, 12.0, 34.0, 27.0, 46.0, 53.0, 49.0, 66.0, 65.0, 64.0, 82.0, 76.0, 71.0, 62.0, 56.0, 52.0, 33.0, 34.0, 24.0, 29.0, 11.0, 8.0, 8.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0078125, -10.72186279296875, -10.4359130859375, -10.14996337890625, -9.864013671875, -9.57806396484375, -9.2921142578125, -9.00616455078125, -8.72021484375, -8.43426513671875, -8.1483154296875, -7.86236572265625, -7.576416015625, -7.29046630859375, -7.0045166015625, -6.71856689453125, -6.4326171875, -6.14666748046875, -5.8607177734375, -5.57476806640625, -5.288818359375, -5.00286865234375, -4.7169189453125, -4.43096923828125, -4.14501953125, -3.85906982421875, -3.5731201171875, -3.28717041015625, -3.001220703125, -2.71527099609375, -2.4293212890625, -2.14337158203125, -1.857421875, -1.57147216796875, -1.2855224609375, -0.99957275390625, -0.713623046875, -0.42767333984375, -0.1417236328125, 0.14422607421875, 0.43017578125, 0.71612548828125, 1.0020751953125, 1.28802490234375, 1.573974609375, 1.85992431640625, 2.1458740234375, 2.43182373046875, 2.7177734375, 3.00372314453125, 3.2896728515625, 3.57562255859375, 3.861572265625, 4.14752197265625, 4.4334716796875, 4.71942138671875, 5.00537109375, 5.29132080078125, 5.5772705078125, 5.86322021484375, 6.149169921875, 6.43511962890625, 6.7210693359375, 7.00701904296875, 7.29296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 5.0, 14.0, 24.0, 26.0, 50.0, 68.0, 128.0, 233.0, 462.0, 1060.0, 3982.0, 40920.0, 3860066.0, 274568.0, 9637.0, 1741.0, 623.0, 308.0, 153.0, 74.0, 50.0, 26.0, 18.0, 14.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.546875, -26.705078125, -25.86328125, -25.021484375, -24.1796875, -23.337890625, -22.49609375, -21.654296875, -20.8125, -19.970703125, -19.12890625, -18.287109375, -17.4453125, -16.603515625, -15.76171875, -14.919921875, -14.078125, -13.236328125, -12.39453125, -11.552734375, -10.7109375, -9.869140625, -9.02734375, -8.185546875, -7.34375, -6.501953125, -5.66015625, -4.818359375, -3.9765625, -3.134765625, -2.29296875, -1.451171875, -0.609375, 0.232421875, 1.07421875, 1.916015625, 2.7578125, 3.599609375, 4.44140625, 5.283203125, 6.125, 6.966796875, 7.80859375, 8.650390625, 9.4921875, 10.333984375, 11.17578125, 12.017578125, 12.859375, 13.701171875, 14.54296875, 15.384765625, 16.2265625, 17.068359375, 17.91015625, 18.751953125, 19.59375, 20.435546875, 21.27734375, 22.119140625, 22.9609375, 23.802734375, 24.64453125, 25.486328125, 26.328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 13.0, 7.0, 14.0, 24.0, 33.0, 46.0, 93.0, 179.0, 323.0, 747.0, 1050.0, 738.0, 375.0, 181.0, 93.0, 57.0, 31.0, 23.0, 17.0, 13.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.3125, -22.751953125, -22.19140625, -21.630859375, -21.0703125, -20.509765625, -19.94921875, -19.388671875, -18.828125, -18.267578125, -17.70703125, -17.146484375, -16.5859375, -16.025390625, -15.46484375, -14.904296875, -14.34375, -13.783203125, -13.22265625, -12.662109375, -12.1015625, -11.541015625, -10.98046875, -10.419921875, -9.859375, -9.298828125, -8.73828125, -8.177734375, -7.6171875, -7.056640625, -6.49609375, -5.935546875, -5.375, -4.814453125, -4.25390625, -3.693359375, -3.1328125, -2.572265625, -2.01171875, -1.451171875, -0.890625, -0.330078125, 0.23046875, 0.791015625, 1.3515625, 1.912109375, 2.47265625, 3.033203125, 3.59375, 4.154296875, 4.71484375, 5.275390625, 5.8359375, 6.396484375, 6.95703125, 7.517578125, 8.078125, 8.638671875, 9.19921875, 9.759765625, 10.3203125, 10.880859375, 11.44140625, 12.001953125, 12.5625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 4.0, 4.0, 4.0, 3.0, 8.0, 10.0, 18.0, 27.0, 37.0, 72.0, 98.0, 151.0, 158.0, 134.0, 104.0, 62.0, 48.0, 21.0, 14.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.6511001586914, -109.38550567626953, -106.11991119384766, -102.85432434082031, -99.58872985839844, -96.32313537597656, -93.05754089355469, -89.79194641113281, -86.52635192871094, -83.26075744628906, -79.99516296386719, -76.72956848144531, -73.46398162841797, -70.1983871459961, -66.93279266357422, -63.667198181152344, -60.401611328125, -57.136016845703125, -53.870426177978516, -50.60483169555664, -47.33924102783203, -44.073646545410156, -40.80805206298828, -37.542457580566406, -34.2768669128418, -31.011274337768555, -27.745681762695312, -24.480087280273438, -21.214494705200195, -17.948902130126953, -14.683307647705078, -11.417715072631836, -8.152130126953125, -4.886537075042725, -1.6209440231323242, 1.6446495056152344, 4.910242080688477, 8.175834655761719, 11.441429138183594, 14.707021713256836, 17.972614288330078, 21.23820686340332, 24.503799438476562, 27.769393920898438, 31.03498649597168, 34.30057907104492, 37.5661735534668, 40.831764221191406, 44.09735870361328, 47.362953186035156, 50.628543853759766, 53.89413833618164, 57.15972900390625, 60.425323486328125, 63.69091796875, 66.95651245117188, 70.22210693359375, 73.48770141601562, 76.7532958984375, 80.01889038085938, 83.28447723388672, 86.5500717163086, 89.81566619873047, 93.08126068115234, 96.34684753417969]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 9.0, 9.0, 19.0, 20.0, 17.0, 19.0, 25.0, 28.0, 34.0, 39.0, 35.0, 28.0, 49.0, 39.0, 50.0, 42.0, 38.0, 53.0, 53.0, 32.0, 43.0, 27.0, 31.0, 30.0, 36.0, 20.0, 36.0, 26.0, 16.0, 13.0, 14.0, 9.0, 13.0, 5.0, 3.0, 5.0, 10.0, 7.0, 3.0, 4.0, 4.0, 0.0, 5.0, 2.0, 0.0, 1.0], "bins": [-63.84431457519531, -62.00426483154297, -60.16421890258789, -58.32416915893555, -56.4841194152832, -54.644073486328125, -52.80402374267578, -50.96397399902344, -49.123924255371094, -47.28387451171875, -45.44382858276367, -43.60377883911133, -41.763729095458984, -39.923683166503906, -38.08363342285156, -36.24358367919922, -34.403533935546875, -32.56348419189453, -30.72343635559082, -28.88338851928711, -27.043338775634766, -25.203290939331055, -23.363243103027344, -21.523193359375, -19.683147430419922, -17.84309959411621, -16.003049850463867, -14.163002014160156, -12.322952270507812, -10.482904434204102, -8.642855644226074, -6.802806854248047, -4.962757110595703, -3.122708320617676, -1.2826597690582275, 0.5573887825012207, 2.397437572479248, 4.237485885620117, 6.0775346755981445, 7.917583465576172, 9.7576322555542, 11.597681045532227, 13.437729835510254, 15.277778625488281, 17.117826461791992, 18.957874298095703, 20.797924041748047, 22.63797378540039, 24.4780216217041, 26.318069458007812, 28.158119201660156, 29.998167037963867, 31.83821678161621, 33.67826461791992, 35.518314361572266, 37.358360290527344, 39.19841003417969, 41.03845977783203, 42.87850570678711, 44.71855545043945, 46.5586051940918, 48.398651123046875, 50.23870086669922, 52.07875061035156, 53.918800354003906]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 1.0, 5.0, 9.0, 15.0, 14.0, 40.0, 32.0, 43.0, 63.0, 86.0, 152.0, 224.0, 357.0, 630.0, 1129.0, 2143.0, 4005.0, 8379.0, 18828.0, 47030.0, 131872.0, 365076.0, 299671.0, 101172.0, 37063.0, 15785.0, 6884.0, 3504.0, 1876.0, 960.0, 566.0, 335.0, 203.0, 133.0, 93.0, 48.0, 37.0, 22.0, 19.0, 14.0, 10.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.9296875, -9.627685546875, -9.32568359375, -9.023681640625, -8.7216796875, -8.419677734375, -8.11767578125, -7.815673828125, -7.513671875, -7.211669921875, -6.90966796875, -6.607666015625, -6.3056640625, -6.003662109375, -5.70166015625, -5.399658203125, -5.09765625, -4.795654296875, -4.49365234375, -4.191650390625, -3.8896484375, -3.587646484375, -3.28564453125, -2.983642578125, -2.681640625, -2.379638671875, -2.07763671875, -1.775634765625, -1.4736328125, -1.171630859375, -0.86962890625, -0.567626953125, -0.265625, 0.036376953125, 0.33837890625, 0.640380859375, 0.9423828125, 1.244384765625, 1.54638671875, 1.848388671875, 2.150390625, 2.452392578125, 2.75439453125, 3.056396484375, 3.3583984375, 3.660400390625, 3.96240234375, 4.264404296875, 4.56640625, 4.868408203125, 5.17041015625, 5.472412109375, 5.7744140625, 6.076416015625, 6.37841796875, 6.680419921875, 6.982421875, 7.284423828125, 7.58642578125, 7.888427734375, 8.1904296875, 8.492431640625, 8.79443359375, 9.096435546875, 9.3984375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 11.0, 15.0, 18.0, 17.0, 20.0, 19.0, 33.0, 49.0, 42.0, 42.0, 63.0, 73.0, 78.0, 62.0, 64.0, 57.0, 68.0, 55.0, 46.0, 44.0, 25.0, 30.0, 24.0, 14.0, 12.0, 9.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.7421875, -10.4630126953125, -10.183837890625, -9.9046630859375, -9.62548828125, -9.3463134765625, -9.067138671875, -8.7879638671875, -8.5087890625, -8.2296142578125, -7.950439453125, -7.6712646484375, -7.39208984375, -7.1129150390625, -6.833740234375, -6.5545654296875, -6.275390625, -5.9962158203125, -5.717041015625, -5.4378662109375, -5.15869140625, -4.8795166015625, -4.600341796875, -4.3211669921875, -4.0419921875, -3.7628173828125, -3.483642578125, -3.2044677734375, -2.92529296875, -2.6461181640625, -2.366943359375, -2.0877685546875, -1.80859375, -1.5294189453125, -1.250244140625, -0.9710693359375, -0.69189453125, -0.4127197265625, -0.133544921875, 0.1456298828125, 0.4248046875, 0.7039794921875, 0.983154296875, 1.2623291015625, 1.54150390625, 1.8206787109375, 2.099853515625, 2.3790283203125, 2.658203125, 2.9373779296875, 3.216552734375, 3.4957275390625, 3.77490234375, 4.0540771484375, 4.333251953125, 4.6124267578125, 4.8916015625, 5.1707763671875, 5.449951171875, 5.7291259765625, 6.00830078125, 6.2874755859375, 6.566650390625, 6.8458251953125, 7.125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 7.0, 10.0, 17.0, 16.0, 22.0, 25.0, 46.0, 56.0, 65.0, 109.0, 157.0, 204.0, 341.0, 492.0, 905.0, 1793.0, 5360.0, 33022.0, 780183.0, 203256.0, 15524.0, 3505.0, 1327.0, 705.0, 437.0, 266.0, 185.0, 129.0, 107.0, 88.0, 57.0, 32.0, 30.0, 29.0, 21.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.453125, -26.686767578125, -25.92041015625, -25.154052734375, -24.3876953125, -23.621337890625, -22.85498046875, -22.088623046875, -21.322265625, -20.555908203125, -19.78955078125, -19.023193359375, -18.2568359375, -17.490478515625, -16.72412109375, -15.957763671875, -15.19140625, -14.425048828125, -13.65869140625, -12.892333984375, -12.1259765625, -11.359619140625, -10.59326171875, -9.826904296875, -9.060546875, -8.294189453125, -7.52783203125, -6.761474609375, -5.9951171875, -5.228759765625, -4.46240234375, -3.696044921875, -2.9296875, -2.163330078125, -1.39697265625, -0.630615234375, 0.1357421875, 0.902099609375, 1.66845703125, 2.434814453125, 3.201171875, 3.967529296875, 4.73388671875, 5.500244140625, 6.2666015625, 7.032958984375, 7.79931640625, 8.565673828125, 9.33203125, 10.098388671875, 10.86474609375, 11.631103515625, 12.3974609375, 13.163818359375, 13.93017578125, 14.696533203125, 15.462890625, 16.229248046875, 16.99560546875, 17.761962890625, 18.5283203125, 19.294677734375, 20.06103515625, 20.827392578125, 21.59375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 13.0, 7.0, 13.0, 12.0, 10.0, 13.0, 20.0, 16.0, 20.0, 37.0, 41.0, 35.0, 58.0, 62.0, 73.0, 64.0, 57.0, 50.0, 62.0, 47.0, 41.0, 44.0, 47.0, 23.0, 20.0, 14.0, 18.0, 12.0, 16.0, 12.0, 7.0, 10.0, 5.0, 4.0, 0.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.90625, -26.07421875, -25.2421875, -24.41015625, -23.578125, -22.74609375, -21.9140625, -21.08203125, -20.25, -19.41796875, -18.5859375, -17.75390625, -16.921875, -16.08984375, -15.2578125, -14.42578125, -13.59375, -12.76171875, -11.9296875, -11.09765625, -10.265625, -9.43359375, -8.6015625, -7.76953125, -6.9375, -6.10546875, -5.2734375, -4.44140625, -3.609375, -2.77734375, -1.9453125, -1.11328125, -0.28125, 0.55078125, 1.3828125, 2.21484375, 3.046875, 3.87890625, 4.7109375, 5.54296875, 6.375, 7.20703125, 8.0390625, 8.87109375, 9.703125, 10.53515625, 11.3671875, 12.19921875, 13.03125, 13.86328125, 14.6953125, 15.52734375, 16.359375, 17.19140625, 18.0234375, 18.85546875, 19.6875, 20.51953125, 21.3515625, 22.18359375, 23.015625, 23.84765625, 24.6796875, 25.51171875, 26.34375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 13.0, 20.0, 17.0, 34.0, 43.0, 60.0, 81.0, 172.0, 241.0, 600.0, 1421.0, 4405.0, 19561.0, 215394.0, 765153.0, 31567.0, 6270.0, 1916.0, 683.0, 337.0, 182.0, 115.0, 79.0, 54.0, 40.0, 25.0, 11.0, 12.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.44921875, -7.20196533203125, -6.9547119140625, -6.70745849609375, -6.460205078125, -6.21295166015625, -5.9656982421875, -5.71844482421875, -5.47119140625, -5.22393798828125, -4.9766845703125, -4.72943115234375, -4.482177734375, -4.23492431640625, -3.9876708984375, -3.74041748046875, -3.4931640625, -3.24591064453125, -2.9986572265625, -2.75140380859375, -2.504150390625, -2.25689697265625, -2.0096435546875, -1.76239013671875, -1.51513671875, -1.26788330078125, -1.0206298828125, -0.77337646484375, -0.526123046875, -0.27886962890625, -0.0316162109375, 0.21563720703125, 0.462890625, 0.71014404296875, 0.9573974609375, 1.20465087890625, 1.451904296875, 1.69915771484375, 1.9464111328125, 2.19366455078125, 2.44091796875, 2.68817138671875, 2.9354248046875, 3.18267822265625, 3.429931640625, 3.67718505859375, 3.9244384765625, 4.17169189453125, 4.4189453125, 4.66619873046875, 4.9134521484375, 5.16070556640625, 5.407958984375, 5.65521240234375, 5.9024658203125, 6.14971923828125, 6.39697265625, 6.64422607421875, 6.8914794921875, 7.13873291015625, 7.385986328125, 7.63323974609375, 7.8804931640625, 8.12774658203125, 8.375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 15.0, 17.0, 32.0, 68.0, 189.0, 306.0, 152.0, 60.0, 36.0, 23.0, 14.0, 11.0, 6.0, 12.0, 6.0, 4.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0035247802734375, -0.0034376978874206543, -0.0033506155014038086, -0.003263533115386963, -0.003176450729370117, -0.0030893683433532715, -0.0030022859573364258, -0.00291520357131958, -0.0028281211853027344, -0.0027410387992858887, -0.002653956413269043, -0.0025668740272521973, -0.0024797916412353516, -0.002392709255218506, -0.00230562686920166, -0.0022185444831848145, -0.0021314620971679688, -0.002044379711151123, -0.0019572973251342773, -0.0018702149391174316, -0.001783132553100586, -0.0016960501670837402, -0.0016089677810668945, -0.0015218853950500488, -0.0014348030090332031, -0.0013477206230163574, -0.0012606382369995117, -0.001173555850982666, -0.0010864734649658203, -0.0009993910789489746, -0.0009123086929321289, -0.0008252263069152832, -0.0007381439208984375, -0.0006510615348815918, -0.0005639791488647461, -0.0004768967628479004, -0.0003898143768310547, -0.000302731990814209, -0.00021564960479736328, -0.00012856721878051758, -4.1484832763671875e-05, 4.559755325317383e-05, 0.00013267993927001953, 0.00021976232528686523, 0.00030684471130371094, 0.00039392709732055664, 0.00048100948333740234, 0.000568091869354248, 0.0006551742553710938, 0.0007422566413879395, 0.0008293390274047852, 0.0009164214134216309, 0.0010035037994384766, 0.0010905861854553223, 0.001177668571472168, 0.0012647509574890137, 0.0013518333435058594, 0.001438915729522705, 0.0015259981155395508, 0.0016130805015563965, 0.0017001628875732422, 0.0017872452735900879, 0.0018743276596069336, 0.0019614100456237793, 0.002048492431640625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 3.0, 8.0, 14.0, 20.0, 23.0, 43.0, 64.0, 140.0, 244.0, 487.0, 1021.0, 3115.0, 13278.0, 141445.0, 840187.0, 38998.0, 6211.0, 1750.0, 693.0, 376.0, 162.0, 103.0, 58.0, 21.0, 24.0, 21.0, 15.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.0234375, -7.75830078125, -7.4931640625, -7.22802734375, -6.962890625, -6.69775390625, -6.4326171875, -6.16748046875, -5.90234375, -5.63720703125, -5.3720703125, -5.10693359375, -4.841796875, -4.57666015625, -4.3115234375, -4.04638671875, -3.78125, -3.51611328125, -3.2509765625, -2.98583984375, -2.720703125, -2.45556640625, -2.1904296875, -1.92529296875, -1.66015625, -1.39501953125, -1.1298828125, -0.86474609375, -0.599609375, -0.33447265625, -0.0693359375, 0.19580078125, 0.4609375, 0.72607421875, 0.9912109375, 1.25634765625, 1.521484375, 1.78662109375, 2.0517578125, 2.31689453125, 2.58203125, 2.84716796875, 3.1123046875, 3.37744140625, 3.642578125, 3.90771484375, 4.1728515625, 4.43798828125, 4.703125, 4.96826171875, 5.2333984375, 5.49853515625, 5.763671875, 6.02880859375, 6.2939453125, 6.55908203125, 6.82421875, 7.08935546875, 7.3544921875, 7.61962890625, 7.884765625, 8.14990234375, 8.4150390625, 8.68017578125, 8.9453125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 3.0, 3.0, 5.0, 8.0, 9.0, 6.0, 12.0, 20.0, 24.0, 18.0, 20.0, 33.0, 51.0, 50.0, 67.0, 60.0, 85.0, 86.0, 69.0, 58.0, 40.0, 33.0, 34.0, 26.0, 25.0, 27.0, 21.0, 18.0, 23.0, 5.0, 5.0, 8.0, 4.0, 5.0, 9.0, 5.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.833984375, -2.73016357421875, -2.6263427734375, -2.52252197265625, -2.418701171875, -2.31488037109375, -2.2110595703125, -2.10723876953125, -2.00341796875, -1.89959716796875, -1.7957763671875, -1.69195556640625, -1.588134765625, -1.48431396484375, -1.3804931640625, -1.27667236328125, -1.1728515625, -1.06903076171875, -0.9652099609375, -0.86138916015625, -0.757568359375, -0.65374755859375, -0.5499267578125, -0.44610595703125, -0.34228515625, -0.23846435546875, -0.1346435546875, -0.03082275390625, 0.072998046875, 0.17681884765625, 0.2806396484375, 0.38446044921875, 0.48828125, 0.59210205078125, 0.6959228515625, 0.79974365234375, 0.903564453125, 1.00738525390625, 1.1112060546875, 1.21502685546875, 1.31884765625, 1.42266845703125, 1.5264892578125, 1.63031005859375, 1.734130859375, 1.83795166015625, 1.9417724609375, 2.04559326171875, 2.1494140625, 2.25323486328125, 2.3570556640625, 2.46087646484375, 2.564697265625, 2.66851806640625, 2.7723388671875, 2.87615966796875, 2.97998046875, 3.08380126953125, 3.1876220703125, 3.29144287109375, 3.395263671875, 3.49908447265625, 3.6029052734375, 3.70672607421875, 3.810546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 3.0, 28.0, 93.0, 517.0, 240.0, 74.0, 21.0, 12.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-290.7628479003906, -281.60247802734375, -272.44207763671875, -263.2817077636719, -254.121337890625, -244.96096801757812, -235.8005828857422, -226.64019775390625, -217.47982788085938, -208.3194580078125, -199.15907287597656, -189.99868774414062, -180.83831787109375, -171.67794799804688, -162.51756286621094, -153.357177734375, -144.19680786132812, -135.03643798828125, -125.87605285644531, -116.7156753540039, -107.5552978515625, -98.3949203491211, -89.23454284667969, -80.07416534423828, -70.91378784179688, -61.75341033935547, -52.59303283691406, -43.432655334472656, -34.27227783203125, -25.111900329589844, -15.951522827148438, -6.791145324707031, 2.3692626953125, 11.529640197753906, 20.690017700195312, 29.85039520263672, 39.010772705078125, 48.17115020751953, 57.33152770996094, 66.49190521240234, 75.65228271484375, 84.81266021728516, 93.97303771972656, 103.13341522216797, 112.29379272460938, 121.45417022705078, 130.6145477294922, 139.77493286132812, 148.935302734375, 158.09567260742188, 167.2560577392578, 176.41644287109375, 185.57681274414062, 194.7371826171875, 203.89756774902344, 213.05795288085938, 222.21832275390625, 231.37869262695312, 240.53907775878906, 249.699462890625, 258.8598327636719, 268.02020263671875, 277.18060302734375, 286.3409729003906, 295.5013427734375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 10.0, 5.0, 7.0, 10.0, 11.0, 17.0, 17.0, 23.0, 16.0, 19.0, 23.0, 23.0, 24.0, 28.0, 38.0, 39.0, 63.0, 118.0, 124.0, 77.0, 30.0, 28.0, 35.0, 24.0, 26.0, 21.0, 12.0, 20.0, 21.0, 20.0, 14.0, 7.0, 16.0, 7.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-85.82524871826172, -83.22760772705078, -80.62996673583984, -78.03231811523438, -75.43467712402344, -72.8370361328125, -70.23939514160156, -67.64175415039062, -65.04411315917969, -62.44647216796875, -59.84882736206055, -57.25118637084961, -54.653541564941406, -52.05590057373047, -49.45825958251953, -46.860618591308594, -44.262969970703125, -41.66532897949219, -39.067684173583984, -36.47004318237305, -33.872398376464844, -31.274757385253906, -28.67711639404297, -26.0794734954834, -23.481830596923828, -20.884187698364258, -18.286544799804688, -15.68890380859375, -13.09126091003418, -10.49361801147461, -7.8959760665893555, -5.298334121704102, -2.7006912231445312, -0.10304880142211914, 2.494593620300293, 5.092236042022705, 7.689878463745117, 10.287521362304688, 12.885163307189941, 15.482805252075195, 18.080448150634766, 20.678091049194336, 23.275733947753906, 25.873374938964844, 28.471017837524414, 31.068660736083984, 33.66630172729492, 36.263946533203125, 38.86158752441406, 41.459228515625, 44.0568733215332, 46.65451431274414, 49.252159118652344, 51.84980010986328, 54.44744110107422, 57.045082092285156, 59.64272689819336, 62.2403678894043, 64.8380126953125, 67.43565368652344, 70.03329467773438, 72.63093566894531, 75.22858428955078, 77.82622528076172, 80.42386627197266]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 11.0, 6.0, 22.0, 19.0, 49.0, 97.0, 150.0, 337.0, 645.0, 1562.0, 4067.0, 14939.0, 125739.0, 1921525.0, 1977961.0, 123615.0, 16222.0, 4251.0, 1622.0, 709.0, 333.0, 178.0, 100.0, 53.0, 33.0, 14.0, 13.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.546875, -20.0577392578125, -19.568603515625, -19.0794677734375, -18.59033203125, -18.1011962890625, -17.612060546875, -17.1229248046875, -16.6337890625, -16.1446533203125, -15.655517578125, -15.1663818359375, -14.67724609375, -14.1881103515625, -13.698974609375, -13.2098388671875, -12.720703125, -12.2315673828125, -11.742431640625, -11.2532958984375, -10.76416015625, -10.2750244140625, -9.785888671875, -9.2967529296875, -8.8076171875, -8.3184814453125, -7.829345703125, -7.3402099609375, -6.85107421875, -6.3619384765625, -5.872802734375, -5.3836669921875, -4.89453125, -4.4053955078125, -3.916259765625, -3.4271240234375, -2.93798828125, -2.4488525390625, -1.959716796875, -1.4705810546875, -0.9814453125, -0.4923095703125, -0.003173828125, 0.4859619140625, 0.97509765625, 1.4642333984375, 1.953369140625, 2.4425048828125, 2.931640625, 3.4207763671875, 3.909912109375, 4.3990478515625, 4.88818359375, 5.3773193359375, 5.866455078125, 6.3555908203125, 6.8447265625, 7.3338623046875, 7.822998046875, 8.3121337890625, 8.80126953125, 9.2904052734375, 9.779541015625, 10.2686767578125, 10.7578125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 9.0, 6.0, 8.0, 16.0, 15.0, 16.0, 32.0, 47.0, 47.0, 46.0, 58.0, 63.0, 51.0, 79.0, 72.0, 72.0, 68.0, 57.0, 50.0, 33.0, 42.0, 37.0, 21.0, 23.0, 14.0, 5.0, 6.0, 6.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.765625, -10.5037841796875, -10.241943359375, -9.9801025390625, -9.71826171875, -9.4564208984375, -9.194580078125, -8.9327392578125, -8.6708984375, -8.4090576171875, -8.147216796875, -7.8853759765625, -7.62353515625, -7.3616943359375, -7.099853515625, -6.8380126953125, -6.576171875, -6.3143310546875, -6.052490234375, -5.7906494140625, -5.52880859375, -5.2669677734375, -5.005126953125, -4.7432861328125, -4.4814453125, -4.2196044921875, -3.957763671875, -3.6959228515625, -3.43408203125, -3.1722412109375, -2.910400390625, -2.6485595703125, -2.38671875, -2.1248779296875, -1.863037109375, -1.6011962890625, -1.33935546875, -1.0775146484375, -0.815673828125, -0.5538330078125, -0.2919921875, -0.0301513671875, 0.231689453125, 0.4935302734375, 0.75537109375, 1.0172119140625, 1.279052734375, 1.5408935546875, 1.802734375, 2.0645751953125, 2.326416015625, 2.5882568359375, 2.85009765625, 3.1119384765625, 3.373779296875, 3.6356201171875, 3.8974609375, 4.1593017578125, 4.421142578125, 4.6829833984375, 4.94482421875, 5.2066650390625, 5.468505859375, 5.7303466796875, 5.9921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 11.0, 17.0, 13.0, 18.0, 40.0, 55.0, 93.0, 117.0, 211.0, 341.0, 655.0, 1407.0, 4855.0, 54440.0, 4035787.0, 86419.0, 6220.0, 1814.0, 721.0, 402.0, 232.0, 133.0, 84.0, 65.0, 36.0, 27.0, 20.0, 8.0, 10.0, 10.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.0, -42.7265625, -41.453125, -40.1796875, -38.90625, -37.6328125, -36.359375, -35.0859375, -33.8125, -32.5390625, -31.265625, -29.9921875, -28.71875, -27.4453125, -26.171875, -24.8984375, -23.625, -22.3515625, -21.078125, -19.8046875, -18.53125, -17.2578125, -15.984375, -14.7109375, -13.4375, -12.1640625, -10.890625, -9.6171875, -8.34375, -7.0703125, -5.796875, -4.5234375, -3.25, -1.9765625, -0.703125, 0.5703125, 1.84375, 3.1171875, 4.390625, 5.6640625, 6.9375, 8.2109375, 9.484375, 10.7578125, 12.03125, 13.3046875, 14.578125, 15.8515625, 17.125, 18.3984375, 19.671875, 20.9453125, 22.21875, 23.4921875, 24.765625, 26.0390625, 27.3125, 28.5859375, 29.859375, 31.1328125, 32.40625, 33.6796875, 34.953125, 36.2265625, 37.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 8.0, 15.0, 12.0, 31.0, 41.0, 70.0, 141.0, 201.0, 436.0, 727.0, 830.0, 629.0, 364.0, 194.0, 145.0, 82.0, 53.0, 28.0, 16.0, 12.0, 14.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.359375, -28.5068359375, -27.654296875, -26.8017578125, -25.94921875, -25.0966796875, -24.244140625, -23.3916015625, -22.5390625, -21.6865234375, -20.833984375, -19.9814453125, -19.12890625, -18.2763671875, -17.423828125, -16.5712890625, -15.71875, -14.8662109375, -14.013671875, -13.1611328125, -12.30859375, -11.4560546875, -10.603515625, -9.7509765625, -8.8984375, -8.0458984375, -7.193359375, -6.3408203125, -5.48828125, -4.6357421875, -3.783203125, -2.9306640625, -2.078125, -1.2255859375, -0.373046875, 0.4794921875, 1.33203125, 2.1845703125, 3.037109375, 3.8896484375, 4.7421875, 5.5947265625, 6.447265625, 7.2998046875, 8.15234375, 9.0048828125, 9.857421875, 10.7099609375, 11.5625, 12.4150390625, 13.267578125, 14.1201171875, 14.97265625, 15.8251953125, 16.677734375, 17.5302734375, 18.3828125, 19.2353515625, 20.087890625, 20.9404296875, 21.79296875, 22.6455078125, 23.498046875, 24.3505859375, 25.203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 3.0, 2.0, 9.0, 11.0, 44.0, 100.0, 189.0, 271.0, 195.0, 66.0, 45.0, 21.0, 12.0, 7.0, 5.0, 9.0, 4.0, 0.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.5740966796875, -181.1441192626953, -170.7141571044922, -160.2841796875, -149.85421752929688, -139.4242401123047, -128.9942626953125, -118.56430053710938, -108.13433074951172, -97.70436096191406, -87.2743911743164, -76.84442138671875, -66.41444396972656, -55.98447799682617, -45.55450439453125, -35.124534606933594, -24.694564819335938, -14.264594078063965, -3.834623336791992, 6.595348358154297, 17.025318145751953, 27.45528793334961, 37.88526153564453, 48.31523132324219, 58.745201110839844, 69.1751708984375, 79.60514068603516, 90.03511047363281, 100.465087890625, 110.89505004882812, 121.32502746582031, 131.7550048828125, 142.18496704101562, 152.6149444580078, 163.04490661621094, 173.47488403320312, 183.90484619140625, 194.33482360839844, 204.76480102539062, 215.19476318359375, 225.62472534179688, 236.05470275878906, 246.4846649169922, 256.9146423339844, 267.3446044921875, 277.7745666503906, 288.2045593261719, 298.634521484375, 309.06451416015625, 319.4944763183594, 329.9244689941406, 340.35443115234375, 350.7843933105469, 361.21435546875, 371.64434814453125, 382.0743103027344, 392.5042724609375, 402.9342346191406, 413.3642272949219, 423.794189453125, 434.2241516113281, 444.65411376953125, 455.0841064453125, 465.5140686035156, 475.94403076171875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 10.0, 13.0, 11.0, 13.0, 26.0, 28.0, 39.0, 51.0, 47.0, 60.0, 61.0, 76.0, 62.0, 82.0, 71.0, 59.0, 42.0, 42.0, 41.0, 36.0, 30.0, 18.0, 23.0, 16.0, 16.0, 7.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.4095458984375, -147.69061279296875, -142.97169494628906, -138.2527618408203, -133.53384399414062, -128.81491088867188, -124.09597778320312, -119.3770523071289, -114.65812683105469, -109.93920135498047, -105.22027587890625, -100.5013427734375, -95.78241729736328, -91.06349182128906, -86.34455871582031, -81.6256332397461, -76.90670776367188, -72.18778228759766, -67.46885681152344, -62.74992370605469, -58.03099822998047, -53.31207275390625, -48.593143463134766, -43.87421417236328, -39.15528869628906, -34.436363220214844, -29.71743392944336, -24.998506546020508, -20.279579162597656, -15.560651779174805, -10.841724395751953, -6.122795104980469, -1.4038848876953125, 3.315042495727539, 8.03396987915039, 12.752897262573242, 17.471824645996094, 22.190752029418945, 26.909679412841797, 31.62860870361328, 36.3475341796875, 41.06645965576172, 45.7853889465332, 50.50431823730469, 55.223243713378906, 59.942169189453125, 64.66110229492188, 69.3800277709961, 74.09895324707031, 78.81787872314453, 83.53680419921875, 88.2557373046875, 92.97466278076172, 97.69358825683594, 102.41252136230469, 107.1314468383789, 111.85037231445312, 116.56929779052734, 121.28822326660156, 126.00715637207031, 130.72607421875, 135.44500732421875, 140.1639404296875, 144.88287353515625, 149.60179138183594]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 19.0, 24.0, 28.0, 42.0, 85.0, 119.0, 254.0, 479.0, 914.0, 1849.0, 4196.0, 10534.0, 33370.0, 154210.0, 657863.0, 136662.0, 30449.0, 9797.0, 4002.0, 1790.0, 859.0, 402.0, 246.0, 140.0, 71.0, 57.0, 22.0, 9.0, 16.0, 10.0, 14.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-11.1484375, -10.8153076171875, -10.482177734375, -10.1490478515625, -9.81591796875, -9.4827880859375, -9.149658203125, -8.8165283203125, -8.4833984375, -8.1502685546875, -7.817138671875, -7.4840087890625, -7.15087890625, -6.8177490234375, -6.484619140625, -6.1514892578125, -5.818359375, -5.4852294921875, -5.152099609375, -4.8189697265625, -4.48583984375, -4.1527099609375, -3.819580078125, -3.4864501953125, -3.1533203125, -2.8201904296875, -2.487060546875, -2.1539306640625, -1.82080078125, -1.4876708984375, -1.154541015625, -0.8214111328125, -0.48828125, -0.1551513671875, 0.177978515625, 0.5111083984375, 0.84423828125, 1.1773681640625, 1.510498046875, 1.8436279296875, 2.1767578125, 2.5098876953125, 2.843017578125, 3.1761474609375, 3.50927734375, 3.8424072265625, 4.175537109375, 4.5086669921875, 4.841796875, 5.1749267578125, 5.508056640625, 5.8411865234375, 6.17431640625, 6.5074462890625, 6.840576171875, 7.1737060546875, 7.5068359375, 7.8399658203125, 8.173095703125, 8.5062255859375, 8.83935546875, 9.1724853515625, 9.505615234375, 9.8387451171875, 10.171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 9.0, 9.0, 22.0, 28.0, 22.0, 39.0, 65.0, 65.0, 70.0, 84.0, 82.0, 87.0, 72.0, 81.0, 62.0, 55.0, 44.0, 23.0, 19.0, 22.0, 9.0, 10.0, 12.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.576416015625, -9.20751953125, -8.838623046875, -8.4697265625, -8.100830078125, -7.73193359375, -7.363037109375, -6.994140625, -6.625244140625, -6.25634765625, -5.887451171875, -5.5185546875, -5.149658203125, -4.78076171875, -4.411865234375, -4.04296875, -3.674072265625, -3.30517578125, -2.936279296875, -2.5673828125, -2.198486328125, -1.82958984375, -1.460693359375, -1.091796875, -0.722900390625, -0.35400390625, 0.014892578125, 0.3837890625, 0.752685546875, 1.12158203125, 1.490478515625, 1.859375, 2.228271484375, 2.59716796875, 2.966064453125, 3.3349609375, 3.703857421875, 4.07275390625, 4.441650390625, 4.810546875, 5.179443359375, 5.54833984375, 5.917236328125, 6.2861328125, 6.655029296875, 7.02392578125, 7.392822265625, 7.76171875, 8.130615234375, 8.49951171875, 8.868408203125, 9.2373046875, 9.606201171875, 9.97509765625, 10.343994140625, 10.712890625, 11.081787109375, 11.45068359375, 11.819580078125, 12.1884765625, 12.557373046875, 12.92626953125, 13.295166015625, 13.6640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 13.0, 16.0, 25.0, 28.0, 36.0, 47.0, 86.0, 111.0, 159.0, 263.0, 458.0, 1051.0, 3338.0, 22980.0, 883171.0, 124556.0, 8757.0, 1783.0, 689.0, 350.0, 189.0, 129.0, 81.0, 61.0, 47.0, 32.0, 26.0, 16.0, 14.0, 7.0, 7.0, 5.0, 6.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.578125, -15.0880126953125, -14.597900390625, -14.1077880859375, -13.61767578125, -13.1275634765625, -12.637451171875, -12.1473388671875, -11.6572265625, -11.1671142578125, -10.677001953125, -10.1868896484375, -9.69677734375, -9.2066650390625, -8.716552734375, -8.2264404296875, -7.736328125, -7.2462158203125, -6.756103515625, -6.2659912109375, -5.77587890625, -5.2857666015625, -4.795654296875, -4.3055419921875, -3.8154296875, -3.3253173828125, -2.835205078125, -2.3450927734375, -1.85498046875, -1.3648681640625, -0.874755859375, -0.3846435546875, 0.10546875, 0.5955810546875, 1.085693359375, 1.5758056640625, 2.06591796875, 2.5560302734375, 3.046142578125, 3.5362548828125, 4.0263671875, 4.5164794921875, 5.006591796875, 5.4967041015625, 5.98681640625, 6.4769287109375, 6.967041015625, 7.4571533203125, 7.947265625, 8.4373779296875, 8.927490234375, 9.4176025390625, 9.90771484375, 10.3978271484375, 10.887939453125, 11.3780517578125, 11.8681640625, 12.3582763671875, 12.848388671875, 13.3385009765625, 13.82861328125, 14.3187255859375, 14.808837890625, 15.2989501953125, 15.7890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 8.0, 5.0, 4.0, 12.0, 13.0, 7.0, 11.0, 14.0, 23.0, 18.0, 27.0, 22.0, 35.0, 47.0, 42.0, 47.0, 58.0, 63.0, 68.0, 80.0, 72.0, 42.0, 43.0, 26.0, 24.0, 29.0, 24.0, 22.0, 18.0, 18.0, 12.0, 8.0, 12.0, 7.0, 7.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.125, -21.40283203125, -20.6806640625, -19.95849609375, -19.236328125, -18.51416015625, -17.7919921875, -17.06982421875, -16.34765625, -15.62548828125, -14.9033203125, -14.18115234375, -13.458984375, -12.73681640625, -12.0146484375, -11.29248046875, -10.5703125, -9.84814453125, -9.1259765625, -8.40380859375, -7.681640625, -6.95947265625, -6.2373046875, -5.51513671875, -4.79296875, -4.07080078125, -3.3486328125, -2.62646484375, -1.904296875, -1.18212890625, -0.4599609375, 0.26220703125, 0.984375, 1.70654296875, 2.4287109375, 3.15087890625, 3.873046875, 4.59521484375, 5.3173828125, 6.03955078125, 6.76171875, 7.48388671875, 8.2060546875, 8.92822265625, 9.650390625, 10.37255859375, 11.0947265625, 11.81689453125, 12.5390625, 13.26123046875, 13.9833984375, 14.70556640625, 15.427734375, 16.14990234375, 16.8720703125, 17.59423828125, 18.31640625, 19.03857421875, 19.7607421875, 20.48291015625, 21.205078125, 21.92724609375, 22.6494140625, 23.37158203125, 24.09375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 14.0, 9.0, 18.0, 25.0, 26.0, 34.0, 52.0, 99.0, 117.0, 207.0, 339.0, 724.0, 1734.0, 5374.0, 26546.0, 893309.0, 102813.0, 11758.0, 3080.0, 1051.0, 489.0, 246.0, 151.0, 100.0, 59.0, 46.0, 20.0, 22.0, 23.0, 14.0, 8.0, 7.0, 2.0, 7.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.666015625, -2.576446533203125, -2.48687744140625, -2.397308349609375, -2.3077392578125, -2.218170166015625, -2.12860107421875, -2.039031982421875, -1.949462890625, -1.859893798828125, -1.77032470703125, -1.680755615234375, -1.5911865234375, -1.501617431640625, -1.41204833984375, -1.322479248046875, -1.23291015625, -1.143341064453125, -1.05377197265625, -0.964202880859375, -0.8746337890625, -0.785064697265625, -0.69549560546875, -0.605926513671875, -0.516357421875, -0.426788330078125, -0.33721923828125, -0.247650146484375, -0.1580810546875, -0.068511962890625, 0.02105712890625, 0.110626220703125, 0.2001953125, 0.289764404296875, 0.37933349609375, 0.468902587890625, 0.5584716796875, 0.648040771484375, 0.73760986328125, 0.827178955078125, 0.916748046875, 1.006317138671875, 1.09588623046875, 1.185455322265625, 1.2750244140625, 1.364593505859375, 1.45416259765625, 1.543731689453125, 1.63330078125, 1.722869873046875, 1.81243896484375, 1.902008056640625, 1.9915771484375, 2.081146240234375, 2.17071533203125, 2.260284423828125, 2.349853515625, 2.439422607421875, 2.52899169921875, 2.618560791015625, 2.7081298828125, 2.797698974609375, 2.88726806640625, 2.976837158203125, 3.06640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 4.0, 3.0, 9.0, 10.0, 9.0, 18.0, 18.0, 33.0, 39.0, 66.0, 170.0, 220.0, 149.0, 84.0, 46.0, 19.0, 26.0, 21.0, 11.0, 12.0, 5.0, 10.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008778572082519531, -0.0008499771356582642, -0.0008220970630645752, -0.0007942169904708862, -0.0007663369178771973, -0.0007384568452835083, -0.0007105767726898193, -0.0006826967000961304, -0.0006548166275024414, -0.0006269365549087524, -0.0005990564823150635, -0.0005711764097213745, -0.0005432963371276855, -0.0005154162645339966, -0.0004875361919403076, -0.00045965611934661865, -0.0004317760467529297, -0.0004038959741592407, -0.00037601590156555176, -0.0003481358289718628, -0.00032025575637817383, -0.00029237568378448486, -0.0002644956111907959, -0.00023661553859710693, -0.00020873546600341797, -0.000180855393409729, -0.00015297532081604004, -0.00012509524822235107, -9.721517562866211e-05, -6.933510303497314e-05, -4.145503044128418e-05, -1.3574957847595215e-05, 1.430511474609375e-05, 4.2185187339782715e-05, 7.006525993347168e-05, 9.794533252716064e-05, 0.0001258254051208496, 0.00015370547771453857, 0.00018158555030822754, 0.0002094656229019165, 0.00023734569549560547, 0.00026522576808929443, 0.0002931058406829834, 0.00032098591327667236, 0.00034886598587036133, 0.0003767460584640503, 0.00040462613105773926, 0.0004325062036514282, 0.0004603862762451172, 0.00048826634883880615, 0.0005161464214324951, 0.0005440264940261841, 0.000571906566619873, 0.000599786639213562, 0.000627666711807251, 0.0006555467844009399, 0.0006834268569946289, 0.0007113069295883179, 0.0007391870021820068, 0.0007670670747756958, 0.0007949471473693848, 0.0008228272199630737, 0.0008507072925567627, 0.0008785873651504517, 0.0009064674377441406]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 11.0, 15.0, 21.0, 19.0, 29.0, 66.0, 88.0, 149.0, 201.0, 386.0, 691.0, 1188.0, 2567.0, 5680.0, 15600.0, 66203.0, 840785.0, 84377.0, 18114.0, 6504.0, 2738.0, 1327.0, 707.0, 398.0, 227.0, 159.0, 111.0, 65.0, 40.0, 26.0, 20.0, 16.0, 7.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.845703125, -1.78326416015625, -1.7208251953125, -1.65838623046875, -1.595947265625, -1.53350830078125, -1.4710693359375, -1.40863037109375, -1.34619140625, -1.28375244140625, -1.2213134765625, -1.15887451171875, -1.096435546875, -1.03399658203125, -0.9715576171875, -0.90911865234375, -0.8466796875, -0.78424072265625, -0.7218017578125, -0.65936279296875, -0.596923828125, -0.53448486328125, -0.4720458984375, -0.40960693359375, -0.34716796875, -0.28472900390625, -0.2222900390625, -0.15985107421875, -0.097412109375, -0.03497314453125, 0.0274658203125, 0.08990478515625, 0.15234375, 0.21478271484375, 0.2772216796875, 0.33966064453125, 0.402099609375, 0.46453857421875, 0.5269775390625, 0.58941650390625, 0.65185546875, 0.71429443359375, 0.7767333984375, 0.83917236328125, 0.901611328125, 0.96405029296875, 1.0264892578125, 1.08892822265625, 1.1513671875, 1.21380615234375, 1.2762451171875, 1.33868408203125, 1.401123046875, 1.46356201171875, 1.5260009765625, 1.58843994140625, 1.65087890625, 1.71331787109375, 1.7757568359375, 1.83819580078125, 1.900634765625, 1.96307373046875, 2.0255126953125, 2.08795166015625, 2.150390625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 7.0, 3.0, 5.0, 8.0, 10.0, 10.0, 10.0, 22.0, 24.0, 24.0, 30.0, 47.0, 70.0, 90.0, 140.0, 127.0, 88.0, 81.0, 52.0, 30.0, 22.0, 23.0, 14.0, 10.0, 12.0, 10.0, 9.0, 8.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84765625, -1.786041259765625, -1.72442626953125, -1.662811279296875, -1.6011962890625, -1.539581298828125, -1.47796630859375, -1.416351318359375, -1.354736328125, -1.293121337890625, -1.23150634765625, -1.169891357421875, -1.1082763671875, -1.046661376953125, -0.98504638671875, -0.923431396484375, -0.86181640625, -0.800201416015625, -0.73858642578125, -0.676971435546875, -0.6153564453125, -0.553741455078125, -0.49212646484375, -0.430511474609375, -0.368896484375, -0.307281494140625, -0.24566650390625, -0.184051513671875, -0.1224365234375, -0.060821533203125, 0.00079345703125, 0.062408447265625, 0.1240234375, 0.185638427734375, 0.24725341796875, 0.308868408203125, 0.3704833984375, 0.432098388671875, 0.49371337890625, 0.555328369140625, 0.616943359375, 0.678558349609375, 0.74017333984375, 0.801788330078125, 0.8634033203125, 0.925018310546875, 0.98663330078125, 1.048248291015625, 1.10986328125, 1.171478271484375, 1.23309326171875, 1.294708251953125, 1.3563232421875, 1.417938232421875, 1.47955322265625, 1.541168212890625, 1.602783203125, 1.664398193359375, 1.72601318359375, 1.787628173828125, 1.8492431640625, 1.910858154296875, 1.97247314453125, 2.034088134765625, 2.095703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 16.0, 28.0, 56.0, 110.0, 573.0, 109.0, 46.0, 27.0, 19.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-166.68460083007812, -162.76943969726562, -158.8542938232422, -154.9391326904297, -151.0239715576172, -147.10882568359375, -143.19366455078125, -139.27850341796875, -135.36334228515625, -131.44818115234375, -127.53302764892578, -123.61787414550781, -119.70271301269531, -115.78755950927734, -111.87240600585938, -107.95724487304688, -104.04209899902344, -100.12694549560547, -96.21178436279297, -92.296630859375, -88.3814697265625, -84.46631622314453, -80.55116271972656, -76.63600158691406, -72.7208480834961, -68.80569458007812, -64.89053344726562, -60.975379943847656, -57.06022262573242, -53.14506530761719, -49.22991180419922, -45.314754486083984, -41.39960479736328, -37.48444747924805, -33.56929016113281, -29.654136657714844, -25.73897933959961, -21.823822021484375, -17.908666610717773, -13.993511199951172, -10.078353881835938, -6.1631975173950195, -2.2480411529541016, 1.6671152114868164, 5.582271575927734, 9.497428894042969, 13.41258430480957, 17.327739715576172, 21.242897033691406, 25.15805435180664, 29.073209762573242, 32.988365173339844, 36.90352249145508, 40.81867980957031, 44.73383331298828, 48.648990631103516, 52.56414794921875, 56.479305267333984, 60.39446258544922, 64.30961608886719, 68.22477722167969, 72.13993072509766, 76.05508422851562, 79.97024536132812, 83.8853988647461]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 3.0, 12.0, 8.0, 13.0, 11.0, 21.0, 14.0, 17.0, 16.0, 16.0, 19.0, 19.0, 20.0, 31.0, 37.0, 148.0, 263.0, 85.0, 27.0, 28.0, 19.0, 23.0, 24.0, 20.0, 15.0, 15.0, 14.0, 10.0, 8.0, 6.0, 11.0, 2.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.65248107910156, -64.59014892578125, -62.52781677246094, -60.465484619140625, -58.40315246582031, -56.3408203125, -54.27848815917969, -52.216156005859375, -50.15382385253906, -48.09149169921875, -46.02915954589844, -43.966827392578125, -41.90449523925781, -39.8421630859375, -37.77983093261719, -35.717498779296875, -33.65517044067383, -31.592838287353516, -29.530506134033203, -27.46817398071289, -25.405841827392578, -23.343509674072266, -21.281179428100586, -19.218847274780273, -17.15651512145996, -15.094182968139648, -13.031850814819336, -10.96951961517334, -8.907187461853027, -6.844855308532715, -4.782524108886719, -2.7201919555664062, -0.6578598022460938, 1.4044721126556396, 3.466804027557373, 5.529135704040527, 7.59146785736084, 9.653800010681152, 11.716131210327148, 13.778463363647461, 15.840795516967773, 17.903127670288086, 19.9654598236084, 22.027790069580078, 24.09012222290039, 26.152454376220703, 28.214786529541016, 30.277118682861328, 32.33945083618164, 34.40178298950195, 36.464115142822266, 38.52644729614258, 40.58877944946289, 42.6511116027832, 44.71343994140625, 46.77577209472656, 48.838104248046875, 50.90043640136719, 52.9627685546875, 55.02510070800781, 57.087432861328125, 59.14976501464844, 61.21209716796875, 63.27442932128906, 65.33676147460938]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 8.0, 7.0, 13.0, 17.0, 18.0, 26.0, 28.0, 44.0, 45.0, 39.0, 140.0, 274.0, 81.0, 55.0, 45.0, 27.0, 29.0, 22.0, 18.0, 17.0, 15.0, 3.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.578125, -9.2801513671875, -8.982177734375, -8.6842041015625, -8.38623046875, -8.0882568359375, -7.790283203125, -7.4923095703125, -7.1943359375, -6.8963623046875, -6.598388671875, -6.3004150390625, -6.00244140625, -5.7044677734375, -5.406494140625, -5.1085205078125, -4.810546875, -4.5125732421875, -4.214599609375, -3.9166259765625, -3.61865234375, -3.3206787109375, -3.022705078125, -2.7247314453125, -2.4267578125, -2.1287841796875, -1.830810546875, -1.5328369140625, -1.23486328125, -0.9368896484375, -0.638916015625, -0.3409423828125, -0.04296875, 0.2550048828125, 0.552978515625, 0.8509521484375, 1.14892578125, 1.4468994140625, 1.744873046875, 2.0428466796875, 2.3408203125, 2.6387939453125, 2.936767578125, 3.2347412109375, 3.53271484375, 3.8306884765625, 4.128662109375, 4.4266357421875, 4.724609375, 5.0225830078125, 5.320556640625, 5.6185302734375, 5.91650390625, 6.2144775390625, 6.512451171875, 6.8104248046875, 7.1083984375, 7.4063720703125, 7.704345703125, 8.0023193359375, 8.30029296875, 8.5982666015625, 8.896240234375, 9.1942138671875, 9.4921875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 3.0, 10.0, 2.0, 5.0, 6.0, 13.0, 11.0, 27.0, 33.0, 69.0, 112.0, 190.0, 365.0, 875.0, 3021.0, 20213.0, 8346843.0, 12815.0, 2378.0, 753.0, 367.0, 153.0, 92.0, 82.0, 46.0, 34.0, 17.0, 14.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-83.78472900390625, -81.27714538574219, -78.76956176757812, -76.2619857788086, -73.75440216064453, -71.24681854248047, -68.73924255371094, -66.23165893554688, -63.72407531738281, -61.21649169921875, -58.70891189575195, -56.201332092285156, -53.693748474121094, -51.18616485595703, -48.678585052490234, -46.17100524902344, -43.663421630859375, -41.15583801269531, -38.648258209228516, -36.14067840576172, -33.633094787597656, -31.125513076782227, -28.617931365966797, -26.110349655151367, -23.602767944335938, -21.095186233520508, -18.587604522705078, -16.08002281188965, -13.572441101074219, -11.064859390258789, -8.55727767944336, -6.04969596862793, -3.5421066284179688, -1.034524917602539, 1.4730567932128906, 3.9806385040283203, 6.48822021484375, 8.99580192565918, 11.50338363647461, 14.010965347290039, 16.51854705810547, 19.0261287689209, 21.533710479736328, 24.041292190551758, 26.548873901367188, 29.056455612182617, 31.564037322998047, 34.071617126464844, 36.579200744628906, 39.08678436279297, 41.594364166259766, 44.10194396972656, 46.609527587890625, 49.11711120605469, 51.624691009521484, 54.13227081298828, 56.639854431152344, 59.147438049316406, 61.6550178527832, 64.16259765625, 66.67018127441406, 69.17776489257812, 71.68534851074219, 74.19292449951172, 76.70050811767578]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 9.0, 3.0, 3.0, 9.0, 4.0, 3.0, 3.0, 6.0, 4.0, 7.0, 3.0, 2.0, 5.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-91.52945709228516, -87.53781127929688, -83.54617309570312, -79.55453491210938, -75.5628890991211, -71.57124328613281, -67.57960510253906, -63.58796310424805, -59.59632110595703, -55.604679107666016, -51.613037109375, -47.621395111083984, -43.62975311279297, -39.63811111450195, -35.64646911621094, -31.654827117919922, -27.663185119628906, -23.67154312133789, -19.679901123046875, -15.68825912475586, -11.696617126464844, -7.704975128173828, -3.7133331298828125, 0.2783088684082031, 4.269950866699219, 8.261592864990234, 12.25323486328125, 16.244876861572266, 20.23651885986328, 24.228160858154297, 28.219802856445312, 32.21144485473633, 36.203094482421875, 40.19473648071289, 44.186378479003906, 48.17802047729492, 52.16966247558594, 56.16130447387695, 60.15294647216797, 64.14459228515625, 68.13623046875, 72.12786865234375, 76.11951446533203, 80.11116027832031, 84.10279846191406, 88.09443664550781, 92.0860824584961, 96.07772827148438, 100.06936645507812, 104.06100463867188, 108.05265045166016, 112.04429626464844, 116.03593444824219, 120.02757263183594, 124.01921844482422, 128.0108642578125, 132.00250244140625, 135.994140625, 139.98577880859375, 143.97743225097656, 147.9690704345703, 151.96070861816406, 155.95236206054688, 159.94400024414062, 163.93563842773438]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 6.0, 13.0, 14.0, 17.0, 31.0, 48.0, 47.0, 88.0, 130.0, 204.0, 306.0, 502.0, 863.0, 1681.0, 3483.0, 8300.0, 23164.0, 69405.0, 191181.0, 147907.0, 48317.0, 16064.0, 6263.0, 2656.0, 1370.0, 757.0, 461.0, 313.0, 182.0, 140.0, 92.0, 72.0, 53.0, 35.0, 22.0, 21.0, 12.0, 9.0, 3.0, 10.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.6875, -46.873046875, -45.05859375, -43.244140625, -41.4296875, -39.615234375, -37.80078125, -35.986328125, -34.171875, -32.357421875, -30.54296875, -28.728515625, -26.9140625, -25.099609375, -23.28515625, -21.470703125, -19.65625, -17.841796875, -16.02734375, -14.212890625, -12.3984375, -10.583984375, -8.76953125, -6.955078125, -5.140625, -3.326171875, -1.51171875, 0.302734375, 2.1171875, 3.931640625, 5.74609375, 7.560546875, 9.375, 11.189453125, 13.00390625, 14.818359375, 16.6328125, 18.447265625, 20.26171875, 22.076171875, 23.890625, 25.705078125, 27.51953125, 29.333984375, 31.1484375, 32.962890625, 34.77734375, 36.591796875, 38.40625, 40.220703125, 42.03515625, 43.849609375, 45.6640625, 47.478515625, 49.29296875, 51.107421875, 52.921875, 54.736328125, 56.55078125, 58.365234375, 60.1796875, 61.994140625, 63.80859375, 65.623046875, 67.4375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 5.0, 9.0, 10.0, 13.0, 20.0, 26.0, 39.0, 56.0, 53.0, 67.0, 85.0, 97.0, 82.0, 85.0, 78.0, 63.0, 39.0, 33.0, 28.0, 25.0, 13.0, 15.0, 16.0, 12.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9453125, -8.59033203125, -8.2353515625, -7.88037109375, -7.525390625, -7.17041015625, -6.8154296875, -6.46044921875, -6.10546875, -5.75048828125, -5.3955078125, -5.04052734375, -4.685546875, -4.33056640625, -3.9755859375, -3.62060546875, -3.265625, -2.91064453125, -2.5556640625, -2.20068359375, -1.845703125, -1.49072265625, -1.1357421875, -0.78076171875, -0.42578125, -0.07080078125, 0.2841796875, 0.63916015625, 0.994140625, 1.34912109375, 1.7041015625, 2.05908203125, 2.4140625, 2.76904296875, 3.1240234375, 3.47900390625, 3.833984375, 4.18896484375, 4.5439453125, 4.89892578125, 5.25390625, 5.60888671875, 5.9638671875, 6.31884765625, 6.673828125, 7.02880859375, 7.3837890625, 7.73876953125, 8.09375, 8.44873046875, 8.8037109375, 9.15869140625, 9.513671875, 9.86865234375, 10.2236328125, 10.57861328125, 10.93359375, 11.28857421875, 11.6435546875, 11.99853515625, 12.353515625, 12.70849609375, 13.0634765625, 13.41845703125, 13.7734375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 8.0, 4.0, 9.0, 17.0, 51.0, 87.0, 135.0, 87.0, 33.0, 14.0, 11.0, 6.0, 5.0, 8.0, 6.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.61805725097656, -107.09553527832031, -103.57301330566406, -100.05049133300781, -96.52796936035156, -93.00544738769531, -89.48291778564453, -85.96039581298828, -82.43787384033203, -78.91535186767578, -75.39282989501953, -71.87030792236328, -68.3477783203125, -64.82525634765625, -61.302734375, -57.78021240234375, -54.2576904296875, -50.73516845703125, -47.212646484375, -43.690120697021484, -40.167598724365234, -36.645076751708984, -33.12255096435547, -29.60002899169922, -26.07750701904297, -22.55498504638672, -19.032461166381836, -15.50993824005127, -11.987415313720703, -8.464893341064453, -4.94236946105957, -1.4198455810546875, 2.1026840209960938, 5.62520694732666, 9.147729873657227, 12.670252799987793, 16.19277572631836, 19.71529769897461, 23.237821578979492, 26.760345458984375, 30.282867431640625, 33.805389404296875, 37.327911376953125, 40.85043716430664, 44.37295913696289, 47.89548110961914, 51.418006896972656, 54.940528869628906, 58.463050842285156, 61.985572814941406, 65.50809478759766, 69.0306167602539, 72.55314636230469, 76.07566833496094, 79.59819030761719, 83.12071228027344, 86.64323425292969, 90.16575622558594, 93.68827819824219, 97.21080017089844, 100.73332214355469, 104.25584411621094, 107.77837371826172, 111.30089569091797, 114.82341766357422]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 6.0, 8.0, 7.0, 10.0, 21.0, 18.0, 44.0, 57.0, 66.0, 78.0, 55.0, 25.0, 13.0, 10.0, 12.0, 5.0, 7.0, 6.0, 7.0, 8.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.90000915527344, -62.269432067871094, -60.638858795166016, -59.00828170776367, -57.377708435058594, -55.74713134765625, -54.116554260253906, -52.48597717285156, -50.855403900146484, -49.22482681274414, -47.59425354003906, -45.96367645263672, -44.333099365234375, -42.7025260925293, -41.07194900512695, -39.441375732421875, -37.81079864501953, -36.18022155761719, -34.54964828491211, -32.919071197509766, -31.288496017456055, -29.657920837402344, -28.02734375, -26.39676856994629, -24.766193389892578, -23.135618209838867, -21.505043029785156, -19.874465942382812, -18.2438907623291, -16.61331558227539, -14.982739448547363, -13.352163314819336, -11.72159194946289, -10.09101676940918, -8.460440635681152, -6.829864978790283, -5.199289321899414, -3.568714141845703, -1.9381380081176758, -0.30756187438964844, 1.3230133056640625, 2.9535889625549316, 4.584164619445801, 6.21474027633667, 7.845315933227539, 9.47589111328125, 11.106467247009277, 12.737043380737305, 14.367618560791016, 15.998193740844727, 17.628768920898438, 19.25934600830078, 20.889921188354492, 22.520496368408203, 24.151073455810547, 25.781648635864258, 27.41222381591797, 29.04279899597168, 30.67337417602539, 32.303951263427734, 33.93452453613281, 35.565101623535156, 37.1956787109375, 38.826255798339844, 40.45682907104492]}, "eval/loss": 5.21882963180542, "eval/wer": 0.9237653034902871, "eval/runtime": 426.2702, "eval/samples_per_second": 6.198, "eval/steps_per_second": 0.389} \ No newline at end of file +{"train/loss": 3.7537, "train/learning_rate": 1.7341040462427747e-08, "train/epoch": 20.0, "train/global_step": 4460, "_runtime": 83793, "_timestamp": 1646818761, "_step": 4462, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 5.0, 4.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 94.0, 92.0, 33.0, 16.0, 7.0, 7.0, 15.0, 7.0, 5.0, 6.0, 29752.0, 269.0, 65.0, 35.0, 23.0, 13.0, 4.0, 6.0, 9.0, 0.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-29.359375, -28.677490234375, -27.99560546875, -27.313720703125, -26.6318359375, -25.949951171875, -25.26806640625, -24.586181640625, -23.904296875, -23.222412109375, -22.54052734375, -21.858642578125, -21.1767578125, -20.494873046875, -19.81298828125, -19.131103515625, -18.44921875, -17.767333984375, -17.08544921875, -16.403564453125, -15.7216796875, -15.039794921875, -14.35791015625, -13.676025390625, -12.994140625, -12.312255859375, -11.63037109375, -10.948486328125, -10.2666015625, -9.584716796875, -8.90283203125, -8.220947265625, -7.5390625, -6.857177734375, -6.17529296875, -5.493408203125, -4.8115234375, -4.129638671875, -3.44775390625, -2.765869140625, -2.083984375, -1.402099609375, -0.72021484375, -0.038330078125, 0.6435546875, 1.325439453125, 2.00732421875, 2.689208984375, 3.37109375, 4.052978515625, 4.73486328125, 5.416748046875, 6.0986328125, 6.780517578125, 7.46240234375, 8.144287109375, 8.826171875, 9.508056640625, 10.18994140625, 10.871826171875, 11.5537109375, 12.235595703125, 12.91748046875, 13.599365234375, 14.28125]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 8.0, 10.0, 12.0, 14.0, 11.0, 12.0, 16.0, 24.0, 24.0, 18.0, 33.0, 35.0, 32.0, 50.0, 42.0, 35.0, 48.0, 41.0, 48.0, 48.0, 51.0, 44.0, 42.0, 55.0, 35.0, 34.0, 25.0, 26.0, 24.0, 24.0, 16.0, 15.0, 13.0, 12.0, 6.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.739181518554688, -15.377793312072754, -15.01640510559082, -14.655016899108887, -14.293628692626953, -13.932239532470703, -13.57085132598877, -13.209463119506836, -12.848074913024902, -12.486686706542969, -12.125298500061035, -11.763910293579102, -11.402521133422852, -11.041132926940918, -10.679744720458984, -10.31835651397705, -9.956968307495117, -9.595580101013184, -9.23419189453125, -8.872803688049316, -8.511415481567383, -8.150026321411133, -7.788638114929199, -7.427249908447266, -7.065861701965332, -6.704473495483398, -6.343085289001465, -5.981696605682373, -5.6203083992004395, -5.258920192718506, -4.897531509399414, -4.5361433029174805, -4.174756050109863, -3.8133678436279297, -3.451979398727417, -3.0905909538269043, -2.7292027473449707, -2.367814540863037, -2.0064260959625244, -1.6450376510620117, -1.2836494445800781, -0.922261118888855, -0.5608727931976318, -0.1994844675064087, 0.16190385818481445, 0.5232921838760376, 0.8846805095672607, 1.2460689544677734, 1.607457160949707, 1.9688454866409302, 2.3302338123321533, 2.691622257232666, 3.0530104637145996, 3.414398670196533, 3.775787115097046, 4.137175559997559, 4.498563766479492, 4.859951972961426, 5.221340179443359, 5.582728862762451, 5.944117069244385, 6.305505275726318, 6.66689395904541, 7.028282165527344, 7.389670372009277]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 9.0, 9.0, 9.0, 7.0, 13.0, 16.0, 15.0, 21.0, 22.0, 32.0, 33.0, 36.0, 34.0, 45.0, 48.0, 41.0, 46.0, 45.0, 34.0, 46.0, 41.0, 56.0, 37.0, 35.0, 41.0, 36.0, 39.0, 24.0, 14.0, 24.0, 10.0, 17.0, 12.0, 10.0, 6.0, 12.0, 7.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0720853805542, -9.721322059631348, -9.370558738708496, -9.019794464111328, -8.669031143188477, -8.318267822265625, -7.967504501342773, -7.616741180419922, -7.265977382659912, -6.9152140617370605, -6.564450263977051, -6.213686943054199, -5.862923622131348, -5.512159824371338, -5.161396503448486, -4.810632705688477, -4.459869384765625, -4.109106063842773, -3.7583422660827637, -3.407578945159912, -3.0568153858184814, -2.706051826477051, -2.355288505554199, -2.0045249462127686, -1.653761386871338, -1.3029978275299072, -0.9522343873977661, -0.601470947265625, -0.25070738792419434, 0.10005617141723633, 0.4508194923400879, 0.8015830516815186, 1.1523475646972656, 1.5031111240386963, 1.8538745641708374, 2.2046380043029785, 2.555401563644409, 2.90616512298584, 3.2569284439086914, 3.607692003250122, 3.9584555625915527, 4.309218883514404, 4.659982681274414, 5.010746002197266, 5.361509323120117, 5.712273120880127, 6.0630364418029785, 6.413800239562988, 6.76456356048584, 7.115326881408691, 7.466090679168701, 7.816854000091553, 8.167617797851562, 8.518381118774414, 8.869144439697266, 9.219907760620117, 9.570671081542969, 9.92143440246582, 10.272197723388672, 10.622961044311523, 10.973725318908691, 11.324488639831543, 11.675251960754395, 12.026015281677246, 12.376779556274414]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 4.0, 10.0, 28.0, 36.0, 76.0, 110.0, 174.0, 277.0, 412.0, 653.0, 988.0, 1541.0, 2274.0, 3497.0, 5092.0, 7387.0, 10679.0, 14543.0, 19452.0, 26366.0, 34236.0, 43746.0, 54985.0, 66497.0, 79222.0, 93125.0, 107000.0, 94681.0, 80789.0, 67502.0, 56142.0, 44722.0, 35548.0, 27342.0, 20436.0, 14839.0, 10715.0, 7571.0, 5301.0, 3562.0, 2456.0, 1605.0, 1078.0, 673.0, 498.0, 283.0, 161.0, 105.0, 53.0, 43.0, 21.0, 13.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.703125, -24.86181640625, -24.0205078125, -23.17919921875, -22.337890625, -21.49658203125, -20.6552734375, -19.81396484375, -18.97265625, -18.13134765625, -17.2900390625, -16.44873046875, -15.607421875, -14.76611328125, -13.9248046875, -13.08349609375, -12.2421875, -11.40087890625, -10.5595703125, -9.71826171875, -8.876953125, -8.03564453125, -7.1943359375, -6.35302734375, -5.51171875, -4.67041015625, -3.8291015625, -2.98779296875, -2.146484375, -1.30517578125, -0.4638671875, 0.37744140625, 1.21875, 2.06005859375, 2.9013671875, 3.74267578125, 4.583984375, 5.42529296875, 6.2666015625, 7.10791015625, 7.94921875, 8.79052734375, 9.6318359375, 10.47314453125, 11.314453125, 12.15576171875, 12.9970703125, 13.83837890625, 14.6796875, 15.52099609375, 16.3623046875, 17.20361328125, 18.044921875, 18.88623046875, 19.7275390625, 20.56884765625, 21.41015625, 22.25146484375, 23.0927734375, 23.93408203125, 24.775390625, 25.61669921875, 26.4580078125, 27.29931640625, 28.140625]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 4.0, 2.0, 0.0, 6.0, 6.0, 6.0, 3.0, 12.0, 10.0, 8.0, 10.0, 16.0, 25.0, 22.0, 25.0, 29.0, 35.0, 39.0, 37.0, 35.0, 37.0, 53.0, 56.0, 69.0, 54.0, 53.0, 50.0, 42.0, 18.0, 31.0, 24.0, 31.0, 23.0, 23.0, 13.0, 14.0, 16.0, 7.0, 18.0, 8.0, 7.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.6248779296875, -13.171630859375, -12.7183837890625, -12.26513671875, -11.8118896484375, -11.358642578125, -10.9053955078125, -10.4521484375, -9.9989013671875, -9.545654296875, -9.0924072265625, -8.63916015625, -8.1859130859375, -7.732666015625, -7.2794189453125, -6.826171875, -6.3729248046875, -5.919677734375, -5.4664306640625, -5.01318359375, -4.5599365234375, -4.106689453125, -3.6534423828125, -3.2001953125, -2.7469482421875, -2.293701171875, -1.8404541015625, -1.38720703125, -0.9339599609375, -0.480712890625, -0.0274658203125, 0.42578125, 0.8790283203125, 1.332275390625, 1.7855224609375, 2.23876953125, 2.6920166015625, 3.145263671875, 3.5985107421875, 4.0517578125, 4.5050048828125, 4.958251953125, 5.4114990234375, 5.86474609375, 6.3179931640625, 6.771240234375, 7.2244873046875, 7.677734375, 8.1309814453125, 8.584228515625, 9.0374755859375, 9.49072265625, 9.9439697265625, 10.397216796875, 10.8504638671875, 11.3037109375, 11.7569580078125, 12.210205078125, 12.6634521484375, 13.11669921875, 13.5699462890625, 14.023193359375, 14.4764404296875, 14.9296875]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 4.0, 3.0, 8.0, 2.0, 3.0, 3.0, 10.0, 8.0, 10.0, 10.0, 12.0, 13.0, 10.0, 16.0, 29.0, 26.0, 24.0, 33.0, 42.0, 28.0, 33.0, 31.0, 33.0, 41.0, 29.0, 42.0, 39.0, 37.0, 42.0, 35.0, 31.0, 25.0, 37.0, 31.0, 26.0, 17.0, 21.0, 29.0, 18.0, 22.0, 14.0, 15.0, 12.0, 14.0, 12.0, 9.0, 2.0, 5.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.108541488647461, -8.822488784790039, -8.536436080932617, -8.250383377075195, -7.964330673217773, -7.678277969360352, -7.3922247886657715, -7.10617208480835, -6.820119380950928, -6.534066677093506, -6.248013973236084, -5.961961269378662, -5.675908088684082, -5.38985538482666, -5.103802680969238, -4.817749977111816, -4.5316972732543945, -4.245644569396973, -3.959591865539551, -3.67353892326355, -3.387486219406128, -3.101433515548706, -2.815380573272705, -2.529327869415283, -2.2432751655578613, -1.9572224617004395, -1.671169638633728, -1.3851168155670166, -1.0990641117095947, -0.8130114078521729, -0.5269585847854614, -0.24090576171875, 0.04514789581298828, 0.33120065927505493, 0.6172534227371216, 0.9033061861991882, 1.1893589496612549, 1.4754116535186768, 1.7614644765853882, 2.0475172996520996, 2.3335700035095215, 2.6196227073669434, 2.9056754112243652, 3.191728353500366, 3.477781057357788, 3.76383376121521, 4.049886703491211, 4.335939407348633, 4.621992111206055, 4.908044815063477, 5.194097518920898, 5.48015022277832, 5.766202926635742, 6.052255630493164, 6.338308811187744, 6.624361515045166, 6.910414218902588, 7.19646692276001, 7.482519626617432, 7.7685723304748535, 8.054625511169434, 8.340678215026855, 8.626730918884277, 8.9127836227417, 9.198836326599121]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 7.0, 13.0, 10.0, 17.0, 21.0, 15.0, 13.0, 12.0, 27.0, 28.0, 18.0, 41.0, 36.0, 34.0, 34.0, 36.0, 40.0, 56.0, 48.0, 32.0, 27.0, 46.0, 40.0, 37.0, 38.0, 35.0, 23.0, 29.0, 28.0, 22.0, 28.0, 18.0, 20.0, 9.0, 9.0, 10.0, 7.0, 10.0, 4.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.101076126098633, -8.788050651550293, -8.475024223327637, -8.161998748779297, -7.848972797393799, -7.535946846008301, -7.222921371459961, -6.909895420074463, -6.596869468688965, -6.283843517303467, -5.970817565917969, -5.657792091369629, -5.344766139984131, -5.031740188598633, -4.718714714050293, -4.405688762664795, -4.092662811279297, -3.779636859893799, -3.46661114692688, -3.153585433959961, -2.840559482574463, -2.527533531188965, -2.214507818222046, -1.901482105255127, -1.588456153869629, -1.2754303216934204, -0.9624044895172119, -0.6493786573410034, -0.3363528251647949, -0.023326992988586426, 0.28969883918762207, 0.602724552154541, 0.9157514572143555, 1.228777289390564, 1.5418031215667725, 1.854828953742981, 2.1678547859191895, 2.4808807373046875, 2.7939064502716064, 3.1069321632385254, 3.4199581146240234, 3.7329840660095215, 4.0460100173950195, 4.359035491943359, 4.672061443328857, 4.9850873947143555, 5.298112869262695, 5.611138820648193, 5.924164772033691, 6.2371907234191895, 6.5502166748046875, 6.863242149353027, 7.176268100738525, 7.489294052124023, 7.802319526672363, 8.115345001220703, 8.42837142944336, 8.7413969039917, 9.054423332214355, 9.367448806762695, 9.680475234985352, 9.993500709533691, 10.306526184082031, 10.619552612304688, 10.932578086853027]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 3.0, 12.0, 5.0, 17.0, 15.0, 41.0, 68.0, 120.0, 187.0, 341.0, 535.0, 936.0, 1605.0, 2671.0, 4416.0, 7126.0, 11676.0, 18767.0, 29684.0, 45639.0, 70595.0, 104761.0, 149746.0, 207970.0, 276577.0, 345542.0, 404598.0, 438396.0, 436884.0, 400867.0, 339563.0, 269909.0, 202714.0, 144412.0, 99586.0, 66003.0, 43533.0, 27201.0, 16724.0, 10115.0, 6112.0, 3601.0, 2156.0, 1197.0, 711.0, 439.0, 227.0, 124.0, 62.0, 49.0, 28.0, 8.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.828125, -8.5517578125, -8.275390625, -7.9990234375, -7.72265625, -7.4462890625, -7.169921875, -6.8935546875, -6.6171875, -6.3408203125, -6.064453125, -5.7880859375, -5.51171875, -5.2353515625, -4.958984375, -4.6826171875, -4.40625, -4.1298828125, -3.853515625, -3.5771484375, -3.30078125, -3.0244140625, -2.748046875, -2.4716796875, -2.1953125, -1.9189453125, -1.642578125, -1.3662109375, -1.08984375, -0.8134765625, -0.537109375, -0.2607421875, 0.015625, 0.2919921875, 0.568359375, 0.8447265625, 1.12109375, 1.3974609375, 1.673828125, 1.9501953125, 2.2265625, 2.5029296875, 2.779296875, 3.0556640625, 3.33203125, 3.6083984375, 3.884765625, 4.1611328125, 4.4375, 4.7138671875, 4.990234375, 5.2666015625, 5.54296875, 5.8193359375, 6.095703125, 6.3720703125, 6.6484375, 6.9248046875, 7.201171875, 7.4775390625, 7.75390625, 8.0302734375, 8.306640625, 8.5830078125, 8.859375]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 6.0, 6.0, 11.0, 13.0, 15.0, 17.0, 21.0, 21.0, 26.0, 23.0, 27.0, 29.0, 32.0, 34.0, 45.0, 28.0, 41.0, 32.0, 37.0, 46.0, 50.0, 44.0, 37.0, 44.0, 40.0, 34.0, 35.0, 23.0, 27.0, 24.0, 20.0, 13.0, 16.0, 16.0, 15.0, 11.0, 6.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.3834228515625, -8.110595703125, -7.8377685546875, -7.56494140625, -7.2921142578125, -7.019287109375, -6.7464599609375, -6.4736328125, -6.2008056640625, -5.927978515625, -5.6551513671875, -5.38232421875, -5.1094970703125, -4.836669921875, -4.5638427734375, -4.291015625, -4.0181884765625, -3.745361328125, -3.4725341796875, -3.19970703125, -2.9268798828125, -2.654052734375, -2.3812255859375, -2.1083984375, -1.8355712890625, -1.562744140625, -1.2899169921875, -1.01708984375, -0.7442626953125, -0.471435546875, -0.1986083984375, 0.07421875, 0.3470458984375, 0.619873046875, 0.8927001953125, 1.16552734375, 1.4383544921875, 1.711181640625, 1.9840087890625, 2.2568359375, 2.5296630859375, 2.802490234375, 3.0753173828125, 3.34814453125, 3.6209716796875, 3.893798828125, 4.1666259765625, 4.439453125, 4.7122802734375, 4.985107421875, 5.2579345703125, 5.53076171875, 5.8035888671875, 6.076416015625, 6.3492431640625, 6.6220703125, 6.8948974609375, 7.167724609375, 7.4405517578125, 7.71337890625, 7.9862060546875, 8.259033203125, 8.5318603515625, 8.8046875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 14.0, 20.0, 28.0, 32.0, 61.0, 108.0, 178.0, 289.0, 514.0, 810.0, 1434.0, 2320.0, 3776.0, 6128.0, 9826.0, 15324.0, 23634.0, 36067.0, 53189.0, 77239.0, 109166.0, 147586.0, 194021.0, 244651.0, 293056.0, 335804.0, 363448.0, 373901.0, 362769.0, 333617.0, 290771.0, 241331.0, 191858.0, 146428.0, 107206.0, 76194.0, 53039.0, 35251.0, 23472.0, 15099.0, 9550.0, 5930.0, 3665.0, 2249.0, 1308.0, 771.0, 509.0, 274.0, 140.0, 84.0, 65.0, 42.0, 19.0, 12.0, 6.0, 5.0, 5.0, 1.0, 1.0], "bins": [-8.234375, -7.9808349609375, -7.727294921875, -7.4737548828125, -7.22021484375, -6.9666748046875, -6.713134765625, -6.4595947265625, -6.2060546875, -5.9525146484375, -5.698974609375, -5.4454345703125, -5.19189453125, -4.9383544921875, -4.684814453125, -4.4312744140625, -4.177734375, -3.9241943359375, -3.670654296875, -3.4171142578125, -3.16357421875, -2.9100341796875, -2.656494140625, -2.4029541015625, -2.1494140625, -1.8958740234375, -1.642333984375, -1.3887939453125, -1.13525390625, -0.8817138671875, -0.628173828125, -0.3746337890625, -0.12109375, 0.1324462890625, 0.385986328125, 0.6395263671875, 0.89306640625, 1.1466064453125, 1.400146484375, 1.6536865234375, 1.9072265625, 2.1607666015625, 2.414306640625, 2.6678466796875, 2.92138671875, 3.1749267578125, 3.428466796875, 3.6820068359375, 3.935546875, 4.1890869140625, 4.442626953125, 4.6961669921875, 4.94970703125, 5.2032470703125, 5.456787109375, 5.7103271484375, 5.9638671875, 6.2174072265625, 6.470947265625, 6.7244873046875, 6.97802734375, 7.2315673828125, 7.485107421875, 7.7386474609375, 7.9921875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 7.0, 10.0, 13.0, 28.0, 36.0, 45.0, 55.0, 65.0, 104.0, 97.0, 125.0, 145.0, 183.0, 217.0, 201.0, 222.0, 274.0, 223.0, 242.0, 260.0, 225.0, 201.0, 188.0, 178.0, 145.0, 126.0, 111.0, 73.0, 52.0, 55.0, 48.0, 38.0, 20.0, 22.0, 9.0, 10.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.8203125, -6.640625, -6.4609375, -6.28125, -6.1015625, -5.921875, -5.7421875, -5.5625, -5.3828125, -5.203125, -5.0234375, -4.84375, -4.6640625, -4.484375, -4.3046875, -4.125, -3.9453125, -3.765625, -3.5859375, -3.40625, -3.2265625, -3.046875, -2.8671875, -2.6875, -2.5078125, -2.328125, -2.1484375, -1.96875, -1.7890625, -1.609375, -1.4296875, -1.25, -1.0703125, -0.890625, -0.7109375, -0.53125, -0.3515625, -0.171875, 0.0078125, 0.1875, 0.3671875, 0.546875, 0.7265625, 0.90625, 1.0859375, 1.265625, 1.4453125, 1.625, 1.8046875, 1.984375, 2.1640625, 2.34375, 2.5234375, 2.703125, 2.8828125, 3.0625, 3.2421875, 3.421875, 3.6015625, 3.78125, 3.9609375, 4.140625, 4.3203125, 4.5, 4.6796875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 7.0, 5.0, 11.0, 9.0, 10.0, 9.0, 11.0, 14.0, 19.0, 13.0, 19.0, 23.0, 25.0, 28.0, 37.0, 34.0, 35.0, 25.0, 34.0, 38.0, 40.0, 37.0, 42.0, 36.0, 40.0, 38.0, 46.0, 49.0, 40.0, 29.0, 31.0, 29.0, 20.0, 17.0, 25.0, 12.0, 14.0, 11.0, 4.0, 11.0, 8.0, 3.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.557665824890137, -10.21833610534668, -9.879007339477539, -9.539677619934082, -9.200348854064941, -8.861019134521484, -8.521690368652344, -8.182360649108887, -7.843031406402588, -7.503702163696289, -7.16437292098999, -6.825043678283691, -6.485713958740234, -6.146385192871094, -5.807055473327637, -5.467726230621338, -5.128396987915039, -4.78906774520874, -4.449738502502441, -4.110408782958984, -3.7710797786712646, -3.431750535964966, -3.092421054840088, -2.753091812133789, -2.4137625694274902, -2.0744333267211914, -1.735103964805603, -1.3957746028900146, -1.0564453601837158, -0.717116117477417, -0.37778663635253906, -0.038457393646240234, 0.300872802734375, 0.6402021050453186, 0.9795314073562622, 1.3188607692718506, 1.6581900119781494, 1.9975192546844482, 2.336848735809326, 2.676177978515625, 3.015507221221924, 3.3548364639282227, 3.6941657066345215, 4.03349494934082, 4.372824668884277, 4.712153434753418, 5.051483154296875, 5.390812397003174, 5.730141639709473, 6.0694708824157715, 6.40880012512207, 6.748129844665527, 7.087458610534668, 7.426788330078125, 7.766117572784424, 8.105446815490723, 8.44477653503418, 8.784106254577637, 9.123435020446777, 9.462764739990234, 9.802093505859375, 10.141423225402832, 10.480752944946289, 10.82008171081543, 11.15941047668457]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 5.0, 9.0, 7.0, 19.0, 12.0, 13.0, 21.0, 18.0, 31.0, 21.0, 35.0, 29.0, 26.0, 35.0, 27.0, 29.0, 44.0, 41.0, 38.0, 48.0, 33.0, 36.0, 42.0, 42.0, 32.0, 50.0, 40.0, 27.0, 30.0, 25.0, 22.0, 23.0, 14.0, 10.0, 8.0, 12.0, 14.0, 6.0, 10.0, 4.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.936174392700195, -11.571666717529297, -11.207158088684082, -10.842650413513184, -10.478142738342285, -10.11363410949707, -9.749126434326172, -9.384618759155273, -9.020110130310059, -8.65560245513916, -8.291093826293945, -7.926586151123047, -7.56207799911499, -7.197569847106934, -6.833062171936035, -6.4685540199279785, -6.10404634475708, -5.739538192749023, -5.375030517578125, -5.010522365570068, -4.646014213562012, -4.281506538391113, -3.9169983863830566, -3.552490234375, -3.1879823207855225, -2.823474407196045, -2.4589662551879883, -2.0944583415985107, -1.7299503087997437, -1.3654422760009766, -1.000934362411499, -0.6364262104034424, -0.27191829681396484, 0.09258970618247986, 0.45709770917892456, 0.8216056823730469, 1.186113715171814, 1.550621747970581, 1.9151296615600586, 2.2796378135681152, 2.6441457271575928, 3.0086536407470703, 3.373161792755127, 3.7376697063446045, 4.102177619934082, 4.466685771942139, 4.831193923950195, 5.195701599121094, 5.56020975112915, 5.924717903137207, 6.2892255783081055, 6.653733730316162, 7.018241882324219, 7.382749557495117, 7.747257709503174, 8.11176586151123, 8.476273536682129, 8.840781211853027, 9.205289840698242, 9.56979751586914, 9.934305191040039, 10.298813819885254, 10.663321495056152, 11.027830123901367, 11.392337799072266]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 10.0, 7.0, 8.0, 19.0, 23.0, 41.0, 75.0, 94.0, 119.0, 214.0, 320.0, 418.0, 643.0, 965.0, 1371.0, 2008.0, 3072.0, 4587.0, 6974.0, 10261.0, 15274.0, 22922.0, 33937.0, 48866.0, 69033.0, 94089.0, 119378.0, 133834.0, 126682.0, 102968.0, 77431.0, 55030.0, 38154.0, 26299.0, 17621.0, 11879.0, 7922.0, 5312.0, 3502.0, 2378.0, 1535.0, 1020.0, 676.0, 508.0, 330.0, 233.0, 175.0, 121.0, 70.0, 49.0, 37.0, 28.0, 16.0, 13.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.03125, -15.508544921875, -14.98583984375, -14.463134765625, -13.9404296875, -13.417724609375, -12.89501953125, -12.372314453125, -11.849609375, -11.326904296875, -10.80419921875, -10.281494140625, -9.7587890625, -9.236083984375, -8.71337890625, -8.190673828125, -7.66796875, -7.145263671875, -6.62255859375, -6.099853515625, -5.5771484375, -5.054443359375, -4.53173828125, -4.009033203125, -3.486328125, -2.963623046875, -2.44091796875, -1.918212890625, -1.3955078125, -0.872802734375, -0.35009765625, 0.172607421875, 0.6953125, 1.218017578125, 1.74072265625, 2.263427734375, 2.7861328125, 3.308837890625, 3.83154296875, 4.354248046875, 4.876953125, 5.399658203125, 5.92236328125, 6.445068359375, 6.9677734375, 7.490478515625, 8.01318359375, 8.535888671875, 9.05859375, 9.581298828125, 10.10400390625, 10.626708984375, 11.1494140625, 11.672119140625, 12.19482421875, 12.717529296875, 13.240234375, 13.762939453125, 14.28564453125, 14.808349609375, 15.3310546875, 15.853759765625, 16.37646484375, 16.899169921875, 17.421875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 5.0, 6.0, 13.0, 8.0, 17.0, 28.0, 23.0, 26.0, 16.0, 23.0, 41.0, 36.0, 39.0, 40.0, 42.0, 34.0, 52.0, 48.0, 37.0, 38.0, 44.0, 43.0, 54.0, 52.0, 32.0, 31.0, 29.0, 20.0, 27.0, 14.0, 17.0, 10.0, 13.0, 9.0, 11.0, 5.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0, -12.60498046875, -12.2099609375, -11.81494140625, -11.419921875, -11.02490234375, -10.6298828125, -10.23486328125, -9.83984375, -9.44482421875, -9.0498046875, -8.65478515625, -8.259765625, -7.86474609375, -7.4697265625, -7.07470703125, -6.6796875, -6.28466796875, -5.8896484375, -5.49462890625, -5.099609375, -4.70458984375, -4.3095703125, -3.91455078125, -3.51953125, -3.12451171875, -2.7294921875, -2.33447265625, -1.939453125, -1.54443359375, -1.1494140625, -0.75439453125, -0.359375, 0.03564453125, 0.4306640625, 0.82568359375, 1.220703125, 1.61572265625, 2.0107421875, 2.40576171875, 2.80078125, 3.19580078125, 3.5908203125, 3.98583984375, 4.380859375, 4.77587890625, 5.1708984375, 5.56591796875, 5.9609375, 6.35595703125, 6.7509765625, 7.14599609375, 7.541015625, 7.93603515625, 8.3310546875, 8.72607421875, 9.12109375, 9.51611328125, 9.9111328125, 10.30615234375, 10.701171875, 11.09619140625, 11.4912109375, 11.88623046875, 12.28125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 4.0, 11.0, 28.0, 25.0, 35.0, 49.0, 69.0, 94.0, 169.0, 251.0, 464.0, 713.0, 1158.0, 1822.0, 3084.0, 5305.0, 9451.0, 16879.0, 31285.0, 60682.0, 120401.0, 235118.0, 263338.0, 143666.0, 71421.0, 37011.0, 19879.0, 10743.0, 6148.0, 3597.0, 2129.0, 1276.0, 834.0, 479.0, 339.0, 179.0, 130.0, 86.0, 66.0, 38.0, 40.0, 14.0, 9.0, 12.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.1875, -25.318359375, -24.44921875, -23.580078125, -22.7109375, -21.841796875, -20.97265625, -20.103515625, -19.234375, -18.365234375, -17.49609375, -16.626953125, -15.7578125, -14.888671875, -14.01953125, -13.150390625, -12.28125, -11.412109375, -10.54296875, -9.673828125, -8.8046875, -7.935546875, -7.06640625, -6.197265625, -5.328125, -4.458984375, -3.58984375, -2.720703125, -1.8515625, -0.982421875, -0.11328125, 0.755859375, 1.625, 2.494140625, 3.36328125, 4.232421875, 5.1015625, 5.970703125, 6.83984375, 7.708984375, 8.578125, 9.447265625, 10.31640625, 11.185546875, 12.0546875, 12.923828125, 13.79296875, 14.662109375, 15.53125, 16.400390625, 17.26953125, 18.138671875, 19.0078125, 19.876953125, 20.74609375, 21.615234375, 22.484375, 23.353515625, 24.22265625, 25.091796875, 25.9609375, 26.830078125, 27.69921875, 28.568359375, 29.4375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 5.0, 10.0, 9.0, 7.0, 18.0, 13.0, 20.0, 29.0, 32.0, 26.0, 27.0, 32.0, 46.0, 42.0, 48.0, 43.0, 46.0, 48.0, 56.0, 53.0, 48.0, 51.0, 42.0, 42.0, 25.0, 28.0, 18.0, 21.0, 21.0, 21.0, 11.0, 12.0, 5.0, 10.0, 4.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.375, -10.024169921875, -9.67333984375, -9.322509765625, -8.9716796875, -8.620849609375, -8.27001953125, -7.919189453125, -7.568359375, -7.217529296875, -6.86669921875, -6.515869140625, -6.1650390625, -5.814208984375, -5.46337890625, -5.112548828125, -4.76171875, -4.410888671875, -4.06005859375, -3.709228515625, -3.3583984375, -3.007568359375, -2.65673828125, -2.305908203125, -1.955078125, -1.604248046875, -1.25341796875, -0.902587890625, -0.5517578125, -0.200927734375, 0.14990234375, 0.500732421875, 0.8515625, 1.202392578125, 1.55322265625, 1.904052734375, 2.2548828125, 2.605712890625, 2.95654296875, 3.307373046875, 3.658203125, 4.009033203125, 4.35986328125, 4.710693359375, 5.0615234375, 5.412353515625, 5.76318359375, 6.114013671875, 6.46484375, 6.815673828125, 7.16650390625, 7.517333984375, 7.8681640625, 8.218994140625, 8.56982421875, 8.920654296875, 9.271484375, 9.622314453125, 9.97314453125, 10.323974609375, 10.6748046875, 11.025634765625, 11.37646484375, 11.727294921875, 12.078125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 0.0, 4.0, 2.0, 4.0, 12.0, 6.0, 7.0, 11.0, 12.0, 16.0, 28.0, 32.0, 84.0, 77.0, 117.0, 151.0, 221.0, 335.0, 513.0, 779.0, 1166.0, 1864.0, 3222.0, 5661.0, 11127.0, 23595.0, 61277.0, 233206.0, 480281.0, 143195.0, 42909.0, 17640.0, 8650.0, 4772.0, 2706.0, 1635.0, 1061.0, 695.0, 429.0, 329.0, 206.0, 159.0, 105.0, 68.0, 52.0, 31.0, 29.0, 20.0, 16.0, 13.0, 10.0, 5.0, 3.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-41.875, -40.53857421875, -39.2021484375, -37.86572265625, -36.529296875, -35.19287109375, -33.8564453125, -32.52001953125, -31.18359375, -29.84716796875, -28.5107421875, -27.17431640625, -25.837890625, -24.50146484375, -23.1650390625, -21.82861328125, -20.4921875, -19.15576171875, -17.8193359375, -16.48291015625, -15.146484375, -13.81005859375, -12.4736328125, -11.13720703125, -9.80078125, -8.46435546875, -7.1279296875, -5.79150390625, -4.455078125, -3.11865234375, -1.7822265625, -0.44580078125, 0.890625, 2.22705078125, 3.5634765625, 4.89990234375, 6.236328125, 7.57275390625, 8.9091796875, 10.24560546875, 11.58203125, 12.91845703125, 14.2548828125, 15.59130859375, 16.927734375, 18.26416015625, 19.6005859375, 20.93701171875, 22.2734375, 23.60986328125, 24.9462890625, 26.28271484375, 27.619140625, 28.95556640625, 30.2919921875, 31.62841796875, 32.96484375, 34.30126953125, 35.6376953125, 36.97412109375, 38.310546875, 39.64697265625, 40.9833984375, 42.31982421875, 43.65625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 6.0, 14.0, 7.0, 15.0, 21.0, 38.0, 35.0, 57.0, 61.0, 124.0, 190.0, 136.0, 93.0, 44.0, 37.0, 23.0, 22.0, 11.0, 14.0, 13.0, 7.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004306793212890625, -0.004194796085357666, -0.004082798957824707, -0.003970801830291748, -0.003858804702758789, -0.00374680757522583, -0.003634810447692871, -0.003522813320159912, -0.003410816192626953, -0.003298819065093994, -0.003186821937561035, -0.003074824810028076, -0.002962827682495117, -0.002850830554962158, -0.0027388334274291992, -0.0026268362998962402, -0.0025148391723632812, -0.0024028420448303223, -0.0022908449172973633, -0.0021788477897644043, -0.0020668506622314453, -0.0019548535346984863, -0.0018428564071655273, -0.0017308592796325684, -0.0016188621520996094, -0.0015068650245666504, -0.0013948678970336914, -0.0012828707695007324, -0.0011708736419677734, -0.0010588765144348145, -0.0009468793869018555, -0.0008348822593688965, -0.0007228851318359375, -0.0006108880043029785, -0.0004988908767700195, -0.00038689374923706055, -0.00027489662170410156, -0.00016289949417114258, -5.0902366638183594e-05, 6.109476089477539e-05, 0.00017309188842773438, 0.00028508901596069336, 0.00039708614349365234, 0.0005090832710266113, 0.0006210803985595703, 0.0007330775260925293, 0.0008450746536254883, 0.0009570717811584473, 0.0010690689086914062, 0.0011810660362243652, 0.0012930631637573242, 0.0014050602912902832, 0.0015170574188232422, 0.0016290545463562012, 0.0017410516738891602, 0.0018530488014221191, 0.001965045928955078, 0.002077043056488037, 0.002189040184020996, 0.002301037311553955, 0.002413034439086914, 0.002525031566619873, 0.002637028694152832, 0.002749025821685791, 0.00286102294921875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 12.0, 18.0, 30.0, 44.0, 63.0, 125.0, 160.0, 215.0, 379.0, 530.0, 869.0, 1341.0, 2120.0, 3204.0, 5068.0, 8013.0, 12468.0, 20666.0, 34998.0, 59447.0, 100758.0, 153935.0, 188494.0, 168163.0, 114725.0, 69092.0, 40116.0, 23918.0, 14530.0, 9134.0, 5611.0, 3639.0, 2279.0, 1513.0, 1015.0, 647.0, 383.0, 294.0, 194.0, 114.0, 76.0, 48.0, 29.0, 18.0, 13.0, 8.0, 10.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.773681640625, -16.18798828125, -15.602294921875, -15.0166015625, -14.430908203125, -13.84521484375, -13.259521484375, -12.673828125, -12.088134765625, -11.50244140625, -10.916748046875, -10.3310546875, -9.745361328125, -9.15966796875, -8.573974609375, -7.98828125, -7.402587890625, -6.81689453125, -6.231201171875, -5.6455078125, -5.059814453125, -4.47412109375, -3.888427734375, -3.302734375, -2.717041015625, -2.13134765625, -1.545654296875, -0.9599609375, -0.374267578125, 0.21142578125, 0.797119140625, 1.3828125, 1.968505859375, 2.55419921875, 3.139892578125, 3.7255859375, 4.311279296875, 4.89697265625, 5.482666015625, 6.068359375, 6.654052734375, 7.23974609375, 7.825439453125, 8.4111328125, 8.996826171875, 9.58251953125, 10.168212890625, 10.75390625, 11.339599609375, 11.92529296875, 12.510986328125, 13.0966796875, 13.682373046875, 14.26806640625, 14.853759765625, 15.439453125, 16.025146484375, 16.61083984375, 17.196533203125, 17.7822265625, 18.367919921875, 18.95361328125, 19.539306640625, 20.125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 2.0, 3.0, 4.0, 5.0, 9.0, 5.0, 10.0, 10.0, 14.0, 17.0, 18.0, 29.0, 43.0, 36.0, 51.0, 43.0, 46.0, 60.0, 56.0, 69.0, 58.0, 69.0, 57.0, 63.0, 45.0, 23.0, 28.0, 25.0, 25.0, 12.0, 12.0, 11.0, 5.0, 4.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7421875, -5.55126953125, -5.3603515625, -5.16943359375, -4.978515625, -4.78759765625, -4.5966796875, -4.40576171875, -4.21484375, -4.02392578125, -3.8330078125, -3.64208984375, -3.451171875, -3.26025390625, -3.0693359375, -2.87841796875, -2.6875, -2.49658203125, -2.3056640625, -2.11474609375, -1.923828125, -1.73291015625, -1.5419921875, -1.35107421875, -1.16015625, -0.96923828125, -0.7783203125, -0.58740234375, -0.396484375, -0.20556640625, -0.0146484375, 0.17626953125, 0.3671875, 0.55810546875, 0.7490234375, 0.93994140625, 1.130859375, 1.32177734375, 1.5126953125, 1.70361328125, 1.89453125, 2.08544921875, 2.2763671875, 2.46728515625, 2.658203125, 2.84912109375, 3.0400390625, 3.23095703125, 3.421875, 3.61279296875, 3.8037109375, 3.99462890625, 4.185546875, 4.37646484375, 4.5673828125, 4.75830078125, 4.94921875, 5.14013671875, 5.3310546875, 5.52197265625, 5.712890625, 5.90380859375, 6.0947265625, 6.28564453125, 6.4765625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 2.0, 6.0, 8.0, 7.0, 14.0, 10.0, 16.0, 15.0, 19.0, 15.0, 22.0, 30.0, 34.0, 27.0, 38.0, 35.0, 41.0, 32.0, 45.0, 43.0, 46.0, 48.0, 40.0, 43.0, 32.0, 38.0, 36.0, 33.0, 31.0, 16.0, 31.0, 22.0, 24.0, 21.0, 8.0, 19.0, 10.0, 7.0, 8.0, 7.0, 2.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.823258399963379, -10.45478630065918, -10.086315155029297, -9.717844009399414, -9.349371910095215, -8.980899810791016, -8.612428665161133, -8.24395751953125, -7.875485420227051, -7.50701379776001, -7.138542175292969, -6.770070552825928, -6.401598930358887, -6.033127307891846, -5.664655685424805, -5.296184062957764, -4.927712440490723, -4.559240818023682, -4.190769195556641, -3.8222975730895996, -3.4538259506225586, -3.0853543281555176, -2.7168827056884766, -2.3484110832214355, -1.9799394607543945, -1.6114678382873535, -1.2429962158203125, -0.8745245933532715, -0.5060529708862305, -0.13758134841918945, 0.23089027404785156, 0.5993618965148926, 0.9678325653076172, 1.3363041877746582, 1.7047758102416992, 2.0732474327087402, 2.4417190551757812, 2.8101906776428223, 3.1786623001098633, 3.5471339225769043, 3.9156055450439453, 4.284077167510986, 4.652548789978027, 5.021020412445068, 5.389492034912109, 5.75796365737915, 6.126435279846191, 6.494906902313232, 6.863378524780273, 7.2318501472473145, 7.6003217697143555, 7.9687933921813965, 8.337265014648438, 8.70573616027832, 9.07420825958252, 9.442680358886719, 9.811151504516602, 10.179622650146484, 10.548094749450684, 10.916566848754883, 11.285037994384766, 11.653509140014648, 12.021981239318848, 12.390453338623047, 12.75892448425293]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 8.0, 12.0, 6.0, 13.0, 13.0, 17.0, 24.0, 23.0, 20.0, 21.0, 29.0, 30.0, 37.0, 39.0, 30.0, 37.0, 39.0, 40.0, 47.0, 35.0, 28.0, 45.0, 46.0, 37.0, 40.0, 27.0, 34.0, 32.0, 23.0, 19.0, 19.0, 16.0, 20.0, 14.0, 17.0, 14.0, 11.0, 11.0, 8.0, 3.0, 8.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.97917366027832, -10.615381240844727, -10.25158977508545, -9.887797355651855, -9.524005889892578, -9.160213470458984, -8.796422004699707, -8.432629585266113, -8.068838119506836, -7.7050461769104, -7.341254234313965, -6.977462291717529, -6.613670349121094, -6.249878406524658, -5.886086463928223, -5.522294044494629, -5.158502101898193, -4.794710159301758, -4.430918216705322, -4.067126274108887, -3.703334331512451, -3.3395423889160156, -2.975750207901001, -2.6119582653045654, -2.24816632270813, -1.8843743801116943, -1.5205824375152588, -1.1567903757095337, -0.7929984331130981, -0.4292064905166626, -0.0654144287109375, 0.29837751388549805, 0.6621694564819336, 1.0259613990783691, 1.3897533416748047, 1.7535454034805298, 2.117337226867676, 2.4811291694641113, 2.844921350479126, 3.2087132930755615, 3.572505235671997, 3.9362971782684326, 4.300089359283447, 4.663881301879883, 5.027673244476318, 5.391465187072754, 5.7552571296691895, 6.119049072265625, 6.4828410148620605, 6.846632957458496, 7.210424900054932, 7.574216842651367, 7.938008785247803, 8.301800727844238, 8.665593147277832, 9.02938461303711, 9.393177032470703, 9.756969451904297, 10.120760917663574, 10.484553337097168, 10.848344802856445, 11.212137222290039, 11.575928688049316, 11.93972110748291, 12.303512573242188]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [7.0, 1.0, 5.0, 5.0, 7.0, 10.0, 21.0, 25.0, 39.0, 75.0, 99.0, 171.0, 287.0, 411.0, 691.0, 1017.0, 1568.0, 2281.0, 3455.0, 5246.0, 7605.0, 11184.0, 16104.0, 22730.0, 30782.0, 41120.0, 53227.0, 66440.0, 78665.0, 88042.0, 93891.0, 93522.0, 88147.0, 78632.0, 65869.0, 53197.0, 41127.0, 30943.0, 22206.0, 15937.0, 11110.0, 7572.0, 5203.0, 3385.0, 2259.0, 1474.0, 997.0, 615.0, 411.0, 245.0, 183.0, 117.0, 83.0, 45.0, 26.0, 26.0, 11.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.71875, -9.4051513671875, -9.091552734375, -8.7779541015625, -8.46435546875, -8.1507568359375, -7.837158203125, -7.5235595703125, -7.2099609375, -6.8963623046875, -6.582763671875, -6.2691650390625, -5.95556640625, -5.6419677734375, -5.328369140625, -5.0147705078125, -4.701171875, -4.3875732421875, -4.073974609375, -3.7603759765625, -3.44677734375, -3.1331787109375, -2.819580078125, -2.5059814453125, -2.1923828125, -1.8787841796875, -1.565185546875, -1.2515869140625, -0.93798828125, -0.6243896484375, -0.310791015625, 0.0028076171875, 0.31640625, 0.6300048828125, 0.943603515625, 1.2572021484375, 1.57080078125, 1.8843994140625, 2.197998046875, 2.5115966796875, 2.8251953125, 3.1387939453125, 3.452392578125, 3.7659912109375, 4.07958984375, 4.3931884765625, 4.706787109375, 5.0203857421875, 5.333984375, 5.6475830078125, 5.961181640625, 6.2747802734375, 6.58837890625, 6.9019775390625, 7.215576171875, 7.5291748046875, 7.8427734375, 8.1563720703125, 8.469970703125, 8.7835693359375, 9.09716796875, 9.4107666015625, 9.724365234375, 10.0379638671875, 10.3515625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 8.0, 8.0, 12.0, 15.0, 24.0, 16.0, 20.0, 24.0, 25.0, 33.0, 41.0, 35.0, 32.0, 37.0, 47.0, 32.0, 50.0, 34.0, 44.0, 34.0, 45.0, 47.0, 26.0, 31.0, 35.0, 33.0, 28.0, 27.0, 19.0, 16.0, 22.0, 20.0, 19.0, 12.0, 7.0, 8.0, 7.0, 1.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0703125, -10.7225341796875, -10.374755859375, -10.0269775390625, -9.67919921875, -9.3314208984375, -8.983642578125, -8.6358642578125, -8.2880859375, -7.9403076171875, -7.592529296875, -7.2447509765625, -6.89697265625, -6.5491943359375, -6.201416015625, -5.8536376953125, -5.505859375, -5.1580810546875, -4.810302734375, -4.4625244140625, -4.11474609375, -3.7669677734375, -3.419189453125, -3.0714111328125, -2.7236328125, -2.3758544921875, -2.028076171875, -1.6802978515625, -1.33251953125, -0.9847412109375, -0.636962890625, -0.2891845703125, 0.05859375, 0.4063720703125, 0.754150390625, 1.1019287109375, 1.44970703125, 1.7974853515625, 2.145263671875, 2.4930419921875, 2.8408203125, 3.1885986328125, 3.536376953125, 3.8841552734375, 4.23193359375, 4.5797119140625, 4.927490234375, 5.2752685546875, 5.623046875, 5.9708251953125, 6.318603515625, 6.6663818359375, 7.01416015625, 7.3619384765625, 7.709716796875, 8.0574951171875, 8.4052734375, 8.7530517578125, 9.100830078125, 9.4486083984375, 9.79638671875, 10.1441650390625, 10.491943359375, 10.8397216796875, 11.1875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 13.0, 11.0, 19.0, 33.0, 47.0, 93.0, 177.0, 319.0, 562.0, 1136.0, 2062.0, 4074.0, 7693.0, 15003.0, 28604.0, 50834.0, 83886.0, 125011.0, 159527.0, 168615.0, 145237.0, 105348.0, 66997.0, 38776.0, 21230.0, 11054.0, 5900.0, 2978.0, 1531.0, 800.0, 434.0, 236.0, 133.0, 63.0, 45.0, 25.0, 10.0, 12.0, 3.0, 5.0, 3.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.265625, -18.6494140625, -18.033203125, -17.4169921875, -16.80078125, -16.1845703125, -15.568359375, -14.9521484375, -14.3359375, -13.7197265625, -13.103515625, -12.4873046875, -11.87109375, -11.2548828125, -10.638671875, -10.0224609375, -9.40625, -8.7900390625, -8.173828125, -7.5576171875, -6.94140625, -6.3251953125, -5.708984375, -5.0927734375, -4.4765625, -3.8603515625, -3.244140625, -2.6279296875, -2.01171875, -1.3955078125, -0.779296875, -0.1630859375, 0.453125, 1.0693359375, 1.685546875, 2.3017578125, 2.91796875, 3.5341796875, 4.150390625, 4.7666015625, 5.3828125, 5.9990234375, 6.615234375, 7.2314453125, 7.84765625, 8.4638671875, 9.080078125, 9.6962890625, 10.3125, 10.9287109375, 11.544921875, 12.1611328125, 12.77734375, 13.3935546875, 14.009765625, 14.6259765625, 15.2421875, 15.8583984375, 16.474609375, 17.0908203125, 17.70703125, 18.3232421875, 18.939453125, 19.5556640625, 20.171875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 7.0, 7.0, 10.0, 10.0, 10.0, 14.0, 19.0, 16.0, 17.0, 22.0, 28.0, 33.0, 40.0, 30.0, 31.0, 42.0, 51.0, 49.0, 43.0, 41.0, 38.0, 46.0, 50.0, 32.0, 32.0, 38.0, 38.0, 32.0, 30.0, 29.0, 17.0, 17.0, 20.0, 13.0, 13.0, 11.0, 8.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.953125, -8.6519775390625, -8.350830078125, -8.0496826171875, -7.74853515625, -7.4473876953125, -7.146240234375, -6.8450927734375, -6.5439453125, -6.2427978515625, -5.941650390625, -5.6405029296875, -5.33935546875, -5.0382080078125, -4.737060546875, -4.4359130859375, -4.134765625, -3.8336181640625, -3.532470703125, -3.2313232421875, -2.93017578125, -2.6290283203125, -2.327880859375, -2.0267333984375, -1.7255859375, -1.4244384765625, -1.123291015625, -0.8221435546875, -0.52099609375, -0.2198486328125, 0.081298828125, 0.3824462890625, 0.68359375, 0.9847412109375, 1.285888671875, 1.5870361328125, 1.88818359375, 2.1893310546875, 2.490478515625, 2.7916259765625, 3.0927734375, 3.3939208984375, 3.695068359375, 3.9962158203125, 4.29736328125, 4.5985107421875, 4.899658203125, 5.2008056640625, 5.501953125, 5.8031005859375, 6.104248046875, 6.4053955078125, 6.70654296875, 7.0076904296875, 7.308837890625, 7.6099853515625, 7.9111328125, 8.2122802734375, 8.513427734375, 8.8145751953125, 9.11572265625, 9.4168701171875, 9.718017578125, 10.0191650390625, 10.3203125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 4.0, 8.0, 5.0, 7.0, 18.0, 29.0, 45.0, 46.0, 80.0, 126.0, 145.0, 235.0, 357.0, 511.0, 701.0, 1065.0, 1650.0, 2274.0, 3637.0, 5343.0, 8063.0, 12252.0, 19011.0, 29432.0, 46633.0, 73452.0, 112177.0, 153164.0, 166596.0, 139345.0, 97004.0, 62722.0, 39219.0, 25356.0, 16382.0, 10553.0, 7027.0, 4559.0, 2990.0, 1973.0, 1377.0, 950.0, 624.0, 440.0, 292.0, 197.0, 141.0, 115.0, 69.0, 58.0, 25.0, 28.0, 16.0, 10.0, 11.0, 6.0, 4.0, 4.0, 1.0, 3.0], "bins": [-13.0234375, -12.6204833984375, -12.217529296875, -11.8145751953125, -11.41162109375, -11.0086669921875, -10.605712890625, -10.2027587890625, -9.7998046875, -9.3968505859375, -8.993896484375, -8.5909423828125, -8.18798828125, -7.7850341796875, -7.382080078125, -6.9791259765625, -6.576171875, -6.1732177734375, -5.770263671875, -5.3673095703125, -4.96435546875, -4.5614013671875, -4.158447265625, -3.7554931640625, -3.3525390625, -2.9495849609375, -2.546630859375, -2.1436767578125, -1.74072265625, -1.3377685546875, -0.934814453125, -0.5318603515625, -0.12890625, 0.2740478515625, 0.677001953125, 1.0799560546875, 1.48291015625, 1.8858642578125, 2.288818359375, 2.6917724609375, 3.0947265625, 3.4976806640625, 3.900634765625, 4.3035888671875, 4.70654296875, 5.1094970703125, 5.512451171875, 5.9154052734375, 6.318359375, 6.7213134765625, 7.124267578125, 7.5272216796875, 7.93017578125, 8.3331298828125, 8.736083984375, 9.1390380859375, 9.5419921875, 9.9449462890625, 10.347900390625, 10.7508544921875, 11.15380859375, 11.5567626953125, 11.959716796875, 12.3626708984375, 12.765625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 17.0, 13.0, 21.0, 23.0, 41.0, 39.0, 58.0, 62.0, 90.0, 84.0, 81.0, 89.0, 86.0, 58.0, 47.0, 49.0, 37.0, 19.0, 20.0, 13.0, 12.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.002178192138671875, -0.00211334228515625, -0.002048492431640625, -0.001983642578125, -0.001918792724609375, -0.00185394287109375, -0.001789093017578125, -0.0017242431640625, -0.001659393310546875, -0.00159454345703125, -0.001529693603515625, -0.00146484375, -0.001399993896484375, -0.00133514404296875, -0.001270294189453125, -0.0012054443359375, -0.001140594482421875, -0.00107574462890625, -0.001010894775390625, -0.000946044921875, -0.000881195068359375, -0.00081634521484375, -0.000751495361328125, -0.0006866455078125, -0.000621795654296875, -0.00055694580078125, -0.000492095947265625, -0.00042724609375, -0.000362396240234375, -0.00029754638671875, -0.000232696533203125, -0.0001678466796875, -0.000102996826171875, -3.814697265625e-05, 2.6702880859375e-05, 9.1552734375e-05, 0.000156402587890625, 0.00022125244140625, 0.000286102294921875, 0.0003509521484375, 0.000415802001953125, 0.00048065185546875, 0.000545501708984375, 0.0006103515625, 0.000675201416015625, 0.00074005126953125, 0.000804901123046875, 0.0008697509765625, 0.000934600830078125, 0.00099945068359375, 0.001064300537109375, 0.001129150390625, 0.001194000244140625, 0.00125885009765625, 0.001323699951171875, 0.0013885498046875, 0.001453399658203125, 0.00151824951171875, 0.001583099365234375, 0.00164794921875, 0.001712799072265625, 0.00177764892578125, 0.001842498779296875, 0.0019073486328125, 0.001972198486328125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 12.0, 12.0, 26.0, 17.0, 44.0, 67.0, 120.0, 139.0, 246.0, 367.0, 591.0, 903.0, 1349.0, 2099.0, 3411.0, 5346.0, 8661.0, 13312.0, 21482.0, 33860.0, 52838.0, 78924.0, 108997.0, 136354.0, 144880.0, 131251.0, 102077.0, 71821.0, 47326.0, 30514.0, 19209.0, 11835.0, 7359.0, 4616.0, 3081.0, 1925.0, 1141.0, 847.0, 498.0, 351.0, 232.0, 143.0, 91.0, 59.0, 51.0, 24.0, 11.0, 13.0, 14.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-10.8125, -10.478515625, -10.14453125, -9.810546875, -9.4765625, -9.142578125, -8.80859375, -8.474609375, -8.140625, -7.806640625, -7.47265625, -7.138671875, -6.8046875, -6.470703125, -6.13671875, -5.802734375, -5.46875, -5.134765625, -4.80078125, -4.466796875, -4.1328125, -3.798828125, -3.46484375, -3.130859375, -2.796875, -2.462890625, -2.12890625, -1.794921875, -1.4609375, -1.126953125, -0.79296875, -0.458984375, -0.125, 0.208984375, 0.54296875, 0.876953125, 1.2109375, 1.544921875, 1.87890625, 2.212890625, 2.546875, 2.880859375, 3.21484375, 3.548828125, 3.8828125, 4.216796875, 4.55078125, 4.884765625, 5.21875, 5.552734375, 5.88671875, 6.220703125, 6.5546875, 6.888671875, 7.22265625, 7.556640625, 7.890625, 8.224609375, 8.55859375, 8.892578125, 9.2265625, 9.560546875, 9.89453125, 10.228515625, 10.5625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 6.0, 10.0, 16.0, 16.0, 25.0, 23.0, 27.0, 34.0, 37.0, 45.0, 62.0, 69.0, 51.0, 79.0, 53.0, 73.0, 58.0, 66.0, 45.0, 39.0, 31.0, 24.0, 18.0, 12.0, 17.0, 16.0, 6.0, 2.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.671875, -5.49365234375, -5.3154296875, -5.13720703125, -4.958984375, -4.78076171875, -4.6025390625, -4.42431640625, -4.24609375, -4.06787109375, -3.8896484375, -3.71142578125, -3.533203125, -3.35498046875, -3.1767578125, -2.99853515625, -2.8203125, -2.64208984375, -2.4638671875, -2.28564453125, -2.107421875, -1.92919921875, -1.7509765625, -1.57275390625, -1.39453125, -1.21630859375, -1.0380859375, -0.85986328125, -0.681640625, -0.50341796875, -0.3251953125, -0.14697265625, 0.03125, 0.20947265625, 0.3876953125, 0.56591796875, 0.744140625, 0.92236328125, 1.1005859375, 1.27880859375, 1.45703125, 1.63525390625, 1.8134765625, 1.99169921875, 2.169921875, 2.34814453125, 2.5263671875, 2.70458984375, 2.8828125, 3.06103515625, 3.2392578125, 3.41748046875, 3.595703125, 3.77392578125, 3.9521484375, 4.13037109375, 4.30859375, 4.48681640625, 4.6650390625, 4.84326171875, 5.021484375, 5.19970703125, 5.3779296875, 5.55615234375, 5.734375]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 6.0, 11.0, 17.0, 11.0, 13.0, 9.0, 23.0, 18.0, 30.0, 25.0, 36.0, 35.0, 40.0, 34.0, 44.0, 35.0, 39.0, 44.0, 39.0, 49.0, 34.0, 43.0, 45.0, 35.0, 31.0, 29.0, 25.0, 21.0, 17.0, 17.0, 33.0, 17.0, 14.0, 14.0, 15.0, 7.0, 7.0, 2.0, 8.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.669567108154297, -11.289685249328613, -10.909804344177246, -10.529922485351562, -10.150041580200195, -9.770159721374512, -9.390277862548828, -9.010396957397461, -8.630515098571777, -8.250633239746094, -7.870752334594727, -7.490870475769043, -7.110989093780518, -6.731107711791992, -6.351225852966309, -5.971344470977783, -5.591463088989258, -5.211581707000732, -4.831700325012207, -4.451818466186523, -4.071937084197998, -3.6920557022094727, -3.312174081802368, -2.9322924613952637, -2.5524110794067383, -2.172529697418213, -1.7926480770111084, -1.4127665758132935, -1.0328850746154785, -0.6530035734176636, -0.27312207221984863, 0.10675954818725586, 0.48664188385009766, 0.8665233850479126, 1.2464048862457275, 1.6262863874435425, 2.0061678886413574, 2.386049270629883, 2.7659308910369873, 3.145812511444092, 3.525693893432617, 3.9055752754211426, 4.285456657409668, 4.665338516235352, 5.045219898223877, 5.425101280212402, 5.804983139038086, 6.184864521026611, 6.564745903015137, 6.944627285003662, 7.3245086669921875, 7.704390525817871, 8.084272384643555, 8.464153289794922, 8.844035148620605, 9.223917007446289, 9.603797912597656, 9.98367977142334, 10.363560676574707, 10.74344253540039, 11.123323440551758, 11.503205299377441, 11.883087158203125, 12.262968063354492, 12.642849922180176]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 12.0, 8.0, 11.0, 15.0, 21.0, 19.0, 19.0, 15.0, 27.0, 27.0, 34.0, 35.0, 37.0, 25.0, 27.0, 41.0, 34.0, 39.0, 41.0, 49.0, 58.0, 44.0, 34.0, 41.0, 27.0, 28.0, 27.0, 29.0, 22.0, 26.0, 12.0, 16.0, 19.0, 24.0, 6.0, 7.0, 7.0, 6.0, 4.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-14.782143592834473, -14.375288009643555, -13.968433380126953, -13.561577796936035, -13.154722213745117, -12.7478666305542, -12.341011047363281, -11.93415641784668, -11.527300834655762, -11.120445251464844, -10.713590621948242, -10.306735038757324, -9.899879455566406, -9.493023872375488, -9.08616828918457, -8.679313659667969, -8.27245807647705, -7.865602493286133, -7.458747386932373, -7.051892280578613, -6.645036697387695, -6.238181114196777, -5.831326007843018, -5.424470901489258, -5.01761531829834, -4.610759735107422, -4.203904628753662, -3.7970492839813232, -3.3901939392089844, -2.9833385944366455, -2.5764832496643066, -2.1696279048919678, -1.7627735137939453, -1.3559181690216064, -0.9490628242492676, -0.5422074794769287, -0.13535213470458984, 0.271503210067749, 0.6783585548400879, 1.0852138996124268, 1.4920692443847656, 1.8989245891571045, 2.3057799339294434, 2.7126352787017822, 3.119490623474121, 3.52634596824646, 3.933201313018799, 4.340056419372559, 4.746912002563477, 5.1537675857543945, 5.560622692108154, 5.967477798461914, 6.374333381652832, 6.78118896484375, 7.18804407119751, 7.5948991775512695, 8.001754760742188, 8.408610343933105, 8.815465927124023, 9.222320556640625, 9.629176139831543, 10.036031723022461, 10.442886352539062, 10.84974193572998, 11.256597518920898]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 16.0, 26.0, 27.0, 40.0, 78.0, 125.0, 214.0, 403.0, 648.0, 1147.0, 1814.0, 2903.0, 4788.0, 7843.0, 12885.0, 20388.0, 32266.0, 49855.0, 75222.0, 110449.0, 156918.0, 213369.0, 277208.0, 341757.0, 393017.0, 423335.0, 421333.0, 388022.0, 332092.0, 267876.0, 205201.0, 149828.0, 104591.0, 71417.0, 46863.0, 30644.0, 19205.0, 12042.0, 7203.0, 4608.0, 2734.0, 1577.0, 947.0, 568.0, 328.0, 182.0, 105.0, 79.0, 36.0, 28.0, 11.0, 12.0, 8.0, 1.0, 4.0], "bins": [-11.109375, -10.791259765625, -10.47314453125, -10.155029296875, -9.8369140625, -9.518798828125, -9.20068359375, -8.882568359375, -8.564453125, -8.246337890625, -7.92822265625, -7.610107421875, -7.2919921875, -6.973876953125, -6.65576171875, -6.337646484375, -6.01953125, -5.701416015625, -5.38330078125, -5.065185546875, -4.7470703125, -4.428955078125, -4.11083984375, -3.792724609375, -3.474609375, -3.156494140625, -2.83837890625, -2.520263671875, -2.2021484375, -1.884033203125, -1.56591796875, -1.247802734375, -0.9296875, -0.611572265625, -0.29345703125, 0.024658203125, 0.3427734375, 0.660888671875, 0.97900390625, 1.297119140625, 1.615234375, 1.933349609375, 2.25146484375, 2.569580078125, 2.8876953125, 3.205810546875, 3.52392578125, 3.842041015625, 4.16015625, 4.478271484375, 4.79638671875, 5.114501953125, 5.4326171875, 5.750732421875, 6.06884765625, 6.386962890625, 6.705078125, 7.023193359375, 7.34130859375, 7.659423828125, 7.9775390625, 8.295654296875, 8.61376953125, 8.931884765625, 9.25]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 8.0, 6.0, 10.0, 14.0, 9.0, 21.0, 25.0, 21.0, 33.0, 28.0, 25.0, 27.0, 33.0, 34.0, 29.0, 47.0, 46.0, 65.0, 52.0, 42.0, 41.0, 49.0, 37.0, 33.0, 39.0, 33.0, 33.0, 18.0, 28.0, 22.0, 20.0, 15.0, 10.0, 3.0, 12.0, 3.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-12.5546875, -12.18701171875, -11.8193359375, -11.45166015625, -11.083984375, -10.71630859375, -10.3486328125, -9.98095703125, -9.61328125, -9.24560546875, -8.8779296875, -8.51025390625, -8.142578125, -7.77490234375, -7.4072265625, -7.03955078125, -6.671875, -6.30419921875, -5.9365234375, -5.56884765625, -5.201171875, -4.83349609375, -4.4658203125, -4.09814453125, -3.73046875, -3.36279296875, -2.9951171875, -2.62744140625, -2.259765625, -1.89208984375, -1.5244140625, -1.15673828125, -0.7890625, -0.42138671875, -0.0537109375, 0.31396484375, 0.681640625, 1.04931640625, 1.4169921875, 1.78466796875, 2.15234375, 2.52001953125, 2.8876953125, 3.25537109375, 3.623046875, 3.99072265625, 4.3583984375, 4.72607421875, 5.09375, 5.46142578125, 5.8291015625, 6.19677734375, 6.564453125, 6.93212890625, 7.2998046875, 7.66748046875, 8.03515625, 8.40283203125, 8.7705078125, 9.13818359375, 9.505859375, 9.87353515625, 10.2412109375, 10.60888671875, 10.9765625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 6.0, 5.0, 1.0, 12.0, 23.0, 25.0, 35.0, 55.0, 94.0, 167.0, 263.0, 474.0, 728.0, 1180.0, 1887.0, 3066.0, 5032.0, 7822.0, 12528.0, 19524.0, 29487.0, 44200.0, 65041.0, 92261.0, 125748.0, 167476.0, 212904.0, 261196.0, 305356.0, 340450.0, 362183.0, 362258.0, 347262.0, 312777.0, 270878.0, 224453.0, 176565.0, 134046.0, 98293.0, 70050.0, 48319.0, 31990.0, 21292.0, 13736.0, 8679.0, 5551.0, 3413.0, 2146.0, 1329.0, 774.0, 484.0, 287.0, 201.0, 116.0, 61.0, 47.0, 29.0, 12.0, 7.0, 7.0, 5.0, 4.0, 3.0], "bins": [-9.609375, -9.31005859375, -9.0107421875, -8.71142578125, -8.412109375, -8.11279296875, -7.8134765625, -7.51416015625, -7.21484375, -6.91552734375, -6.6162109375, -6.31689453125, -6.017578125, -5.71826171875, -5.4189453125, -5.11962890625, -4.8203125, -4.52099609375, -4.2216796875, -3.92236328125, -3.623046875, -3.32373046875, -3.0244140625, -2.72509765625, -2.42578125, -2.12646484375, -1.8271484375, -1.52783203125, -1.228515625, -0.92919921875, -0.6298828125, -0.33056640625, -0.03125, 0.26806640625, 0.5673828125, 0.86669921875, 1.166015625, 1.46533203125, 1.7646484375, 2.06396484375, 2.36328125, 2.66259765625, 2.9619140625, 3.26123046875, 3.560546875, 3.85986328125, 4.1591796875, 4.45849609375, 4.7578125, 5.05712890625, 5.3564453125, 5.65576171875, 5.955078125, 6.25439453125, 6.5537109375, 6.85302734375, 7.15234375, 7.45166015625, 7.7509765625, 8.05029296875, 8.349609375, 8.64892578125, 8.9482421875, 9.24755859375, 9.546875]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 8.0, 5.0, 19.0, 14.0, 22.0, 22.0, 33.0, 35.0, 41.0, 50.0, 70.0, 68.0, 97.0, 93.0, 123.0, 128.0, 130.0, 139.0, 159.0, 199.0, 188.0, 172.0, 164.0, 197.0, 171.0, 173.0, 180.0, 154.0, 166.0, 132.0, 143.0, 116.0, 100.0, 96.0, 85.0, 72.0, 62.0, 46.0, 43.0, 31.0, 21.0, 20.0, 21.0, 18.0, 18.0, 4.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.6796875, -5.50433349609375, -5.3289794921875, -5.15362548828125, -4.978271484375, -4.80291748046875, -4.6275634765625, -4.45220947265625, -4.27685546875, -4.10150146484375, -3.9261474609375, -3.75079345703125, -3.575439453125, -3.40008544921875, -3.2247314453125, -3.04937744140625, -2.8740234375, -2.69866943359375, -2.5233154296875, -2.34796142578125, -2.172607421875, -1.99725341796875, -1.8218994140625, -1.64654541015625, -1.47119140625, -1.29583740234375, -1.1204833984375, -0.94512939453125, -0.769775390625, -0.59442138671875, -0.4190673828125, -0.24371337890625, -0.068359375, 0.10699462890625, 0.2823486328125, 0.45770263671875, 0.633056640625, 0.80841064453125, 0.9837646484375, 1.15911865234375, 1.33447265625, 1.50982666015625, 1.6851806640625, 1.86053466796875, 2.035888671875, 2.21124267578125, 2.3865966796875, 2.56195068359375, 2.7373046875, 2.91265869140625, 3.0880126953125, 3.26336669921875, 3.438720703125, 3.61407470703125, 3.7894287109375, 3.96478271484375, 4.14013671875, 4.31549072265625, 4.4908447265625, 4.66619873046875, 4.841552734375, 5.01690673828125, 5.1922607421875, 5.36761474609375, 5.54296875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 17.0, 5.0, 12.0, 24.0, 22.0, 17.0, 16.0, 27.0, 37.0, 27.0, 41.0, 55.0, 34.0, 31.0, 43.0, 48.0, 39.0, 53.0, 40.0, 60.0, 44.0, 31.0, 21.0, 36.0, 34.0, 32.0, 29.0, 25.0, 17.0, 17.0, 9.0, 10.0, 6.0, 9.0, 5.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.15325927734375, -15.683693885803223, -15.214129447937012, -14.744564056396484, -14.274999618530273, -13.805434226989746, -13.335868835449219, -12.866304397583008, -12.39673900604248, -11.927173614501953, -11.457609176635742, -10.988043785095215, -10.518479347229004, -10.048913955688477, -9.579349517822266, -9.109784126281738, -8.640218734741211, -8.170653343200684, -7.701088905334473, -7.231523513793945, -6.761958599090576, -6.292393684387207, -5.822828769683838, -5.353263854980469, -4.883699417114258, -4.414134502410889, -3.9445693492889404, -3.4750044345855713, -3.005439281463623, -2.535874366760254, -2.0663094520568848, -1.5967442989349365, -1.1271791458129883, -0.6576141119003296, -0.18804913759231567, 0.28151583671569824, 0.7510808706283569, 1.2206459045410156, 1.6902108192443848, 2.159775972366333, 2.629340887069702, 3.0989058017730713, 3.5684709548950195, 4.038035869598389, 4.507600784301758, 4.977166175842285, 5.446730613708496, 5.916296005249023, 6.385860919952393, 6.855425834655762, 7.324990749359131, 7.7945556640625, 8.264121055603027, 8.733686447143555, 9.203250885009766, 9.672816276550293, 10.142380714416504, 10.611946105957031, 11.081510543823242, 11.55107593536377, 12.02064037322998, 12.490205764770508, 12.959770202636719, 13.429335594177246, 13.898900985717773]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 3.0, 6.0, 9.0, 8.0, 15.0, 13.0, 15.0, 22.0, 17.0, 23.0, 32.0, 27.0, 29.0, 33.0, 33.0, 28.0, 29.0, 42.0, 33.0, 34.0, 37.0, 43.0, 37.0, 41.0, 31.0, 34.0, 20.0, 33.0, 38.0, 30.0, 29.0, 22.0, 16.0, 19.0, 16.0, 17.0, 18.0, 13.0, 8.0, 8.0, 9.0, 6.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.451967239379883, -13.9970703125, -13.542173385620117, -13.087276458740234, -12.632379531860352, -12.177482604980469, -11.722585678100586, -11.267688751220703, -10.81279182434082, -10.357894897460938, -9.902997970581055, -9.448101043701172, -8.993204116821289, -8.538307189941406, -8.083410263061523, -7.628513336181641, -7.173616886138916, -6.718719959259033, -6.26382303237915, -5.808926105499268, -5.354029178619385, -4.89913272857666, -4.444235801696777, -3.9893386363983154, -3.5344417095184326, -3.07954478263855, -2.624647855758667, -2.1697511672973633, -1.714854121208191, -1.2599573135375977, -0.8050603866577148, -0.35016345977783203, 0.10473346710205078, 0.5596303939819336, 1.0145273208618164, 1.4694241285324097, 1.9243210554122925, 2.3792178630828857, 2.8341147899627686, 3.2890117168426514, 3.743908643722534, 4.198805332183838, 4.653702259063721, 5.1085991859436035, 5.563496112823486, 6.018393039703369, 6.473289966583252, 6.928186893463135, 7.383083820343018, 7.8379807472229, 8.292877197265625, 8.747774124145508, 9.20267105102539, 9.657567977905273, 10.112464904785156, 10.567361831665039, 11.022258758544922, 11.477155685424805, 11.932052612304688, 12.38694953918457, 12.841846466064453, 13.296743392944336, 13.751640319824219, 14.206537246704102, 14.661434173583984]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 7.0, 3.0, 7.0, 7.0, 14.0, 31.0, 40.0, 63.0, 102.0, 149.0, 227.0, 292.0, 506.0, 738.0, 1146.0, 1670.0, 2637.0, 4207.0, 6502.0, 10352.0, 16450.0, 26602.0, 43346.0, 70075.0, 107988.0, 150442.0, 170796.0, 147656.0, 106085.0, 68031.0, 42427.0, 26157.0, 15986.0, 9976.0, 6320.0, 4010.0, 2573.0, 1686.0, 1124.0, 746.0, 434.0, 338.0, 217.0, 139.0, 85.0, 73.0, 31.0, 26.0, 14.0, 13.0, 7.0, 9.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.109375, -19.449462890625, -18.78955078125, -18.129638671875, -17.4697265625, -16.809814453125, -16.14990234375, -15.489990234375, -14.830078125, -14.170166015625, -13.51025390625, -12.850341796875, -12.1904296875, -11.530517578125, -10.87060546875, -10.210693359375, -9.55078125, -8.890869140625, -8.23095703125, -7.571044921875, -6.9111328125, -6.251220703125, -5.59130859375, -4.931396484375, -4.271484375, -3.611572265625, -2.95166015625, -2.291748046875, -1.6318359375, -0.971923828125, -0.31201171875, 0.347900390625, 1.0078125, 1.667724609375, 2.32763671875, 2.987548828125, 3.6474609375, 4.307373046875, 4.96728515625, 5.627197265625, 6.287109375, 6.947021484375, 7.60693359375, 8.266845703125, 8.9267578125, 9.586669921875, 10.24658203125, 10.906494140625, 11.56640625, 12.226318359375, 12.88623046875, 13.546142578125, 14.2060546875, 14.865966796875, 15.52587890625, 16.185791015625, 16.845703125, 17.505615234375, 18.16552734375, 18.825439453125, 19.4853515625, 20.145263671875, 20.80517578125, 21.465087890625, 22.125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 5.0, 11.0, 8.0, 10.0, 15.0, 20.0, 15.0, 25.0, 27.0, 28.0, 29.0, 25.0, 32.0, 41.0, 40.0, 39.0, 42.0, 36.0, 38.0, 45.0, 39.0, 37.0, 32.0, 41.0, 34.0, 23.0, 36.0, 26.0, 35.0, 23.0, 19.0, 22.0, 15.0, 11.0, 15.0, 13.0, 9.0, 10.0, 3.0, 9.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.640625, -16.1402587890625, -15.639892578125, -15.1395263671875, -14.63916015625, -14.1387939453125, -13.638427734375, -13.1380615234375, -12.6376953125, -12.1373291015625, -11.636962890625, -11.1365966796875, -10.63623046875, -10.1358642578125, -9.635498046875, -9.1351318359375, -8.634765625, -8.1343994140625, -7.634033203125, -7.1336669921875, -6.63330078125, -6.1329345703125, -5.632568359375, -5.1322021484375, -4.6318359375, -4.1314697265625, -3.631103515625, -3.1307373046875, -2.63037109375, -2.1300048828125, -1.629638671875, -1.1292724609375, -0.62890625, -0.1285400390625, 0.371826171875, 0.8721923828125, 1.37255859375, 1.8729248046875, 2.373291015625, 2.8736572265625, 3.3740234375, 3.8743896484375, 4.374755859375, 4.8751220703125, 5.37548828125, 5.8758544921875, 6.376220703125, 6.8765869140625, 7.376953125, 7.8773193359375, 8.377685546875, 8.8780517578125, 9.37841796875, 9.8787841796875, 10.379150390625, 10.8795166015625, 11.3798828125, 11.8802490234375, 12.380615234375, 12.8809814453125, 13.38134765625, 13.8817138671875, 14.382080078125, 14.8824462890625, 15.3828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 6.0, 8.0, 11.0, 16.0, 25.0, 25.0, 50.0, 79.0, 126.0, 227.0, 342.0, 562.0, 1016.0, 1920.0, 3830.0, 8574.0, 19737.0, 52198.0, 157798.0, 415827.0, 254207.0, 80043.0, 29148.0, 11772.0, 5351.0, 2557.0, 1313.0, 688.0, 394.0, 250.0, 173.0, 89.0, 61.0, 35.0, 24.0, 16.0, 11.0, 6.0, 14.0, 9.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-49.4375, -47.92578125, -46.4140625, -44.90234375, -43.390625, -41.87890625, -40.3671875, -38.85546875, -37.34375, -35.83203125, -34.3203125, -32.80859375, -31.296875, -29.78515625, -28.2734375, -26.76171875, -25.25, -23.73828125, -22.2265625, -20.71484375, -19.203125, -17.69140625, -16.1796875, -14.66796875, -13.15625, -11.64453125, -10.1328125, -8.62109375, -7.109375, -5.59765625, -4.0859375, -2.57421875, -1.0625, 0.44921875, 1.9609375, 3.47265625, 4.984375, 6.49609375, 8.0078125, 9.51953125, 11.03125, 12.54296875, 14.0546875, 15.56640625, 17.078125, 18.58984375, 20.1015625, 21.61328125, 23.125, 24.63671875, 26.1484375, 27.66015625, 29.171875, 30.68359375, 32.1953125, 33.70703125, 35.21875, 36.73046875, 38.2421875, 39.75390625, 41.265625, 42.77734375, 44.2890625, 45.80078125, 47.3125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 6.0, 5.0, 7.0, 11.0, 16.0, 14.0, 10.0, 19.0, 17.0, 22.0, 36.0, 20.0, 29.0, 31.0, 31.0, 43.0, 53.0, 39.0, 53.0, 51.0, 55.0, 38.0, 43.0, 39.0, 43.0, 30.0, 36.0, 29.0, 16.0, 15.0, 28.0, 14.0, 30.0, 6.0, 15.0, 6.0, 8.0, 8.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.9375, -11.5555419921875, -11.173583984375, -10.7916259765625, -10.40966796875, -10.0277099609375, -9.645751953125, -9.2637939453125, -8.8818359375, -8.4998779296875, -8.117919921875, -7.7359619140625, -7.35400390625, -6.9720458984375, -6.590087890625, -6.2081298828125, -5.826171875, -5.4442138671875, -5.062255859375, -4.6802978515625, -4.29833984375, -3.9163818359375, -3.534423828125, -3.1524658203125, -2.7705078125, -2.3885498046875, -2.006591796875, -1.6246337890625, -1.24267578125, -0.8607177734375, -0.478759765625, -0.0968017578125, 0.28515625, 0.6671142578125, 1.049072265625, 1.4310302734375, 1.81298828125, 2.1949462890625, 2.576904296875, 2.9588623046875, 3.3408203125, 3.7227783203125, 4.104736328125, 4.4866943359375, 4.86865234375, 5.2506103515625, 5.632568359375, 6.0145263671875, 6.396484375, 6.7784423828125, 7.160400390625, 7.5423583984375, 7.92431640625, 8.3062744140625, 8.688232421875, 9.0701904296875, 9.4521484375, 9.8341064453125, 10.216064453125, 10.5980224609375, 10.97998046875, 11.3619384765625, 11.743896484375, 12.1258544921875, 12.5078125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 10.0, 9.0, 6.0, 17.0, 16.0, 30.0, 34.0, 51.0, 73.0, 98.0, 140.0, 204.0, 267.0, 427.0, 608.0, 889.0, 1399.0, 2283.0, 3578.0, 5979.0, 10382.0, 18568.0, 34782.0, 71366.0, 161513.0, 322093.0, 218835.0, 94940.0, 44525.0, 23129.0, 12698.0, 7401.0, 4404.0, 2686.0, 1725.0, 1096.0, 690.0, 461.0, 336.0, 206.0, 177.0, 111.0, 75.0, 62.0, 60.0, 28.0, 20.0, 18.0, 15.0, 7.0, 9.0, 8.0, 4.0, 4.0, 0.0, 1.0, 4.0], "bins": [-21.71875, -21.05419921875, -20.3896484375, -19.72509765625, -19.060546875, -18.39599609375, -17.7314453125, -17.06689453125, -16.40234375, -15.73779296875, -15.0732421875, -14.40869140625, -13.744140625, -13.07958984375, -12.4150390625, -11.75048828125, -11.0859375, -10.42138671875, -9.7568359375, -9.09228515625, -8.427734375, -7.76318359375, -7.0986328125, -6.43408203125, -5.76953125, -5.10498046875, -4.4404296875, -3.77587890625, -3.111328125, -2.44677734375, -1.7822265625, -1.11767578125, -0.453125, 0.21142578125, 0.8759765625, 1.54052734375, 2.205078125, 2.86962890625, 3.5341796875, 4.19873046875, 4.86328125, 5.52783203125, 6.1923828125, 6.85693359375, 7.521484375, 8.18603515625, 8.8505859375, 9.51513671875, 10.1796875, 10.84423828125, 11.5087890625, 12.17333984375, 12.837890625, 13.50244140625, 14.1669921875, 14.83154296875, 15.49609375, 16.16064453125, 16.8251953125, 17.48974609375, 18.154296875, 18.81884765625, 19.4833984375, 20.14794921875, 20.8125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 6.0, 10.0, 20.0, 16.0, 13.0, 29.0, 36.0, 41.0, 53.0, 63.0, 77.0, 85.0, 81.0, 74.0, 78.0, 61.0, 48.0, 47.0, 33.0, 19.0, 14.0, 11.0, 7.0, 10.0, 12.0, 9.0, 5.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010509490966796875, -0.0010192692279815674, -0.0009875893592834473, -0.0009559094905853271, -0.000924229621887207, -0.0008925497531890869, -0.0008608698844909668, -0.0008291900157928467, -0.0007975101470947266, -0.0007658302783966064, -0.0007341504096984863, -0.0007024705410003662, -0.0006707906723022461, -0.000639110803604126, -0.0006074309349060059, -0.0005757510662078857, -0.0005440711975097656, -0.0005123913288116455, -0.0004807114601135254, -0.0004490315914154053, -0.00041735172271728516, -0.00038567185401916504, -0.0003539919853210449, -0.0003223121166229248, -0.0002906322479248047, -0.00025895237922668457, -0.00022727251052856445, -0.00019559264183044434, -0.00016391277313232422, -0.0001322329044342041, -0.00010055303573608398, -6.887316703796387e-05, -3.719329833984375e-05, -5.513429641723633e-06, 2.6166439056396484e-05, 5.78463077545166e-05, 8.952617645263672e-05, 0.00012120604515075684, 0.00015288591384887695, 0.00018456578254699707, 0.0002162456512451172, 0.0002479255199432373, 0.0002796053886413574, 0.00031128525733947754, 0.00034296512603759766, 0.0003746449947357178, 0.0004063248634338379, 0.000438004732131958, 0.0004696846008300781, 0.0005013644695281982, 0.0005330443382263184, 0.0005647242069244385, 0.0005964040756225586, 0.0006280839443206787, 0.0006597638130187988, 0.0006914436817169189, 0.0007231235504150391, 0.0007548034191131592, 0.0007864832878112793, 0.0008181631565093994, 0.0008498430252075195, 0.0008815228939056396, 0.0009132027626037598, 0.0009448826313018799, 0.0009765625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 6.0, 1.0, 4.0, 3.0, 6.0, 13.0, 16.0, 17.0, 27.0, 45.0, 43.0, 96.0, 128.0, 176.0, 271.0, 370.0, 554.0, 935.0, 1389.0, 2085.0, 3394.0, 5404.0, 8370.0, 13640.0, 21593.0, 34300.0, 53489.0, 81477.0, 116963.0, 149156.0, 156301.0, 130265.0, 94889.0, 62875.0, 40483.0, 25610.0, 16105.0, 10241.0, 6499.0, 4022.0, 2511.0, 1658.0, 1007.0, 750.0, 460.0, 309.0, 200.0, 133.0, 86.0, 58.0, 46.0, 30.0, 21.0, 11.0, 9.0, 8.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-12.6171875, -12.212646484375, -11.80810546875, -11.403564453125, -10.9990234375, -10.594482421875, -10.18994140625, -9.785400390625, -9.380859375, -8.976318359375, -8.57177734375, -8.167236328125, -7.7626953125, -7.358154296875, -6.95361328125, -6.549072265625, -6.14453125, -5.739990234375, -5.33544921875, -4.930908203125, -4.5263671875, -4.121826171875, -3.71728515625, -3.312744140625, -2.908203125, -2.503662109375, -2.09912109375, -1.694580078125, -1.2900390625, -0.885498046875, -0.48095703125, -0.076416015625, 0.328125, 0.732666015625, 1.13720703125, 1.541748046875, 1.9462890625, 2.350830078125, 2.75537109375, 3.159912109375, 3.564453125, 3.968994140625, 4.37353515625, 4.778076171875, 5.1826171875, 5.587158203125, 5.99169921875, 6.396240234375, 6.80078125, 7.205322265625, 7.60986328125, 8.014404296875, 8.4189453125, 8.823486328125, 9.22802734375, 9.632568359375, 10.037109375, 10.441650390625, 10.84619140625, 11.250732421875, 11.6552734375, 12.059814453125, 12.46435546875, 12.868896484375, 13.2734375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 7.0, 13.0, 15.0, 18.0, 14.0, 19.0, 31.0, 33.0, 36.0, 46.0, 44.0, 53.0, 50.0, 62.0, 67.0, 46.0, 62.0, 59.0, 52.0, 36.0, 34.0, 37.0, 23.0, 19.0, 22.0, 17.0, 17.0, 18.0, 7.0, 5.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-7.359375, -7.15576171875, -6.9521484375, -6.74853515625, -6.544921875, -6.34130859375, -6.1376953125, -5.93408203125, -5.73046875, -5.52685546875, -5.3232421875, -5.11962890625, -4.916015625, -4.71240234375, -4.5087890625, -4.30517578125, -4.1015625, -3.89794921875, -3.6943359375, -3.49072265625, -3.287109375, -3.08349609375, -2.8798828125, -2.67626953125, -2.47265625, -2.26904296875, -2.0654296875, -1.86181640625, -1.658203125, -1.45458984375, -1.2509765625, -1.04736328125, -0.84375, -0.64013671875, -0.4365234375, -0.23291015625, -0.029296875, 0.17431640625, 0.3779296875, 0.58154296875, 0.78515625, 0.98876953125, 1.1923828125, 1.39599609375, 1.599609375, 1.80322265625, 2.0068359375, 2.21044921875, 2.4140625, 2.61767578125, 2.8212890625, 3.02490234375, 3.228515625, 3.43212890625, 3.6357421875, 3.83935546875, 4.04296875, 4.24658203125, 4.4501953125, 4.65380859375, 4.857421875, 5.06103515625, 5.2646484375, 5.46826171875, 5.671875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 7.0, 12.0, 11.0, 8.0, 10.0, 13.0, 14.0, 18.0, 28.0, 26.0, 23.0, 40.0, 38.0, 38.0, 38.0, 42.0, 48.0, 41.0, 46.0, 40.0, 52.0, 37.0, 43.0, 28.0, 31.0, 27.0, 35.0, 33.0, 33.0, 26.0, 22.0, 22.0, 19.0, 11.0, 6.0, 9.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.263439178466797, -15.781574249267578, -15.299710273742676, -14.817845344543457, -14.335980415344238, -13.854116439819336, -13.372251510620117, -12.890386581420898, -12.408522605895996, -11.926657676696777, -11.444793701171875, -10.962928771972656, -10.481063842773438, -9.999199867248535, -9.517334938049316, -9.035470962524414, -8.553606033325195, -8.071741104125977, -7.589876651763916, -7.1080121994018555, -6.626147747039795, -6.144283294677734, -5.662418365478516, -5.180553913116455, -4.698688507080078, -4.216824054718018, -3.734959363937378, -3.2530946731567383, -2.7712302207946777, -2.289365530014038, -1.8075008392333984, -1.325636386871338, -0.8437719345092773, -0.36190733313560486, 0.11995726823806763, 0.6018218994140625, 1.0836864709854126, 1.5655510425567627, 2.0474157333374023, 2.529280185699463, 3.0111448764801025, 3.493009567260742, 3.9748740196228027, 4.456738471984863, 4.938603401184082, 5.420467853546143, 5.902332305908203, 6.384197235107422, 6.866061687469482, 7.347926139831543, 7.829791069030762, 8.311655044555664, 8.793519973754883, 9.275384902954102, 9.75724983215332, 10.239113807678223, 10.720978736877441, 11.20284366607666, 11.684707641601562, 12.166572570800781, 12.6484375, 13.130301475524902, 13.612166404724121, 14.094030380249023, 14.575895309448242]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 6.0, 7.0, 10.0, 7.0, 14.0, 10.0, 14.0, 19.0, 12.0, 23.0, 18.0, 27.0, 25.0, 28.0, 22.0, 38.0, 31.0, 39.0, 35.0, 44.0, 38.0, 27.0, 25.0, 34.0, 43.0, 34.0, 29.0, 26.0, 32.0, 28.0, 24.0, 21.0, 35.0, 25.0, 25.0, 18.0, 22.0, 17.0, 13.0, 7.0, 11.0, 8.0, 3.0, 5.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-14.83842658996582, -14.390618324279785, -13.94281005859375, -13.495000839233398, -13.047192573547363, -12.599384307861328, -12.151575088500977, -11.703766822814941, -11.255958557128906, -10.808150291442871, -10.360342025756836, -9.912532806396484, -9.46472454071045, -9.016916275024414, -8.569107055664062, -8.121298789978027, -7.673490524291992, -7.225682258605957, -6.777873516082764, -6.33006477355957, -5.882256507873535, -5.4344482421875, -4.986639499664307, -4.538830757141113, -4.091022491455078, -3.643213987350464, -3.1954054832458496, -2.7475969791412354, -2.299788475036621, -1.8519799709320068, -1.4041714668273926, -0.9563629627227783, -0.5085544586181641, -0.060745954513549805, 0.38706254959106445, 0.8348710536956787, 1.282679557800293, 1.7304880619049072, 2.1782965660095215, 2.6261050701141357, 3.07391357421875, 3.5217220783233643, 3.9695305824279785, 4.417339324951172, 4.865147590637207, 5.312955856323242, 5.7607645988464355, 6.208573341369629, 6.656381607055664, 7.104189872741699, 7.551998615264893, 7.999807357788086, 8.447615623474121, 8.895423889160156, 9.343233108520508, 9.791041374206543, 10.238849639892578, 10.686657905578613, 11.134466171264648, 11.582275390625, 12.030083656311035, 12.47789192199707, 12.925701141357422, 13.373509407043457, 13.821317672729492]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 9.0, 7.0, 14.0, 26.0, 29.0, 39.0, 58.0, 88.0, 122.0, 194.0, 317.0, 465.0, 794.0, 1320.0, 2343.0, 4080.0, 7681.0, 13734.0, 24736.0, 43733.0, 74758.0, 116495.0, 157523.0, 173947.0, 153314.0, 110160.0, 69845.0, 40674.0, 23204.0, 12590.0, 6944.0, 3793.0, 2230.0, 1237.0, 737.0, 468.0, 296.0, 176.0, 146.0, 72.0, 51.0, 30.0, 20.0, 16.0, 13.0, 12.0, 5.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.03125, -15.521240234375, -15.01123046875, -14.501220703125, -13.9912109375, -13.481201171875, -12.97119140625, -12.461181640625, -11.951171875, -11.441162109375, -10.93115234375, -10.421142578125, -9.9111328125, -9.401123046875, -8.89111328125, -8.381103515625, -7.87109375, -7.361083984375, -6.85107421875, -6.341064453125, -5.8310546875, -5.321044921875, -4.81103515625, -4.301025390625, -3.791015625, -3.281005859375, -2.77099609375, -2.260986328125, -1.7509765625, -1.240966796875, -0.73095703125, -0.220947265625, 0.2890625, 0.799072265625, 1.30908203125, 1.819091796875, 2.3291015625, 2.839111328125, 3.34912109375, 3.859130859375, 4.369140625, 4.879150390625, 5.38916015625, 5.899169921875, 6.4091796875, 6.919189453125, 7.42919921875, 7.939208984375, 8.44921875, 8.959228515625, 9.46923828125, 9.979248046875, 10.4892578125, 10.999267578125, 11.50927734375, 12.019287109375, 12.529296875, 13.039306640625, 13.54931640625, 14.059326171875, 14.5693359375, 15.079345703125, 15.58935546875, 16.099365234375, 16.609375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 2.0, 8.0, 3.0, 5.0, 5.0, 7.0, 11.0, 8.0, 12.0, 13.0, 17.0, 10.0, 13.0, 17.0, 22.0, 34.0, 27.0, 39.0, 25.0, 33.0, 29.0, 37.0, 40.0, 41.0, 36.0, 35.0, 29.0, 30.0, 35.0, 26.0, 31.0, 36.0, 33.0, 18.0, 32.0, 32.0, 27.0, 24.0, 26.0, 19.0, 18.0, 13.0, 12.0, 7.0, 10.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.453125, -13.0250244140625, -12.596923828125, -12.1688232421875, -11.74072265625, -11.3126220703125, -10.884521484375, -10.4564208984375, -10.0283203125, -9.6002197265625, -9.172119140625, -8.7440185546875, -8.31591796875, -7.8878173828125, -7.459716796875, -7.0316162109375, -6.603515625, -6.1754150390625, -5.747314453125, -5.3192138671875, -4.89111328125, -4.4630126953125, -4.034912109375, -3.6068115234375, -3.1787109375, -2.7506103515625, -2.322509765625, -1.8944091796875, -1.46630859375, -1.0382080078125, -0.610107421875, -0.1820068359375, 0.24609375, 0.6741943359375, 1.102294921875, 1.5303955078125, 1.95849609375, 2.3865966796875, 2.814697265625, 3.2427978515625, 3.6708984375, 4.0989990234375, 4.527099609375, 4.9552001953125, 5.38330078125, 5.8114013671875, 6.239501953125, 6.6676025390625, 7.095703125, 7.5238037109375, 7.951904296875, 8.3800048828125, 8.80810546875, 9.2362060546875, 9.664306640625, 10.0924072265625, 10.5205078125, 10.9486083984375, 11.376708984375, 11.8048095703125, 12.23291015625, 12.6610107421875, 13.089111328125, 13.5172119140625, 13.9453125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 7.0, 10.0, 10.0, 27.0, 35.0, 50.0, 81.0, 137.0, 213.0, 307.0, 490.0, 735.0, 1149.0, 1771.0, 2887.0, 4399.0, 6862.0, 11408.0, 18982.0, 31467.0, 54488.0, 91878.0, 144396.0, 186089.0, 175730.0, 125285.0, 76637.0, 44756.0, 26357.0, 15809.0, 9710.0, 5986.0, 3730.0, 2378.0, 1482.0, 1031.0, 629.0, 418.0, 261.0, 172.0, 104.0, 65.0, 48.0, 24.0, 22.0, 19.0, 11.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-23.03125, -22.350341796875, -21.66943359375, -20.988525390625, -20.3076171875, -19.626708984375, -18.94580078125, -18.264892578125, -17.583984375, -16.903076171875, -16.22216796875, -15.541259765625, -14.8603515625, -14.179443359375, -13.49853515625, -12.817626953125, -12.13671875, -11.455810546875, -10.77490234375, -10.093994140625, -9.4130859375, -8.732177734375, -8.05126953125, -7.370361328125, -6.689453125, -6.008544921875, -5.32763671875, -4.646728515625, -3.9658203125, -3.284912109375, -2.60400390625, -1.923095703125, -1.2421875, -0.561279296875, 0.11962890625, 0.800537109375, 1.4814453125, 2.162353515625, 2.84326171875, 3.524169921875, 4.205078125, 4.885986328125, 5.56689453125, 6.247802734375, 6.9287109375, 7.609619140625, 8.29052734375, 8.971435546875, 9.65234375, 10.333251953125, 11.01416015625, 11.695068359375, 12.3759765625, 13.056884765625, 13.73779296875, 14.418701171875, 15.099609375, 15.780517578125, 16.46142578125, 17.142333984375, 17.8232421875, 18.504150390625, 19.18505859375, 19.865966796875, 20.546875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 4.0, 10.0, 6.0, 13.0, 13.0, 11.0, 14.0, 19.0, 16.0, 26.0, 21.0, 30.0, 28.0, 27.0, 29.0, 45.0, 40.0, 43.0, 39.0, 52.0, 43.0, 48.0, 27.0, 43.0, 45.0, 34.0, 31.0, 35.0, 27.0, 25.0, 27.0, 17.0, 23.0, 20.0, 15.0, 11.0, 11.0, 7.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.265625, -9.897216796875, -9.52880859375, -9.160400390625, -8.7919921875, -8.423583984375, -8.05517578125, -7.686767578125, -7.318359375, -6.949951171875, -6.58154296875, -6.213134765625, -5.8447265625, -5.476318359375, -5.10791015625, -4.739501953125, -4.37109375, -4.002685546875, -3.63427734375, -3.265869140625, -2.8974609375, -2.529052734375, -2.16064453125, -1.792236328125, -1.423828125, -1.055419921875, -0.68701171875, -0.318603515625, 0.0498046875, 0.418212890625, 0.78662109375, 1.155029296875, 1.5234375, 1.891845703125, 2.26025390625, 2.628662109375, 2.9970703125, 3.365478515625, 3.73388671875, 4.102294921875, 4.470703125, 4.839111328125, 5.20751953125, 5.575927734375, 5.9443359375, 6.312744140625, 6.68115234375, 7.049560546875, 7.41796875, 7.786376953125, 8.15478515625, 8.523193359375, 8.8916015625, 9.260009765625, 9.62841796875, 9.996826171875, 10.365234375, 10.733642578125, 11.10205078125, 11.470458984375, 11.8388671875, 12.207275390625, 12.57568359375, 12.944091796875, 13.3125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 4.0, 4.0, 6.0, 10.0, 18.0, 15.0, 26.0, 33.0, 57.0, 59.0, 99.0, 147.0, 201.0, 342.0, 555.0, 891.0, 1479.0, 2730.0, 4751.0, 9173.0, 17668.0, 34769.0, 68788.0, 129800.0, 225899.0, 241341.0, 147936.0, 78443.0, 39851.0, 20175.0, 10386.0, 5493.0, 2972.0, 1660.0, 1031.0, 580.0, 417.0, 233.0, 150.0, 106.0, 76.0, 66.0, 28.0, 30.0, 25.0, 16.0, 8.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4609375, -11.0531005859375, -10.645263671875, -10.2374267578125, -9.82958984375, -9.4217529296875, -9.013916015625, -8.6060791015625, -8.1982421875, -7.7904052734375, -7.382568359375, -6.9747314453125, -6.56689453125, -6.1590576171875, -5.751220703125, -5.3433837890625, -4.935546875, -4.5277099609375, -4.119873046875, -3.7120361328125, -3.30419921875, -2.8963623046875, -2.488525390625, -2.0806884765625, -1.6728515625, -1.2650146484375, -0.857177734375, -0.4493408203125, -0.04150390625, 0.3663330078125, 0.774169921875, 1.1820068359375, 1.58984375, 1.9976806640625, 2.405517578125, 2.8133544921875, 3.22119140625, 3.6290283203125, 4.036865234375, 4.4447021484375, 4.8525390625, 5.2603759765625, 5.668212890625, 6.0760498046875, 6.48388671875, 6.8917236328125, 7.299560546875, 7.7073974609375, 8.115234375, 8.5230712890625, 8.930908203125, 9.3387451171875, 9.74658203125, 10.1544189453125, 10.562255859375, 10.9700927734375, 11.3779296875, 11.7857666015625, 12.193603515625, 12.6014404296875, 13.00927734375, 13.4171142578125, 13.824951171875, 14.2327880859375, 14.640625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 8.0, 12.0, 12.0, 14.0, 22.0, 25.0, 31.0, 26.0, 25.0, 43.0, 35.0, 38.0, 63.0, 62.0, 56.0, 58.0, 66.0, 58.0, 48.0, 42.0, 44.0, 37.0, 27.0, 23.0, 21.0, 21.0, 15.0, 8.0, 6.0, 7.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0011396408081054688, -0.0011090263724327087, -0.0010784119367599487, -0.0010477975010871887, -0.0010171830654144287, -0.0009865686297416687, -0.0009559541940689087, -0.0009253397583961487, -0.0008947253227233887, -0.0008641108870506287, -0.0008334964513778687, -0.0008028820157051086, -0.0007722675800323486, -0.0007416531443595886, -0.0007110387086868286, -0.0006804242730140686, -0.0006498098373413086, -0.0006191954016685486, -0.0005885809659957886, -0.0005579665303230286, -0.0005273520946502686, -0.0004967376589775085, -0.00046612322330474854, -0.0004355087876319885, -0.0004048943519592285, -0.0003742799162864685, -0.0003436654806137085, -0.0003130510449409485, -0.0002824366092681885, -0.00025182217359542847, -0.00022120773792266846, -0.00019059330224990845, -0.00015997886657714844, -0.00012936443090438843, -9.874999523162842e-05, -6.813555955886841e-05, -3.75211238861084e-05, -6.906688213348389e-06, 2.370774745941162e-05, 5.432218313217163e-05, 8.493661880493164e-05, 0.00011555105447769165, 0.00014616549015045166, 0.00017677992582321167, 0.00020739436149597168, 0.0002380087971687317, 0.0002686232328414917, 0.0002992376685142517, 0.0003298521041870117, 0.00036046653985977173, 0.00039108097553253174, 0.00042169541120529175, 0.00045230984687805176, 0.00048292428255081177, 0.0005135387182235718, 0.0005441531538963318, 0.0005747675895690918, 0.0006053820252418518, 0.0006359964609146118, 0.0006666108965873718, 0.0006972253322601318, 0.0007278397679328918, 0.0007584542036056519, 0.0007890686392784119, 0.0008196830749511719]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 10.0, 24.0, 23.0, 27.0, 73.0, 78.0, 118.0, 205.0, 289.0, 407.0, 600.0, 938.0, 1400.0, 2293.0, 3770.0, 6668.0, 11836.0, 22774.0, 46715.0, 96658.0, 176234.0, 240477.0, 200860.0, 116673.0, 57727.0, 27845.0, 14110.0, 7945.0, 4265.0, 2666.0, 1671.0, 1076.0, 703.0, 469.0, 272.0, 216.0, 134.0, 89.0, 66.0, 59.0, 21.0, 16.0, 12.0, 15.0, 8.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0], "bins": [-17.765625, -17.2528076171875, -16.739990234375, -16.2271728515625, -15.71435546875, -15.2015380859375, -14.688720703125, -14.1759033203125, -13.6630859375, -13.1502685546875, -12.637451171875, -12.1246337890625, -11.61181640625, -11.0989990234375, -10.586181640625, -10.0733642578125, -9.560546875, -9.0477294921875, -8.534912109375, -8.0220947265625, -7.50927734375, -6.9964599609375, -6.483642578125, -5.9708251953125, -5.4580078125, -4.9451904296875, -4.432373046875, -3.9195556640625, -3.40673828125, -2.8939208984375, -2.381103515625, -1.8682861328125, -1.35546875, -0.8426513671875, -0.329833984375, 0.1829833984375, 0.69580078125, 1.2086181640625, 1.721435546875, 2.2342529296875, 2.7470703125, 3.2598876953125, 3.772705078125, 4.2855224609375, 4.79833984375, 5.3111572265625, 5.823974609375, 6.3367919921875, 6.849609375, 7.3624267578125, 7.875244140625, 8.3880615234375, 8.90087890625, 9.4136962890625, 9.926513671875, 10.4393310546875, 10.9521484375, 11.4649658203125, 11.977783203125, 12.4906005859375, 13.00341796875, 13.5162353515625, 14.029052734375, 14.5418701171875, 15.0546875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 5.0, 16.0, 18.0, 14.0, 32.0, 31.0, 54.0, 61.0, 86.0, 69.0, 94.0, 73.0, 79.0, 74.0, 61.0, 45.0, 35.0, 26.0, 19.0, 13.0, 17.0, 11.0, 7.0, 11.0, 2.0, 3.0, 1.0, 5.0, 2.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.77105712890625, -5.5694580078125, -5.36785888671875, -5.166259765625, -4.96466064453125, -4.7630615234375, -4.56146240234375, -4.35986328125, -4.15826416015625, -3.9566650390625, -3.75506591796875, -3.553466796875, -3.35186767578125, -3.1502685546875, -2.94866943359375, -2.7470703125, -2.54547119140625, -2.3438720703125, -2.14227294921875, -1.940673828125, -1.73907470703125, -1.5374755859375, -1.33587646484375, -1.13427734375, -0.93267822265625, -0.7310791015625, -0.52947998046875, -0.327880859375, -0.12628173828125, 0.0753173828125, 0.27691650390625, 0.478515625, 0.68011474609375, 0.8817138671875, 1.08331298828125, 1.284912109375, 1.48651123046875, 1.6881103515625, 1.88970947265625, 2.09130859375, 2.29290771484375, 2.4945068359375, 2.69610595703125, 2.897705078125, 3.09930419921875, 3.3009033203125, 3.50250244140625, 3.7041015625, 3.90570068359375, 4.1072998046875, 4.30889892578125, 4.510498046875, 4.71209716796875, 4.9136962890625, 5.11529541015625, 5.31689453125, 5.51849365234375, 5.7200927734375, 5.92169189453125, 6.123291015625, 6.32489013671875, 6.5264892578125, 6.72808837890625, 6.9296875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 12.0, 6.0, 9.0, 7.0, 19.0, 13.0, 14.0, 16.0, 23.0, 32.0, 43.0, 29.0, 42.0, 41.0, 43.0, 38.0, 49.0, 40.0, 42.0, 47.0, 37.0, 45.0, 39.0, 25.0, 39.0, 36.0, 22.0, 26.0, 35.0, 29.0, 10.0, 17.0, 22.0, 13.0, 14.0, 7.0, 3.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.376142501831055, -15.858060836791992, -15.33997917175293, -14.821898460388184, -14.303816795349121, -13.785735130310059, -13.267654418945312, -12.74957275390625, -12.231491088867188, -11.713409423828125, -11.195327758789062, -10.677247047424316, -10.159165382385254, -9.641083717346191, -9.123003005981445, -8.604921340942383, -8.08683967590332, -7.568758010864258, -7.0506768226623535, -6.532595634460449, -6.014513969421387, -5.496432304382324, -4.97835111618042, -4.460269927978516, -3.942188262939453, -3.4241068363189697, -2.9060254096984863, -2.387943983078003, -1.8698625564575195, -1.3517811298370361, -0.8336997032165527, -0.31561827659606934, 0.20246124267578125, 0.7205426692962646, 1.238624095916748, 1.7567055225372314, 2.274786949157715, 2.7928683757781982, 3.3109498023986816, 3.829031229019165, 4.347112655639648, 4.865194320678711, 5.383275508880615, 5.9013566970825195, 6.419438362121582, 6.9375200271606445, 7.455601215362549, 7.973682403564453, 8.491764068603516, 9.009845733642578, 9.52792739868164, 10.046008110046387, 10.56408977508545, 11.082171440124512, 11.600252151489258, 12.11833381652832, 12.636415481567383, 13.154497146606445, 13.672578811645508, 14.190659523010254, 14.708741188049316, 15.226822853088379, 15.744903564453125, 16.262985229492188, 16.78106689453125]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 12.0, 6.0, 8.0, 13.0, 13.0, 20.0, 22.0, 14.0, 17.0, 31.0, 34.0, 33.0, 55.0, 40.0, 46.0, 38.0, 46.0, 43.0, 37.0, 47.0, 42.0, 36.0, 34.0, 45.0, 32.0, 34.0, 28.0, 29.0, 22.0, 14.0, 20.0, 16.0, 19.0, 6.0, 8.0, 8.0, 8.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.71037483215332, -22.04431915283203, -21.37826156616211, -20.71220588684082, -20.04615020751953, -19.38009262084961, -18.71403694152832, -18.04798126220703, -17.38192367553711, -16.71586799621582, -16.0498104095459, -15.38375473022461, -14.717698097229004, -14.051641464233398, -13.38558578491211, -12.719529151916504, -12.053473472595215, -11.38741683959961, -10.72136116027832, -10.055304527282715, -9.38924789428711, -8.72319221496582, -8.057135581970215, -7.391078948974609, -6.725022792816162, -6.058966636657715, -5.392910003662109, -4.726853847503662, -4.060797691345215, -3.3947410583496094, -2.728684902191162, -2.0626282691955566, -1.3965721130371094, -0.7305157780647278, -0.06445944309234619, 0.6015968322753906, 1.267653226852417, 1.9337096214294434, 2.5997657775878906, 3.265822410583496, 3.9318785667419434, 4.597934722900391, 5.263991355895996, 5.930047512054443, 6.596103668212891, 7.262160301208496, 7.928216457366943, 8.59427261352539, 9.260329246520996, 9.926385879516602, 10.59244155883789, 11.258498191833496, 11.924554824829102, 12.59061050415039, 13.256667137145996, 13.922723770141602, 14.58877944946289, 15.254836082458496, 15.920891761779785, 16.58694839477539, 17.25300407409668, 17.9190616607666, 18.58511734008789, 19.251174926757812, 19.9172306060791]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 9.0, 12.0, 18.0, 38.0, 50.0, 75.0, 118.0, 178.0, 223.0, 346.0, 491.0, 706.0, 926.0, 1282.0, 1720.0, 2236.0, 2758.0, 3473.0, 4443.0, 6147.0, 476723.0, 5267.0, 4092.0, 3098.0, 2500.0, 1933.0, 1511.0, 1155.0, 809.0, 623.0, 430.0, 292.0, 187.0, 133.0, 98.0, 65.0, 34.0, 25.0, 19.0, 9.0, 6.0, 4.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.20637512207031, -106.01193237304688, -101.8174819946289, -97.62303161621094, -93.4285888671875, -89.23414611816406, -85.0396957397461, -80.84524536132812, -76.65080261230469, -72.45635986328125, -68.26190948486328, -64.06745910644531, -59.873016357421875, -55.67856979370117, -51.48412322998047, -47.289676666259766, -43.09523010253906, -38.90078353881836, -34.706336975097656, -30.511890411376953, -26.31744384765625, -22.122997283935547, -17.928550720214844, -13.73410415649414, -9.539657592773438, -5.345211029052734, -1.1507644653320312, 3.043682098388672, 7.238128662109375, 11.432575225830078, 15.627021789550781, 19.821468353271484, 24.015914916992188, 28.21036148071289, 32.404808044433594, 36.5992546081543, 40.793701171875, 44.9881477355957, 49.182594299316406, 53.37704086303711, 57.57148742675781, 61.765933990478516, 65.96038055419922, 70.15483093261719, 74.34927368164062, 78.54371643066406, 82.73816680908203, 86.9326171875, 91.12705993652344, 95.32150268554688, 99.51595306396484, 103.71040344238281, 107.90484619140625, 112.09928894042969, 116.29373931884766, 120.48818969726562, 124.68263244628906, 128.8770751953125, 133.071533203125, 137.26597595214844, 141.46041870117188, 145.6548614501953, 149.84930419921875, 154.04376220703125, 158.2382049560547]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 9.0, 11.0, 4.0, 9.0, 11.0, 13.0, 19.0, 17.0, 17.0, 20.0, 37.0, 28.0, 29.0, 51.0, 35.0, 54.0, 40.0, 38.0, 56.0, 1062.0, 41.0, 37.0, 43.0, 31.0, 51.0, 34.0, 33.0, 23.0, 35.0, 22.0, 17.0, 17.0, 14.0, 23.0, 5.0, 11.0, 7.0, 10.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-718.29931640625, -697.1889038085938, -676.0785522460938, -654.9681396484375, -633.8577880859375, -612.7473754882812, -591.6370239257812, -570.526611328125, -549.416259765625, -528.3058471679688, -507.19549560546875, -486.0851135253906, -464.9747314453125, -443.8643493652344, -422.75396728515625, -401.6435546875, -380.5331726074219, -359.42279052734375, -338.3124084472656, -317.2020263671875, -296.0916442871094, -274.98126220703125, -253.87086486816406, -232.76048278808594, -211.6501007080078, -190.5397186279297, -169.42933654785156, -148.31893920898438, -127.20856475830078, -106.09818267822266, -84.98779296875, -63.877410888671875, -42.76702880859375, -21.656644821166992, -0.5462608337402344, 20.564125061035156, 41.67450714111328, 62.784889221191406, 83.89527893066406, 105.00566101074219, 126.11604309082031, 147.22642517089844, 168.33680725097656, 189.44720458984375, 210.55758666992188, 231.66796875, 252.77835083007812, 273.88873291015625, 294.9991149902344, 316.1094970703125, 337.2198791503906, 358.33026123046875, 379.4406433105469, 400.551025390625, 421.66143798828125, 442.77178955078125, 463.8822021484375, 484.9925842285156, 506.10296630859375, 527.21337890625, 548.32373046875, 569.4341430664062, 590.5444946289062, 611.6549072265625, 632.7652587890625]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 13.0, 9.0, 15.0, 24.0, 24.0, 28.0, 49.0, 72.0, 100.0, 172.0, 252.0, 382.0, 700.0, 1043.0, 1911.0, 3618.0, 6907.0, 12515.0, 21324.0, 35100.0, 62409.0, 30923968.0, 96678.0, 44997.0, 21843.0, 10183.0, 4790.0, 2383.0, 1271.0, 680.0, 383.0, 231.0, 153.0, 83.0, 43.0, 49.0, 33.0, 19.0, 19.0, 8.0, 7.0, 5.0, 5.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-132.5502166748047, -128.20663452148438, -123.86306762695312, -119.51948547363281, -115.17591094970703, -110.83233642578125, -106.48875427246094, -102.14517974853516, -97.80160522460938, -93.4580307006836, -89.11445617675781, -84.7708740234375, -80.42729949951172, -76.08372497558594, -71.74014282226562, -67.39656829833984, -63.05299377441406, -58.70941925048828, -54.365840911865234, -50.02226257324219, -45.678688049316406, -41.335113525390625, -36.99153518676758, -32.64795684814453, -28.30438232421875, -23.960805892944336, -19.617229461669922, -15.273653030395508, -10.930076599121094, -6.58650016784668, -2.2429237365722656, 2.1006526947021484, 6.444244384765625, 10.787820816040039, 15.131397247314453, 19.474973678588867, 23.81855010986328, 28.162126541137695, 32.50570297241211, 36.849281311035156, 41.19285583496094, 45.53643035888672, 49.880008697509766, 54.22358703613281, 58.567161560058594, 62.910736083984375, 67.25431823730469, 71.59789276123047, 75.94146728515625, 80.28504180908203, 84.62861633300781, 88.97219848632812, 93.3157730102539, 97.65934753417969, 102.0029296875, 106.34650421142578, 110.69007873535156, 115.03365325927734, 119.37722778320312, 123.72080993652344, 128.06439208984375, 132.407958984375, 136.7515411376953, 141.09510803222656, 145.43869018554688]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 5.0, 6.0, 8.0, 10.0, 18.0, 20.0, 26.0, 55.0, 54.0, 98.0, 172.0, 232.0, 370.0, 561.0, 826.0, 1393.0, 2171.0, 3419.0, 5682.0, 9716.0, 16815.0, 29776.0, 54921.0, 105296.0, 213290.0, 465317.0, 1097328.0, 2116713.0, 1186540.0, 500302.0, 230454.0, 113041.0, 59121.0, 32124.0, 18076.0, 10457.0, 6314.0, 3872.0, 2478.0, 1467.0, 974.0, 630.0, 414.0, 252.0, 185.0, 128.0, 101.0, 77.0, 45.0, 31.0, 30.0, 13.0, 5.0, 4.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0], "bins": [-18.109375, -17.53515625, -16.9609375, -16.38671875, -15.8125, -15.23828125, -14.6640625, -14.08984375, -13.515625, -12.94140625, -12.3671875, -11.79296875, -11.21875, -10.64453125, -10.0703125, -9.49609375, -8.921875, -8.34765625, -7.7734375, -7.19921875, -6.625, -6.05078125, -5.4765625, -4.90234375, -4.328125, -3.75390625, -3.1796875, -2.60546875, -2.03125, -1.45703125, -0.8828125, -0.30859375, 0.265625, 0.83984375, 1.4140625, 1.98828125, 2.5625, 3.13671875, 3.7109375, 4.28515625, 4.859375, 5.43359375, 6.0078125, 6.58203125, 7.15625, 7.73046875, 8.3046875, 8.87890625, 9.453125, 10.02734375, 10.6015625, 11.17578125, 11.75, 12.32421875, 12.8984375, 13.47265625, 14.046875, 14.62109375, 15.1953125, 15.76953125, 16.34375, 16.91796875, 17.4921875, 18.06640625, 18.640625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 6.0, 9.0, 7.0, 14.0, 10.0, 20.0, 23.0, 29.0, 32.0, 37.0, 41.0, 65.0, 74.0, 73.0, 96.0, 131.0, 143.0, 139.0, 159.0, 163.0, 135.0, 121.0, 83.0, 71.0, 70.0, 46.0, 43.0, 48.0, 29.0, 20.0, 15.0, 12.0, 10.0, 8.0, 10.0, 5.0, 4.0, 5.0, 3.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -8.0330810546875, -7.761474609375, -7.4898681640625, -7.21826171875, -6.9466552734375, -6.675048828125, -6.4034423828125, -6.1318359375, -5.8602294921875, -5.588623046875, -5.3170166015625, -5.04541015625, -4.7738037109375, -4.502197265625, -4.2305908203125, -3.958984375, -3.6873779296875, -3.415771484375, -3.1441650390625, -2.87255859375, -2.6009521484375, -2.329345703125, -2.0577392578125, -1.7861328125, -1.5145263671875, -1.242919921875, -0.9713134765625, -0.69970703125, -0.4281005859375, -0.156494140625, 0.1151123046875, 0.38671875, 0.6583251953125, 0.929931640625, 1.2015380859375, 1.47314453125, 1.7447509765625, 2.016357421875, 2.2879638671875, 2.5595703125, 2.8311767578125, 3.102783203125, 3.3743896484375, 3.64599609375, 3.9176025390625, 4.189208984375, 4.4608154296875, 4.732421875, 5.0040283203125, 5.275634765625, 5.5472412109375, 5.81884765625, 6.0904541015625, 6.362060546875, 6.6336669921875, 6.9052734375, 7.1768798828125, 7.448486328125, 7.7200927734375, 7.99169921875, 8.2633056640625, 8.534912109375, 8.8065185546875, 9.078125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 7.0, 4.0, 7.0, 19.0, 30.0, 35.0, 42.0, 55.0, 77.0, 96.0, 188.0, 267.0, 484.0, 682.0, 980.0, 1550.0, 2627.0, 4134.0, 7099.0, 12181.0, 21298.0, 37972.0, 68924.0, 125261.0, 231106.0, 439759.0, 951087.0, 1978589.0, 1246510.0, 543076.0, 278619.0, 150122.0, 82127.0, 45817.0, 25518.0, 14498.0, 8217.0, 4848.0, 2789.0, 1713.0, 1091.0, 754.0, 391.0, 257.0, 158.0, 130.0, 89.0, 59.0, 45.0, 18.0, 15.0, 10.0, 5.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.2109375, -7.943115234375, -7.67529296875, -7.407470703125, -7.1396484375, -6.871826171875, -6.60400390625, -6.336181640625, -6.068359375, -5.800537109375, -5.53271484375, -5.264892578125, -4.9970703125, -4.729248046875, -4.46142578125, -4.193603515625, -3.92578125, -3.657958984375, -3.39013671875, -3.122314453125, -2.8544921875, -2.586669921875, -2.31884765625, -2.051025390625, -1.783203125, -1.515380859375, -1.24755859375, -0.979736328125, -0.7119140625, -0.444091796875, -0.17626953125, 0.091552734375, 0.359375, 0.627197265625, 0.89501953125, 1.162841796875, 1.4306640625, 1.698486328125, 1.96630859375, 2.234130859375, 2.501953125, 2.769775390625, 3.03759765625, 3.305419921875, 3.5732421875, 3.841064453125, 4.10888671875, 4.376708984375, 4.64453125, 4.912353515625, 5.18017578125, 5.447998046875, 5.7158203125, 5.983642578125, 6.25146484375, 6.519287109375, 6.787109375, 7.054931640625, 7.32275390625, 7.590576171875, 7.8583984375, 8.126220703125, 8.39404296875, 8.661865234375, 8.9296875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 7.0, 17.0, 17.0, 30.0, 26.0, 31.0, 36.0, 49.0, 50.0, 74.0, 93.0, 107.0, 164.0, 172.0, 187.0, 200.0, 150.0, 131.0, 71.0, 63.0, 56.0, 43.0, 30.0, 37.0, 37.0, 30.0, 16.0, 20.0, 10.0, 11.0, 9.0, 12.0, 8.0, 3.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.421875, -9.08642578125, -8.7509765625, -8.41552734375, -8.080078125, -7.74462890625, -7.4091796875, -7.07373046875, -6.73828125, -6.40283203125, -6.0673828125, -5.73193359375, -5.396484375, -5.06103515625, -4.7255859375, -4.39013671875, -4.0546875, -3.71923828125, -3.3837890625, -3.04833984375, -2.712890625, -2.37744140625, -2.0419921875, -1.70654296875, -1.37109375, -1.03564453125, -0.7001953125, -0.36474609375, -0.029296875, 0.30615234375, 0.6416015625, 0.97705078125, 1.3125, 1.64794921875, 1.9833984375, 2.31884765625, 2.654296875, 2.98974609375, 3.3251953125, 3.66064453125, 3.99609375, 4.33154296875, 4.6669921875, 5.00244140625, 5.337890625, 5.67333984375, 6.0087890625, 6.34423828125, 6.6796875, 7.01513671875, 7.3505859375, 7.68603515625, 8.021484375, 8.35693359375, 8.6923828125, 9.02783203125, 9.36328125, 9.69873046875, 10.0341796875, 10.36962890625, 10.705078125, 11.04052734375, 11.3759765625, 11.71142578125, 12.046875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 7.0, 7.0, 11.0, 12.0, 10.0, 25.0, 37.0, 45.0, 73.0, 99.0, 114.0, 159.0, 213.0, 278.0, 417.0, 634.0, 977.0, 1512.0, 2330.0, 3869.0, 6301.0, 10458.0, 18539.0, 34522.0, 75121.0, 292258.0, 5598999.0, 133247.0, 49720.0, 25564.0, 14053.0, 8313.0, 4750.0, 2970.0, 1991.0, 1226.0, 821.0, 545.0, 350.0, 233.0, 159.0, 137.0, 90.0, 63.0, 39.0, 33.0, 24.0, 21.0, 9.0, 18.0, 8.0, 6.0, 4.0, 5.0, 2.0, 4.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-21.03125, -20.259765625, -19.48828125, -18.716796875, -17.9453125, -17.173828125, -16.40234375, -15.630859375, -14.859375, -14.087890625, -13.31640625, -12.544921875, -11.7734375, -11.001953125, -10.23046875, -9.458984375, -8.6875, -7.916015625, -7.14453125, -6.373046875, -5.6015625, -4.830078125, -4.05859375, -3.287109375, -2.515625, -1.744140625, -0.97265625, -0.201171875, 0.5703125, 1.341796875, 2.11328125, 2.884765625, 3.65625, 4.427734375, 5.19921875, 5.970703125, 6.7421875, 7.513671875, 8.28515625, 9.056640625, 9.828125, 10.599609375, 11.37109375, 12.142578125, 12.9140625, 13.685546875, 14.45703125, 15.228515625, 16.0, 16.771484375, 17.54296875, 18.314453125, 19.0859375, 19.857421875, 20.62890625, 21.400390625, 22.171875, 22.943359375, 23.71484375, 24.486328125, 25.2578125, 26.029296875, 26.80078125, 27.572265625, 28.34375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 3.0, 11.0, 15.0, 23.0, 23.0, 32.0, 33.0, 37.0, 48.0, 46.0, 69.0, 189.0, 340.0, 451.0, 250.0, 109.0, 65.0, 57.0, 38.0, 47.0, 41.0, 25.0, 19.0, 11.0, 11.0, 10.0, 7.0, 7.0, 1.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.59375, -23.794677734375, -22.99560546875, -22.196533203125, -21.3974609375, -20.598388671875, -19.79931640625, -19.000244140625, -18.201171875, -17.402099609375, -16.60302734375, -15.803955078125, -15.0048828125, -14.205810546875, -13.40673828125, -12.607666015625, -11.80859375, -11.009521484375, -10.21044921875, -9.411376953125, -8.6123046875, -7.813232421875, -7.01416015625, -6.215087890625, -5.416015625, -4.616943359375, -3.81787109375, -3.018798828125, -2.2197265625, -1.420654296875, -0.62158203125, 0.177490234375, 0.9765625, 1.775634765625, 2.57470703125, 3.373779296875, 4.1728515625, 4.971923828125, 5.77099609375, 6.570068359375, 7.369140625, 8.168212890625, 8.96728515625, 9.766357421875, 10.5654296875, 11.364501953125, 12.16357421875, 12.962646484375, 13.76171875, 14.560791015625, 15.35986328125, 16.158935546875, 16.9580078125, 17.757080078125, 18.55615234375, 19.355224609375, 20.154296875, 20.953369140625, 21.75244140625, 22.551513671875, 23.3505859375, 24.149658203125, 24.94873046875, 25.747802734375, 26.546875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 4.0, 9.0, 12.0, 18.0, 31.0, 65.0, 103.0, 260.0, 257.0, 84.0, 46.0, 28.0, 24.0, 14.0, 5.0, 7.0, 8.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-324.64801025390625, -311.16864013671875, -297.6892395019531, -284.2098693847656, -270.73046875, -257.2510986328125, -243.77169799804688, -230.29232788085938, -216.81292724609375, -203.3335418701172, -189.85415649414062, -176.37477111816406, -162.8953857421875, -149.416015625, -135.93661499023438, -122.45723724365234, -108.97785949707031, -95.49847412109375, -82.01908874511719, -68.53970336914062, -55.06032180786133, -41.58094024658203, -28.10155487060547, -14.622169494628906, -1.1427841186523438, 12.336600303649902, 25.81598472595215, 39.29536819458008, 52.77475357055664, 66.25413513183594, 79.7335205078125, 93.21290588378906, 106.69229125976562, 120.17167663574219, 133.65106201171875, 147.1304473876953, 160.60983276367188, 174.08920288085938, 187.568603515625, 201.0479736328125, 214.52737426757812, 228.0067596435547, 241.48614501953125, 254.9655303955078, 268.4449157714844, 281.9242858886719, 295.4036865234375, 308.883056640625, 322.3624267578125, 335.841796875, 349.3211975097656, 362.8005676269531, 376.27996826171875, 389.75933837890625, 403.2387390136719, 416.7181091308594, 430.197509765625, 443.6768798828125, 457.1562805175781, 470.6356506347656, 484.11505126953125, 497.59442138671875, 511.0738220214844, 524.55322265625, 538.0325927734375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 5.0, 10.0, 8.0, 5.0, 10.0, 6.0, 8.0, 22.0, 29.0, 56.0, 114.0, 260.0, 195.0, 89.0, 56.0, 24.0, 27.0, 12.0, 10.0, 7.0, 12.0, 6.0, 3.0, 4.0, 1.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-729.6953125, -711.3696899414062, -693.0440673828125, -674.7184448242188, -656.392822265625, -638.0671997070312, -619.7415771484375, -601.4158935546875, -583.09033203125, -564.7647094726562, -546.4390869140625, -528.1134643554688, -509.787841796875, -491.46221923828125, -473.1365661621094, -454.8109436035156, -436.48529052734375, -418.15966796875, -399.83404541015625, -381.5084228515625, -363.18280029296875, -344.857177734375, -326.5315246582031, -308.2059020996094, -289.8802795410156, -271.5546569824219, -253.22903442382812, -234.9033966064453, -216.57777404785156, -198.2521514892578, -179.926513671875, -161.60089111328125, -143.27529907226562, -124.94967651367188, -106.6240463256836, -88.29841613769531, -69.97279357910156, -51.64717102050781, -33.32154083251953, -14.99591064453125, 3.3297119140625, 21.655338287353516, 39.98096466064453, 58.30659103393555, 76.63221740722656, 94.95783996582031, 113.2834701538086, 131.60910034179688, 149.93472290039062, 168.26034545898438, 186.58596801757812, 204.91160583496094, 223.2372283935547, 241.56285095214844, 259.88848876953125, 278.214111328125, 296.53973388671875, 314.8653564453125, 333.19097900390625, 351.5166015625, 369.84222412109375, 388.1678466796875, 406.4934997558594, 424.8191223144531, 443.1447448730469]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 5.0, 5.0, 7.0, 4.0, 11.0, 9.0, 17.0, 20.0, 29.0, 41.0, 51.0, 59.0, 99.0, 113.0, 167.0, 247.0, 306.0, 421.0, 632.0, 837.0, 1221.0, 1877.0, 2775.0, 4220.0, 7041.0, 11723.0, 20730.0, 41095.0, 105848.0, 1414874.0, 2389219.0, 98198.0, 37182.0, 19713.0, 11483.0, 7230.0, 4910.0, 3194.0, 2335.0, 1690.0, 1224.0, 882.0, 659.0, 466.0, 390.0, 276.0, 204.0, 159.0, 110.0, 81.0, 58.0, 38.0, 30.0, 20.0, 20.0, 17.0, 9.0, 4.0, 8.0, 5.0, 1.0, 0.0, 1.0], "bins": [-3.4375, -3.32672119140625, -3.2159423828125, -3.10516357421875, -2.994384765625, -2.88360595703125, -2.7728271484375, -2.66204833984375, -2.55126953125, -2.44049072265625, -2.3297119140625, -2.21893310546875, -2.108154296875, -1.99737548828125, -1.8865966796875, -1.77581787109375, -1.6650390625, -1.55426025390625, -1.4434814453125, -1.33270263671875, -1.221923828125, -1.11114501953125, -1.0003662109375, -0.88958740234375, -0.77880859375, -0.66802978515625, -0.5572509765625, -0.44647216796875, -0.335693359375, -0.22491455078125, -0.1141357421875, -0.00335693359375, 0.107421875, 0.21820068359375, 0.3289794921875, 0.43975830078125, 0.550537109375, 0.66131591796875, 0.7720947265625, 0.88287353515625, 0.99365234375, 1.10443115234375, 1.2152099609375, 1.32598876953125, 1.436767578125, 1.54754638671875, 1.6583251953125, 1.76910400390625, 1.8798828125, 1.99066162109375, 2.1014404296875, 2.21221923828125, 2.322998046875, 2.43377685546875, 2.5445556640625, 2.65533447265625, 2.76611328125, 2.87689208984375, 2.9876708984375, 3.09844970703125, 3.209228515625, 3.32000732421875, 3.4307861328125, 3.54156494140625, 3.65234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 3.0, 9.0, 5.0, 7.0, 13.0, 5.0, 10.0, 18.0, 28.0, 48.0, 334.0, 339.0, 63.0, 34.0, 10.0, 11.0, 10.0, 10.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.473876953125, -0.4585990905761719, -0.44332122802734375, -0.4280433654785156, -0.4127655029296875, -0.3974876403808594, -0.38220977783203125, -0.3669319152832031, -0.351654052734375, -0.3363761901855469, -0.32109832763671875, -0.3058204650878906, -0.2905426025390625, -0.2752647399902344, -0.25998687744140625, -0.24470901489257812, -0.22943115234375, -0.21415328979492188, -0.19887542724609375, -0.18359756469726562, -0.1683197021484375, -0.15304183959960938, -0.13776397705078125, -0.12248611450195312, -0.107208251953125, -0.09193038940429688, -0.07665252685546875, -0.061374664306640625, -0.0460968017578125, -0.030818939208984375, -0.01554107666015625, -0.000263214111328125, 0.0150146484375, 0.030292510986328125, 0.04557037353515625, 0.060848236083984375, 0.0761260986328125, 0.09140396118164062, 0.10668182373046875, 0.12195968627929688, 0.137237548828125, 0.15251541137695312, 0.16779327392578125, 0.18307113647460938, 0.1983489990234375, 0.21362686157226562, 0.22890472412109375, 0.24418258666992188, 0.25946044921875, 0.2747383117675781, 0.29001617431640625, 0.3052940368652344, 0.3205718994140625, 0.3358497619628906, 0.35112762451171875, 0.3664054870605469, 0.381683349609375, 0.3969612121582031, 0.41223907470703125, 0.4275169372558594, 0.4427947998046875, 0.4580726623535156, 0.47335052490234375, 0.4886283874511719, 0.50390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 6.0, 9.0, 13.0, 14.0, 22.0, 31.0, 60.0, 93.0, 139.0, 244.0, 422.0, 834.0, 1533.0, 3457.0, 8939.0, 29609.0, 160614.0, 2704609.0, 1151472.0, 97829.0, 21387.0, 6999.0, 2802.0, 1357.0, 764.0, 351.0, 261.0, 127.0, 106.0, 56.0, 47.0, 25.0, 15.0, 13.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.05859375, -5.87969970703125, -5.7008056640625, -5.52191162109375, -5.343017578125, -5.16412353515625, -4.9852294921875, -4.80633544921875, -4.62744140625, -4.44854736328125, -4.2696533203125, -4.09075927734375, -3.911865234375, -3.73297119140625, -3.5540771484375, -3.37518310546875, -3.1962890625, -3.01739501953125, -2.8385009765625, -2.65960693359375, -2.480712890625, -2.30181884765625, -2.1229248046875, -1.94403076171875, -1.76513671875, -1.58624267578125, -1.4073486328125, -1.22845458984375, -1.049560546875, -0.87066650390625, -0.6917724609375, -0.51287841796875, -0.333984375, -0.15509033203125, 0.0238037109375, 0.20269775390625, 0.381591796875, 0.56048583984375, 0.7393798828125, 0.91827392578125, 1.09716796875, 1.27606201171875, 1.4549560546875, 1.63385009765625, 1.812744140625, 1.99163818359375, 2.1705322265625, 2.34942626953125, 2.5283203125, 2.70721435546875, 2.8861083984375, 3.06500244140625, 3.243896484375, 3.42279052734375, 3.6016845703125, 3.78057861328125, 3.95947265625, 4.13836669921875, 4.3172607421875, 4.49615478515625, 4.675048828125, 4.85394287109375, 5.0328369140625, 5.21173095703125, 5.390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 8.0, 8.0, 6.0, 9.0, 12.0, 22.0, 19.0, 22.0, 40.0, 55.0, 64.0, 78.0, 118.0, 135.0, 173.0, 247.0, 305.0, 468.0, 597.0, 421.0, 288.0, 215.0, 171.0, 127.0, 105.0, 60.0, 65.0, 50.0, 43.0, 25.0, 29.0, 28.0, 22.0, 14.0, 5.0, 8.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.169921875, -1.1348419189453125, -1.099761962890625, -1.0646820068359375, -1.02960205078125, -0.9945220947265625, -0.959442138671875, -0.9243621826171875, -0.8892822265625, -0.8542022705078125, -0.819122314453125, -0.7840423583984375, -0.74896240234375, -0.7138824462890625, -0.678802490234375, -0.6437225341796875, -0.608642578125, -0.5735626220703125, -0.538482666015625, -0.5034027099609375, -0.46832275390625, -0.4332427978515625, -0.398162841796875, -0.3630828857421875, -0.3280029296875, -0.2929229736328125, -0.257843017578125, -0.2227630615234375, -0.18768310546875, -0.1526031494140625, -0.117523193359375, -0.0824432373046875, -0.04736328125, -0.0122833251953125, 0.022796630859375, 0.0578765869140625, 0.09295654296875, 0.1280364990234375, 0.163116455078125, 0.1981964111328125, 0.2332763671875, 0.2683563232421875, 0.303436279296875, 0.3385162353515625, 0.37359619140625, 0.4086761474609375, 0.443756103515625, 0.4788360595703125, 0.513916015625, 0.5489959716796875, 0.584075927734375, 0.6191558837890625, 0.65423583984375, 0.6893157958984375, 0.724395751953125, 0.7594757080078125, 0.7945556640625, 0.8296356201171875, 0.864715576171875, 0.8997955322265625, 0.93487548828125, 0.9699554443359375, 1.005035400390625, 1.0401153564453125, 1.0751953125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 7.0, 27.0, 24.0, 25.0, 45.0, 88.0, 107.0, 131.0, 132.0, 126.0, 63.0, 70.0, 31.0, 33.0, 11.0, 12.0, 11.0, 9.0, 8.0, 5.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.081180095672607, -5.749165058135986, -5.417150020599365, -5.085134983062744, -4.753119468688965, -4.421104431152344, -4.089089393615723, -3.7570743560791016, -3.4250593185424805, -3.0930442810058594, -2.7610292434692383, -2.429013967514038, -2.096998929977417, -1.764983892440796, -1.4329687356948853, -1.1009535789489746, -0.7689385414123535, -0.43692344427108765, -0.10490834712982178, 0.2271067500114441, 0.55912184715271, 0.891136884689331, 1.2231520414352417, 1.5551671981811523, 1.8871822357177734, 2.2191972732543945, 2.5512123107910156, 2.883227586746216, 3.215242624282837, 3.547257661819458, 3.879272937774658, 4.211287975311279, 4.543302536010742, 4.875317573547363, 5.207332611083984, 5.5393476486206055, 5.871362686157227, 6.203377723693848, 6.535393238067627, 6.867408275604248, 7.199423313140869, 7.53143835067749, 7.863453388214111, 8.19546890258789, 8.527483940124512, 8.859498977661133, 9.191514015197754, 9.523529052734375, 9.855544090270996, 10.187559127807617, 10.519574165344238, 10.85158920288086, 11.18360424041748, 11.515619277954102, 11.847634315490723, 12.179649353027344, 12.511665344238281, 12.843680381774902, 13.175695419311523, 13.507710456848145, 13.839725494384766, 14.171740531921387, 14.503755569458008, 14.835771560668945, 15.16778564453125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 5.0, 7.0, 5.0, 10.0, 17.0, 20.0, 12.0, 23.0, 31.0, 26.0, 28.0, 32.0, 45.0, 38.0, 32.0, 48.0, 36.0, 47.0, 46.0, 45.0, 35.0, 53.0, 50.0, 37.0, 43.0, 32.0, 23.0, 27.0, 29.0, 22.0, 20.0, 10.0, 9.0, 10.0, 11.0, 8.0, 6.0, 3.0, 5.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.469351768493652, -6.236355304718018, -6.003358840942383, -5.77036190032959, -5.537365436553955, -5.30436897277832, -5.0713725090026855, -4.838376045227051, -4.605379581451416, -4.372383117675781, -4.1393866539001465, -3.9063899517059326, -3.673393487930298, -3.440396785736084, -3.207400321960449, -2.9744038581848145, -2.7414071559906006, -2.508410692214966, -2.275413990020752, -2.042417526245117, -1.8094210624694824, -1.576424479484558, -1.3434278964996338, -1.110431432723999, -0.8774348497390747, -0.6444383263587952, -0.41144177317619324, -0.1784452199935913, 0.05455130338668823, 0.2875478267669678, 0.5205444097518921, 0.7535408735275269, 0.9865374565124512, 1.2195340394973755, 1.4525305032730103, 1.6855270862579346, 1.9185235500335693, 2.151520252227783, 2.384516716003418, 2.6175131797790527, 2.8505096435546875, 3.0835061073303223, 3.316502809524536, 3.549499273300171, 3.7824957370758057, 4.0154924392700195, 4.248488903045654, 4.481485366821289, 4.714482307434082, 4.947478771209717, 5.180475234985352, 5.4134721755981445, 5.646468639373779, 5.879465103149414, 6.112461566925049, 6.345458030700684, 6.578454494476318, 6.811450958251953, 7.044447422027588, 7.277443885803223, 7.510440826416016, 7.74343729019165, 7.976433753967285, 8.209430694580078, 8.442426681518555]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 10.0, 9.0, 19.0, 33.0, 33.0, 58.0, 83.0, 124.0, 181.0, 309.0, 473.0, 708.0, 1171.0, 1902.0, 3329.0, 6195.0, 14455.0, 52504.0, 558253.0, 343853.0, 39400.0, 12318.0, 5533.0, 2954.0, 1719.0, 1047.0, 626.0, 442.0, 275.0, 188.0, 123.0, 70.0, 42.0, 38.0, 27.0, 9.0, 12.0, 8.0, 9.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-5.59375, -5.44219970703125, -5.2906494140625, -5.13909912109375, -4.987548828125, -4.83599853515625, -4.6844482421875, -4.53289794921875, -4.38134765625, -4.22979736328125, -4.0782470703125, -3.92669677734375, -3.775146484375, -3.62359619140625, -3.4720458984375, -3.32049560546875, -3.1689453125, -3.01739501953125, -2.8658447265625, -2.71429443359375, -2.562744140625, -2.41119384765625, -2.2596435546875, -2.10809326171875, -1.95654296875, -1.80499267578125, -1.6534423828125, -1.50189208984375, -1.350341796875, -1.19879150390625, -1.0472412109375, -0.89569091796875, -0.744140625, -0.59259033203125, -0.4410400390625, -0.28948974609375, -0.137939453125, 0.01361083984375, 0.1651611328125, 0.31671142578125, 0.46826171875, 0.61981201171875, 0.7713623046875, 0.92291259765625, 1.074462890625, 1.22601318359375, 1.3775634765625, 1.52911376953125, 1.6806640625, 1.83221435546875, 1.9837646484375, 2.13531494140625, 2.286865234375, 2.43841552734375, 2.5899658203125, 2.74151611328125, 2.89306640625, 3.04461669921875, 3.1961669921875, 3.34771728515625, 3.499267578125, 3.65081787109375, 3.8023681640625, 3.95391845703125, 4.10546875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 5.0, 3.0, 6.0, 8.0, 11.0, 14.0, 18.0, 30.0, 47.0, 82.0, 137.0, 145.0, 147.0, 113.0, 83.0, 52.0, 19.0, 20.0, 15.0, 5.0, 7.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.426513671875, -0.4094200134277344, -0.39232635498046875, -0.3752326965332031, -0.3581390380859375, -0.3410453796386719, -0.32395172119140625, -0.3068580627441406, -0.289764404296875, -0.2726707458496094, -0.25557708740234375, -0.23848342895507812, -0.2213897705078125, -0.20429611206054688, -0.18720245361328125, -0.17010879516601562, -0.15301513671875, -0.13592147827148438, -0.11882781982421875, -0.10173416137695312, -0.0846405029296875, -0.06754684448242188, -0.05045318603515625, -0.033359527587890625, -0.016265869140625, 0.000827789306640625, 0.01792144775390625, 0.035015106201171875, 0.0521087646484375, 0.06920242309570312, 0.08629608154296875, 0.10338973999023438, 0.1204833984375, 0.13757705688476562, 0.15467071533203125, 0.17176437377929688, 0.1888580322265625, 0.20595169067382812, 0.22304534912109375, 0.24013900756835938, 0.257232666015625, 0.2743263244628906, 0.29141998291015625, 0.3085136413574219, 0.3256072998046875, 0.3427009582519531, 0.35979461669921875, 0.3768882751464844, 0.39398193359375, 0.4110755920410156, 0.42816925048828125, 0.4452629089355469, 0.4623565673828125, 0.4794502258300781, 0.49654388427734375, 0.5136375427246094, 0.530731201171875, 0.5478248596191406, 0.5649185180664062, 0.5820121765136719, 0.5991058349609375, 0.6161994934082031, 0.6332931518554688, 0.6503868103027344, 0.66748046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 11.0, 15.0, 15.0, 31.0, 42.0, 76.0, 154.0, 247.0, 712.0, 1681.0, 5032.0, 27106.0, 706003.0, 283485.0, 17603.0, 3872.0, 1382.0, 519.0, 217.0, 131.0, 74.0, 41.0, 20.0, 23.0, 14.0, 4.0, 6.0, 9.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.1484375, -8.8204345703125, -8.492431640625, -8.1644287109375, -7.83642578125, -7.5084228515625, -7.180419921875, -6.8524169921875, -6.5244140625, -6.1964111328125, -5.868408203125, -5.5404052734375, -5.21240234375, -4.8843994140625, -4.556396484375, -4.2283935546875, -3.900390625, -3.5723876953125, -3.244384765625, -2.9163818359375, -2.58837890625, -2.2603759765625, -1.932373046875, -1.6043701171875, -1.2763671875, -0.9483642578125, -0.620361328125, -0.2923583984375, 0.03564453125, 0.3636474609375, 0.691650390625, 1.0196533203125, 1.34765625, 1.6756591796875, 2.003662109375, 2.3316650390625, 2.65966796875, 2.9876708984375, 3.315673828125, 3.6436767578125, 3.9716796875, 4.2996826171875, 4.627685546875, 4.9556884765625, 5.28369140625, 5.6116943359375, 5.939697265625, 6.2677001953125, 6.595703125, 6.9237060546875, 7.251708984375, 7.5797119140625, 7.90771484375, 8.2357177734375, 8.563720703125, 8.8917236328125, 9.2197265625, 9.5477294921875, 9.875732421875, 10.2037353515625, 10.53173828125, 10.8597412109375, 11.187744140625, 11.5157470703125, 11.84375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 6.0, 16.0, 17.0, 16.0, 16.0, 21.0, 19.0, 26.0, 22.0, 34.0, 31.0, 40.0, 51.0, 41.0, 37.0, 51.0, 50.0, 35.0, 56.0, 46.0, 33.0, 43.0, 46.0, 23.0, 31.0, 32.0, 24.0, 30.0, 12.0, 17.0, 22.0, 17.0, 8.0, 13.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.99609375, -2.90802001953125, -2.8199462890625, -2.73187255859375, -2.643798828125, -2.55572509765625, -2.4676513671875, -2.37957763671875, -2.29150390625, -2.20343017578125, -2.1153564453125, -2.02728271484375, -1.939208984375, -1.85113525390625, -1.7630615234375, -1.67498779296875, -1.5869140625, -1.49884033203125, -1.4107666015625, -1.32269287109375, -1.234619140625, -1.14654541015625, -1.0584716796875, -0.97039794921875, -0.88232421875, -0.79425048828125, -0.7061767578125, -0.61810302734375, -0.530029296875, -0.44195556640625, -0.3538818359375, -0.26580810546875, -0.177734375, -0.08966064453125, -0.0015869140625, 0.08648681640625, 0.174560546875, 0.26263427734375, 0.3507080078125, 0.43878173828125, 0.52685546875, 0.61492919921875, 0.7030029296875, 0.79107666015625, 0.879150390625, 0.96722412109375, 1.0552978515625, 1.14337158203125, 1.2314453125, 1.31951904296875, 1.4075927734375, 1.49566650390625, 1.583740234375, 1.67181396484375, 1.7598876953125, 1.84796142578125, 1.93603515625, 2.02410888671875, 2.1121826171875, 2.20025634765625, 2.288330078125, 2.37640380859375, 2.4644775390625, 2.55255126953125, 2.640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 11.0, 8.0, 13.0, 15.0, 19.0, 29.0, 48.0, 67.0, 119.0, 158.0, 279.0, 490.0, 864.0, 1983.0, 5348.0, 22143.0, 724802.0, 268868.0, 15465.0, 4278.0, 1651.0, 782.0, 396.0, 231.0, 151.0, 99.0, 73.0, 46.0, 26.0, 23.0, 16.0, 6.0, 11.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.2265625, -12.8475341796875, -12.468505859375, -12.0894775390625, -11.71044921875, -11.3314208984375, -10.952392578125, -10.5733642578125, -10.1943359375, -9.8153076171875, -9.436279296875, -9.0572509765625, -8.67822265625, -8.2991943359375, -7.920166015625, -7.5411376953125, -7.162109375, -6.7830810546875, -6.404052734375, -6.0250244140625, -5.64599609375, -5.2669677734375, -4.887939453125, -4.5089111328125, -4.1298828125, -3.7508544921875, -3.371826171875, -2.9927978515625, -2.61376953125, -2.2347412109375, -1.855712890625, -1.4766845703125, -1.09765625, -0.7186279296875, -0.339599609375, 0.0394287109375, 0.41845703125, 0.7974853515625, 1.176513671875, 1.5555419921875, 1.9345703125, 2.3135986328125, 2.692626953125, 3.0716552734375, 3.45068359375, 3.8297119140625, 4.208740234375, 4.5877685546875, 4.966796875, 5.3458251953125, 5.724853515625, 6.1038818359375, 6.48291015625, 6.8619384765625, 7.240966796875, 7.6199951171875, 7.9990234375, 8.3780517578125, 8.757080078125, 9.1361083984375, 9.51513671875, 9.8941650390625, 10.273193359375, 10.6522216796875, 11.03125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 3.0, 5.0, 5.0, 8.0, 7.0, 20.0, 12.0, 26.0, 28.0, 27.0, 37.0, 54.0, 81.0, 64.0, 88.0, 84.0, 86.0, 79.0, 65.0, 47.0, 35.0, 30.0, 21.0, 23.0, 11.0, 13.0, 7.0, 10.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012683868408203125, -0.00012251362204551697, -0.00011818856000900269, -0.0001138634979724884, -0.00010953843593597412, -0.00010521337389945984, -0.00010088831186294556, -9.656324982643127e-05, -9.223818778991699e-05, -8.791312575340271e-05, -8.358806371688843e-05, -7.926300168037415e-05, -7.493793964385986e-05, -7.061287760734558e-05, -6.62878155708313e-05, -6.196275353431702e-05, -5.7637691497802734e-05, -5.331262946128845e-05, -4.898756742477417e-05, -4.466250538825989e-05, -4.0337443351745605e-05, -3.601238131523132e-05, -3.168731927871704e-05, -2.736225724220276e-05, -2.3037195205688477e-05, -1.8712133169174194e-05, -1.4387071132659912e-05, -1.006200909614563e-05, -5.736947059631348e-06, -1.4118850231170654e-06, 2.913177013397217e-06, 7.238239049911499e-06, 1.1563301086425781e-05, 1.5888363122940063e-05, 2.0213425159454346e-05, 2.4538487195968628e-05, 2.886354923248291e-05, 3.318861126899719e-05, 3.7513673305511475e-05, 4.183873534202576e-05, 4.616379737854004e-05, 5.048885941505432e-05, 5.4813921451568604e-05, 5.9138983488082886e-05, 6.346404552459717e-05, 6.778910756111145e-05, 7.211416959762573e-05, 7.643923163414001e-05, 8.07642936706543e-05, 8.508935570716858e-05, 8.941441774368286e-05, 9.373947978019714e-05, 9.806454181671143e-05, 0.00010238960385322571, 0.00010671466588973999, 0.00011103972792625427, 0.00011536478996276855, 0.00011968985199928284, 0.00012401491403579712, 0.0001283399760723114, 0.00013266503810882568, 0.00013699010014533997, 0.00014131516218185425, 0.00014564022421836853, 0.0001499652862548828]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 6.0, 9.0, 8.0, 11.0, 12.0, 11.0, 26.0, 31.0, 39.0, 58.0, 74.0, 100.0, 135.0, 202.0, 260.0, 390.0, 611.0, 948.0, 1710.0, 3138.0, 6710.0, 17715.0, 72789.0, 691898.0, 200391.0, 30966.0, 10058.0, 4307.0, 2201.0, 1264.0, 767.0, 540.0, 332.0, 210.0, 141.0, 117.0, 78.0, 71.0, 50.0, 37.0, 31.0, 31.0, 13.0, 11.0, 8.0, 8.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-7.7265625, -7.4830322265625, -7.239501953125, -6.9959716796875, -6.75244140625, -6.5089111328125, -6.265380859375, -6.0218505859375, -5.7783203125, -5.5347900390625, -5.291259765625, -5.0477294921875, -4.80419921875, -4.5606689453125, -4.317138671875, -4.0736083984375, -3.830078125, -3.5865478515625, -3.343017578125, -3.0994873046875, -2.85595703125, -2.6124267578125, -2.368896484375, -2.1253662109375, -1.8818359375, -1.6383056640625, -1.394775390625, -1.1512451171875, -0.90771484375, -0.6641845703125, -0.420654296875, -0.1771240234375, 0.06640625, 0.3099365234375, 0.553466796875, 0.7969970703125, 1.04052734375, 1.2840576171875, 1.527587890625, 1.7711181640625, 2.0146484375, 2.2581787109375, 2.501708984375, 2.7452392578125, 2.98876953125, 3.2322998046875, 3.475830078125, 3.7193603515625, 3.962890625, 4.2064208984375, 4.449951171875, 4.6934814453125, 4.93701171875, 5.1805419921875, 5.424072265625, 5.6676025390625, 5.9111328125, 6.1546630859375, 6.398193359375, 6.6417236328125, 6.88525390625, 7.1287841796875, 7.372314453125, 7.6158447265625, 7.859375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 10.0, 10.0, 18.0, 12.0, 22.0, 20.0, 45.0, 40.0, 64.0, 67.0, 83.0, 85.0, 91.0, 86.0, 63.0, 77.0, 46.0, 32.0, 23.0, 17.0, 19.0, 11.0, 6.0, 4.0, 8.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.76953125, -4.60400390625, -4.4384765625, -4.27294921875, -4.107421875, -3.94189453125, -3.7763671875, -3.61083984375, -3.4453125, -3.27978515625, -3.1142578125, -2.94873046875, -2.783203125, -2.61767578125, -2.4521484375, -2.28662109375, -2.12109375, -1.95556640625, -1.7900390625, -1.62451171875, -1.458984375, -1.29345703125, -1.1279296875, -0.96240234375, -0.796875, -0.63134765625, -0.4658203125, -0.30029296875, -0.134765625, 0.03076171875, 0.1962890625, 0.36181640625, 0.52734375, 0.69287109375, 0.8583984375, 1.02392578125, 1.189453125, 1.35498046875, 1.5205078125, 1.68603515625, 1.8515625, 2.01708984375, 2.1826171875, 2.34814453125, 2.513671875, 2.67919921875, 2.8447265625, 3.01025390625, 3.17578125, 3.34130859375, 3.5068359375, 3.67236328125, 3.837890625, 4.00341796875, 4.1689453125, 4.33447265625, 4.5, 4.66552734375, 4.8310546875, 4.99658203125, 5.162109375, 5.32763671875, 5.4931640625, 5.65869140625, 5.82421875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 12.0, 23.0, 56.0, 154.0, 309.0, 239.0, 87.0, 44.0, 22.0, 13.0, 11.0, 6.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.02613830566406, -41.12462615966797, -39.223114013671875, -37.321598052978516, -35.42008590698242, -33.51857376098633, -31.6170597076416, -29.715545654296875, -27.81403350830078, -25.912521362304688, -24.01100730895996, -22.109493255615234, -20.20798110961914, -18.306468963623047, -16.40495491027832, -14.50344181060791, -12.6019287109375, -10.70041561126709, -8.79890251159668, -6.8973894119262695, -4.995876312255859, -3.094363212585449, -1.192850112915039, 0.7086629867553711, 2.6101760864257812, 4.511689186096191, 6.413202285766602, 8.314715385437012, 10.216228485107422, 12.117741584777832, 14.019254684448242, 15.920767784118652, 17.822280883789062, 19.723793029785156, 21.625307083129883, 23.52682113647461, 25.428333282470703, 27.329845428466797, 29.231359481811523, 31.13287353515625, 33.034385681152344, 34.93589782714844, 36.83740997314453, 38.73892593383789, 40.640438079833984, 42.54195022583008, 44.44346618652344, 46.34497833251953, 48.246490478515625, 50.14800262451172, 52.04951477050781, 53.95103073120117, 55.852542877197266, 57.75405502319336, 59.65557098388672, 61.55708312988281, 63.458595275878906, 65.360107421875, 67.2616195678711, 69.16313171386719, 71.06465148925781, 72.9661636352539, 74.86767578125, 76.7691879272461, 78.67070007324219]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 6.0, 0.0, 2.0, 4.0, 7.0, 10.0, 10.0, 17.0, 23.0, 32.0, 39.0, 63.0, 94.0, 90.0, 97.0, 105.0, 93.0, 85.0, 65.0, 46.0, 36.0, 20.0, 12.0, 7.0, 8.0, 10.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.54393005371094, -46.146568298339844, -44.74920654296875, -43.351844787597656, -41.95448303222656, -40.5571174621582, -39.15975570678711, -37.762393951416016, -36.36503219604492, -34.96767044067383, -33.570308685302734, -32.17294692993164, -30.775583267211914, -29.37822151184082, -27.980857849121094, -26.58349609375, -25.186134338378906, -23.788772583007812, -22.39141082763672, -20.994047164916992, -19.5966854095459, -18.199323654174805, -16.801959991455078, -15.404598236083984, -14.00723648071289, -12.609874725341797, -11.212512016296387, -9.815149307250977, -8.417787551879883, -7.020425319671631, -5.623063087463379, -4.225700378417969, -2.828338623046875, -1.430976390838623, -0.033614158630371094, 1.3637480735778809, 2.761110305786133, 4.158472537994385, 5.555834770202637, 6.953197479248047, 8.35055923461914, 9.747920989990234, 11.145283699035645, 12.542646408081055, 13.940008163452148, 15.337369918823242, 16.73473358154297, 18.132095336914062, 19.529457092285156, 20.92681884765625, 22.324180603027344, 23.72154426574707, 25.118906021118164, 26.516267776489258, 27.913631439208984, 29.310993194580078, 30.708354949951172, 32.105716705322266, 33.50307846069336, 34.90044021606445, 36.29780578613281, 37.695167541503906, 39.092529296875, 40.489891052246094, 41.88725280761719]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 13.0, 22.0, 21.0, 52.0, 71.0, 179.0, 303.0, 653.0, 1554.0, 4444.0, 18437.0, 237103.0, 3877661.0, 41499.0, 7670.0, 2478.0, 978.0, 457.0, 248.0, 158.0, 94.0, 65.0, 32.0, 28.0, 19.0, 15.0, 13.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.390625, -13.820068359375, -13.24951171875, -12.678955078125, -12.1083984375, -11.537841796875, -10.96728515625, -10.396728515625, -9.826171875, -9.255615234375, -8.68505859375, -8.114501953125, -7.5439453125, -6.973388671875, -6.40283203125, -5.832275390625, -5.26171875, -4.691162109375, -4.12060546875, -3.550048828125, -2.9794921875, -2.408935546875, -1.83837890625, -1.267822265625, -0.697265625, -0.126708984375, 0.44384765625, 1.014404296875, 1.5849609375, 2.155517578125, 2.72607421875, 3.296630859375, 3.8671875, 4.437744140625, 5.00830078125, 5.578857421875, 6.1494140625, 6.719970703125, 7.29052734375, 7.861083984375, 8.431640625, 9.002197265625, 9.57275390625, 10.143310546875, 10.7138671875, 11.284423828125, 11.85498046875, 12.425537109375, 12.99609375, 13.566650390625, 14.13720703125, 14.707763671875, 15.2783203125, 15.848876953125, 16.41943359375, 16.989990234375, 17.560546875, 18.131103515625, 18.70166015625, 19.272216796875, 19.8427734375, 20.413330078125, 20.98388671875, 21.554443359375, 22.125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 11.0, 11.0, 12.0, 12.0, 17.0, 29.0, 48.0, 79.0, 99.0, 126.0, 128.0, 120.0, 87.0, 57.0, 50.0, 43.0, 14.0, 9.0, 15.0, 7.0, 6.0, 2.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5, -0.48174285888671875, -0.4634857177734375, -0.44522857666015625, -0.426971435546875, -0.40871429443359375, -0.3904571533203125, -0.37220001220703125, -0.35394287109375, -0.33568572998046875, -0.3174285888671875, -0.29917144775390625, -0.280914306640625, -0.26265716552734375, -0.2444000244140625, -0.22614288330078125, -0.2078857421875, -0.18962860107421875, -0.1713714599609375, -0.15311431884765625, -0.134857177734375, -0.11660003662109375, -0.0983428955078125, -0.08008575439453125, -0.06182861328125, -0.04357147216796875, -0.0253143310546875, -0.00705718994140625, 0.011199951171875, 0.02945709228515625, 0.0477142333984375, 0.06597137451171875, 0.084228515625, 0.10248565673828125, 0.1207427978515625, 0.13899993896484375, 0.157257080078125, 0.17551422119140625, 0.1937713623046875, 0.21202850341796875, 0.23028564453125, 0.24854278564453125, 0.2667999267578125, 0.28505706787109375, 0.303314208984375, 0.32157135009765625, 0.3398284912109375, 0.35808563232421875, 0.3763427734375, 0.39459991455078125, 0.4128570556640625, 0.43111419677734375, 0.449371337890625, 0.46762847900390625, 0.4858856201171875, 0.5041427612304688, 0.52239990234375, 0.5406570434570312, 0.5589141845703125, 0.5771713256835938, 0.595428466796875, 0.6136856079101562, 0.6319427490234375, 0.6501998901367188, 0.66845703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 2.0, 9.0, 8.0, 12.0, 26.0, 44.0, 70.0, 107.0, 182.0, 407.0, 1088.0, 4011.0, 23545.0, 1291920.0, 2841626.0, 25089.0, 4118.0, 1135.0, 396.0, 206.0, 107.0, 60.0, 35.0, 16.0, 16.0, 14.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.640625, -18.9638671875, -18.287109375, -17.6103515625, -16.93359375, -16.2568359375, -15.580078125, -14.9033203125, -14.2265625, -13.5498046875, -12.873046875, -12.1962890625, -11.51953125, -10.8427734375, -10.166015625, -9.4892578125, -8.8125, -8.1357421875, -7.458984375, -6.7822265625, -6.10546875, -5.4287109375, -4.751953125, -4.0751953125, -3.3984375, -2.7216796875, -2.044921875, -1.3681640625, -0.69140625, -0.0146484375, 0.662109375, 1.3388671875, 2.015625, 2.6923828125, 3.369140625, 4.0458984375, 4.72265625, 5.3994140625, 6.076171875, 6.7529296875, 7.4296875, 8.1064453125, 8.783203125, 9.4599609375, 10.13671875, 10.8134765625, 11.490234375, 12.1669921875, 12.84375, 13.5205078125, 14.197265625, 14.8740234375, 15.55078125, 16.2275390625, 16.904296875, 17.5810546875, 18.2578125, 18.9345703125, 19.611328125, 20.2880859375, 20.96484375, 21.6416015625, 22.318359375, 22.9951171875, 23.671875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 10.0, 9.0, 14.0, 16.0, 22.0, 40.0, 45.0, 68.0, 115.0, 163.0, 379.0, 1818.0, 815.0, 220.0, 122.0, 61.0, 38.0, 25.0, 24.0, 21.0, 10.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7666015625, -1.7222442626953125, -1.677886962890625, -1.6335296630859375, -1.58917236328125, -1.5448150634765625, -1.500457763671875, -1.4561004638671875, -1.4117431640625, -1.3673858642578125, -1.323028564453125, -1.2786712646484375, -1.23431396484375, -1.1899566650390625, -1.145599365234375, -1.1012420654296875, -1.056884765625, -1.0125274658203125, -0.968170166015625, -0.9238128662109375, -0.87945556640625, -0.8350982666015625, -0.790740966796875, -0.7463836669921875, -0.7020263671875, -0.6576690673828125, -0.613311767578125, -0.5689544677734375, -0.52459716796875, -0.4802398681640625, -0.435882568359375, -0.3915252685546875, -0.34716796875, -0.3028106689453125, -0.258453369140625, -0.2140960693359375, -0.16973876953125, -0.1253814697265625, -0.081024169921875, -0.0366668701171875, 0.0076904296875, 0.0520477294921875, 0.096405029296875, 0.1407623291015625, 0.18511962890625, 0.2294769287109375, 0.273834228515625, 0.3181915283203125, 0.362548828125, 0.4069061279296875, 0.451263427734375, 0.4956207275390625, 0.53997802734375, 0.5843353271484375, 0.628692626953125, 0.6730499267578125, 0.7174072265625, 0.7617645263671875, 0.806121826171875, 0.8504791259765625, 0.89483642578125, 0.9391937255859375, 0.983551025390625, 1.0279083251953125, 1.072265625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 11.0, 13.0, 26.0, 49.0, 86.0, 221.0, 337.0, 163.0, 43.0, 24.0, 15.0, 4.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-32.103084564208984, -31.38210678100586, -30.661128997802734, -29.940153121948242, -29.219175338745117, -28.498197555541992, -27.7772216796875, -27.056243896484375, -26.33526611328125, -25.614288330078125, -24.893310546875, -24.172334671020508, -23.451356887817383, -22.730379104614258, -22.009403228759766, -21.28842544555664, -20.567447662353516, -19.84646987915039, -19.125492095947266, -18.404516220092773, -17.68353843688965, -16.962560653686523, -16.24158477783203, -15.520606994628906, -14.799629211425781, -14.078651428222656, -13.357674598693848, -12.636697769165039, -11.915719985961914, -11.194742202758789, -10.47376537322998, -9.752788543701172, -9.03180980682373, -8.310832977294922, -7.589855194091797, -6.86887788772583, -6.147900581359863, -5.4269232749938965, -4.70594596862793, -3.984968662261963, -3.263991355895996, -2.5430140495300293, -1.8220367431640625, -1.1010594367980957, -0.3800821304321289, 0.3408951759338379, 1.0618724822998047, 1.7828497886657715, 2.5038270950317383, 3.224804401397705, 3.945781707763672, 4.666759014129639, 5.3877363204956055, 6.108713626861572, 6.829690933227539, 7.550668239593506, 8.271645545959473, 8.992622375488281, 9.713600158691406, 10.434577941894531, 11.15555477142334, 11.876531600952148, 12.597509384155273, 13.318487167358398, 14.039463996887207]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 7.0, 10.0, 14.0, 14.0, 27.0, 29.0, 31.0, 36.0, 42.0, 48.0, 53.0, 77.0, 68.0, 64.0, 69.0, 72.0, 50.0, 56.0, 43.0, 28.0, 24.0, 24.0, 21.0, 22.0, 15.0, 11.0, 8.0, 9.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.639950752258301, -6.372225284576416, -6.104499816894531, -5.836773872375488, -5.5690484046936035, -5.301322937011719, -5.033596992492676, -4.765871524810791, -4.498146057128906, -4.2304205894470215, -3.9626948833465576, -3.6949691772460938, -3.427243709564209, -3.159518241882324, -2.8917925357818604, -2.6240668296813965, -2.3563413619995117, -2.088615894317627, -1.820890188217163, -1.5531646013259888, -1.2854390144348145, -1.0177134275436401, -0.7499878406524658, -0.4822622537612915, -0.2145366668701172, 0.05318892002105713, 0.32091450691223145, 0.5886400938034058, 0.8563656806945801, 1.1240912675857544, 1.3918168544769287, 1.659542441368103, 1.927267074584961, 2.1949925422668457, 2.4627182483673096, 2.7304439544677734, 2.998169422149658, 3.265894889831543, 3.533620595932007, 3.8013463020324707, 4.0690717697143555, 4.33679723739624, 4.604522705078125, 4.872248649597168, 5.139974117279053, 5.4076995849609375, 5.6754255294799805, 5.943150997161865, 6.21087646484375, 6.478601932525635, 6.7463274002075195, 7.0140533447265625, 7.281778812408447, 7.549504280090332, 7.817230224609375, 8.084955215454102, 8.352681159973145, 8.620407104492188, 8.888132095336914, 9.155858039855957, 9.423583984375, 9.691308975219727, 9.95903491973877, 10.226759910583496, 10.494485855102539]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 14.0, 11.0, 19.0, 39.0, 42.0, 63.0, 78.0, 93.0, 150.0, 204.0, 353.0, 488.0, 829.0, 1284.0, 2147.0, 3936.0, 7675.0, 18097.0, 57730.0, 458067.0, 408699.0, 53940.0, 17657.0, 7581.0, 3639.0, 2112.0, 1266.0, 794.0, 484.0, 335.0, 224.0, 155.0, 102.0, 59.0, 47.0, 36.0, 28.0, 30.0, 14.0, 8.0, 10.0, 3.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.9296875, -9.637451171875, -9.34521484375, -9.052978515625, -8.7607421875, -8.468505859375, -8.17626953125, -7.884033203125, -7.591796875, -7.299560546875, -7.00732421875, -6.715087890625, -6.4228515625, -6.130615234375, -5.83837890625, -5.546142578125, -5.25390625, -4.961669921875, -4.66943359375, -4.377197265625, -4.0849609375, -3.792724609375, -3.50048828125, -3.208251953125, -2.916015625, -2.623779296875, -2.33154296875, -2.039306640625, -1.7470703125, -1.454833984375, -1.16259765625, -0.870361328125, -0.578125, -0.285888671875, 0.00634765625, 0.298583984375, 0.5908203125, 0.883056640625, 1.17529296875, 1.467529296875, 1.759765625, 2.052001953125, 2.34423828125, 2.636474609375, 2.9287109375, 3.220947265625, 3.51318359375, 3.805419921875, 4.09765625, 4.389892578125, 4.68212890625, 4.974365234375, 5.2666015625, 5.558837890625, 5.85107421875, 6.143310546875, 6.435546875, 6.727783203125, 7.02001953125, 7.312255859375, 7.6044921875, 7.896728515625, 8.18896484375, 8.481201171875, 8.7734375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 2.0, 4.0, 4.0, 3.0, 7.0, 10.0, 12.0, 19.0, 21.0, 29.0, 34.0, 28.0, 45.0, 65.0, 55.0, 67.0, 72.0, 65.0, 79.0, 51.0, 50.0, 48.0, 49.0, 34.0, 23.0, 23.0, 15.0, 15.0, 13.0, 9.0, 8.0, 5.0, 11.0, 6.0, 3.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399169921875, -0.3845710754394531, -0.36997222900390625, -0.3553733825683594, -0.3407745361328125, -0.3261756896972656, -0.31157684326171875, -0.2969779968261719, -0.282379150390625, -0.2677803039550781, -0.25318145751953125, -0.23858261108398438, -0.2239837646484375, -0.20938491821289062, -0.19478607177734375, -0.18018722534179688, -0.16558837890625, -0.15098953247070312, -0.13639068603515625, -0.12179183959960938, -0.1071929931640625, -0.09259414672851562, -0.07799530029296875, -0.06339645385742188, -0.048797607421875, -0.034198760986328125, -0.01959991455078125, -0.005001068115234375, 0.0095977783203125, 0.024196624755859375, 0.03879547119140625, 0.053394317626953125, 0.0679931640625, 0.08259201049804688, 0.09719085693359375, 0.11178970336914062, 0.1263885498046875, 0.14098739624023438, 0.15558624267578125, 0.17018508911132812, 0.184783935546875, 0.19938278198242188, 0.21398162841796875, 0.22858047485351562, 0.2431793212890625, 0.2577781677246094, 0.27237701416015625, 0.2869758605957031, 0.30157470703125, 0.3161735534667969, 0.33077239990234375, 0.3453712463378906, 0.3599700927734375, 0.3745689392089844, 0.38916778564453125, 0.4037666320800781, 0.418365478515625, 0.4329643249511719, 0.44756317138671875, 0.4621620178222656, 0.4767608642578125, 0.4913597106933594, 0.5059585571289062, 0.5205574035644531, 0.53515625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 2.0, 10.0, 5.0, 8.0, 9.0, 20.0, 35.0, 136.0, 801.0, 14260.0, 1006353.0, 25636.0, 971.0, 147.0, 29.0, 18.0, 9.0, 6.0, 5.0, 6.0, 7.0, 6.0, 6.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-32.6875, -31.74169921875, -30.7958984375, -29.85009765625, -28.904296875, -27.95849609375, -27.0126953125, -26.06689453125, -25.12109375, -24.17529296875, -23.2294921875, -22.28369140625, -21.337890625, -20.39208984375, -19.4462890625, -18.50048828125, -17.5546875, -16.60888671875, -15.6630859375, -14.71728515625, -13.771484375, -12.82568359375, -11.8798828125, -10.93408203125, -9.98828125, -9.04248046875, -8.0966796875, -7.15087890625, -6.205078125, -5.25927734375, -4.3134765625, -3.36767578125, -2.421875, -1.47607421875, -0.5302734375, 0.41552734375, 1.361328125, 2.30712890625, 3.2529296875, 4.19873046875, 5.14453125, 6.09033203125, 7.0361328125, 7.98193359375, 8.927734375, 9.87353515625, 10.8193359375, 11.76513671875, 12.7109375, 13.65673828125, 14.6025390625, 15.54833984375, 16.494140625, 17.43994140625, 18.3857421875, 19.33154296875, 20.27734375, 21.22314453125, 22.1689453125, 23.11474609375, 24.060546875, 25.00634765625, 25.9521484375, 26.89794921875, 27.84375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 6.0, 4.0, 12.0, 10.0, 12.0, 9.0, 18.0, 22.0, 20.0, 24.0, 23.0, 32.0, 27.0, 37.0, 36.0, 33.0, 35.0, 47.0, 47.0, 42.0, 45.0, 33.0, 45.0, 47.0, 37.0, 35.0, 39.0, 41.0, 30.0, 21.0, 20.0, 15.0, 18.0, 14.0, 18.0, 10.0, 8.0, 9.0, 6.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.421875, -2.3507080078125, -2.279541015625, -2.2083740234375, -2.13720703125, -2.0660400390625, -1.994873046875, -1.9237060546875, -1.8525390625, -1.7813720703125, -1.710205078125, -1.6390380859375, -1.56787109375, -1.4967041015625, -1.425537109375, -1.3543701171875, -1.283203125, -1.2120361328125, -1.140869140625, -1.0697021484375, -0.99853515625, -0.9273681640625, -0.856201171875, -0.7850341796875, -0.7138671875, -0.6427001953125, -0.571533203125, -0.5003662109375, -0.42919921875, -0.3580322265625, -0.286865234375, -0.2156982421875, -0.14453125, -0.0733642578125, -0.002197265625, 0.0689697265625, 0.14013671875, 0.2113037109375, 0.282470703125, 0.3536376953125, 0.4248046875, 0.4959716796875, 0.567138671875, 0.6383056640625, 0.70947265625, 0.7806396484375, 0.851806640625, 0.9229736328125, 0.994140625, 1.0653076171875, 1.136474609375, 1.2076416015625, 1.27880859375, 1.3499755859375, 1.421142578125, 1.4923095703125, 1.5634765625, 1.6346435546875, 1.705810546875, 1.7769775390625, 1.84814453125, 1.9193115234375, 1.990478515625, 2.0616455078125, 2.1328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 5.0, 3.0, 8.0, 4.0, 12.0, 16.0, 23.0, 52.0, 148.0, 1123.0, 139310.0, 905545.0, 1923.0, 219.0, 53.0, 20.0, 11.0, 19.0, 12.0, 5.0, 2.0, 6.0, 6.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.5625, -50.1728515625, -48.783203125, -47.3935546875, -46.00390625, -44.6142578125, -43.224609375, -41.8349609375, -40.4453125, -39.0556640625, -37.666015625, -36.2763671875, -34.88671875, -33.4970703125, -32.107421875, -30.7177734375, -29.328125, -27.9384765625, -26.548828125, -25.1591796875, -23.76953125, -22.3798828125, -20.990234375, -19.6005859375, -18.2109375, -16.8212890625, -15.431640625, -14.0419921875, -12.65234375, -11.2626953125, -9.873046875, -8.4833984375, -7.09375, -5.7041015625, -4.314453125, -2.9248046875, -1.53515625, -0.1455078125, 1.244140625, 2.6337890625, 4.0234375, 5.4130859375, 6.802734375, 8.1923828125, 9.58203125, 10.9716796875, 12.361328125, 13.7509765625, 15.140625, 16.5302734375, 17.919921875, 19.3095703125, 20.69921875, 22.0888671875, 23.478515625, 24.8681640625, 26.2578125, 27.6474609375, 29.037109375, 30.4267578125, 31.81640625, 33.2060546875, 34.595703125, 35.9853515625, 37.375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 10.0, 11.0, 7.0, 24.0, 26.0, 32.0, 29.0, 51.0, 70.0, 80.0, 87.0, 83.0, 96.0, 74.0, 52.0, 52.0, 35.0, 35.0, 26.0, 20.0, 15.0, 6.0, 12.0, 7.0, 8.0, 2.0, 11.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025343894958496094, -0.00024391338229179382, -0.0002343878149986267, -0.0002248622477054596, -0.00021533668041229248, -0.00020581111311912537, -0.00019628554582595825, -0.00018675997853279114, -0.00017723441123962402, -0.0001677088439464569, -0.0001581832766532898, -0.00014865770936012268, -0.00013913214206695557, -0.00012960657477378845, -0.00012008100748062134, -0.00011055544018745422, -0.00010102987289428711, -9.150430560112e-05, -8.197873830795288e-05, -7.245317101478577e-05, -6.292760372161865e-05, -5.340203642845154e-05, -4.3876469135284424e-05, -3.435090184211731e-05, -2.4825334548950195e-05, -1.529976725578308e-05, -5.774199962615967e-06, 3.7513673305511475e-06, 1.3276934623718262e-05, 2.2802501916885376e-05, 3.232806921005249e-05, 4.1853636503219604e-05, 5.137920379638672e-05, 6.090477108955383e-05, 7.043033838272095e-05, 7.995590567588806e-05, 8.948147296905518e-05, 9.900704026222229e-05, 0.0001085326075553894, 0.00011805817484855652, 0.00012758374214172363, 0.00013710930943489075, 0.00014663487672805786, 0.00015616044402122498, 0.0001656860113143921, 0.0001752115786075592, 0.00018473714590072632, 0.00019426271319389343, 0.00020378828048706055, 0.00021331384778022766, 0.00022283941507339478, 0.0002323649823665619, 0.000241890549659729, 0.0002514161169528961, 0.00026094168424606323, 0.00027046725153923035, 0.00027999281883239746, 0.0002895183861255646, 0.0002990439534187317, 0.0003085695207118988, 0.0003180950880050659, 0.00032762065529823303, 0.00033714622259140015, 0.00034667178988456726, 0.0003561973571777344]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 12.0, 8.0, 17.0, 29.0, 25.0, 32.0, 50.0, 57.0, 81.0, 147.0, 182.0, 263.0, 417.0, 597.0, 1016.0, 1670.0, 2975.0, 5834.0, 14781.0, 87455.0, 815409.0, 89796.0, 14807.0, 5854.0, 2862.0, 1621.0, 949.0, 574.0, 347.0, 233.0, 153.0, 90.0, 72.0, 37.0, 22.0, 22.0, 16.0, 8.0, 11.0, 7.0, 4.0, 0.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.7734375, -15.3162841796875, -14.859130859375, -14.4019775390625, -13.94482421875, -13.4876708984375, -13.030517578125, -12.5733642578125, -12.1162109375, -11.6590576171875, -11.201904296875, -10.7447509765625, -10.28759765625, -9.8304443359375, -9.373291015625, -8.9161376953125, -8.458984375, -8.0018310546875, -7.544677734375, -7.0875244140625, -6.63037109375, -6.1732177734375, -5.716064453125, -5.2589111328125, -4.8017578125, -4.3446044921875, -3.887451171875, -3.4302978515625, -2.97314453125, -2.5159912109375, -2.058837890625, -1.6016845703125, -1.14453125, -0.6873779296875, -0.230224609375, 0.2269287109375, 0.68408203125, 1.1412353515625, 1.598388671875, 2.0555419921875, 2.5126953125, 2.9698486328125, 3.427001953125, 3.8841552734375, 4.34130859375, 4.7984619140625, 5.255615234375, 5.7127685546875, 6.169921875, 6.6270751953125, 7.084228515625, 7.5413818359375, 7.99853515625, 8.4556884765625, 8.912841796875, 9.3699951171875, 9.8271484375, 10.2843017578125, 10.741455078125, 11.1986083984375, 11.65576171875, 12.1129150390625, 12.570068359375, 13.0272216796875, 13.484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 9.0, 22.0, 29.0, 122.0, 237.0, 238.0, 151.0, 81.0, 32.0, 3.0, 7.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-12.5078125, -12.204345703125, -11.90087890625, -11.597412109375, -11.2939453125, -10.990478515625, -10.68701171875, -10.383544921875, -10.080078125, -9.776611328125, -9.47314453125, -9.169677734375, -8.8662109375, -8.562744140625, -8.25927734375, -7.955810546875, -7.65234375, -7.348876953125, -7.04541015625, -6.741943359375, -6.4384765625, -6.135009765625, -5.83154296875, -5.528076171875, -5.224609375, -4.921142578125, -4.61767578125, -4.314208984375, -4.0107421875, -3.707275390625, -3.40380859375, -3.100341796875, -2.796875, -2.493408203125, -2.18994140625, -1.886474609375, -1.5830078125, -1.279541015625, -0.97607421875, -0.672607421875, -0.369140625, -0.065673828125, 0.23779296875, 0.541259765625, 0.8447265625, 1.148193359375, 1.45166015625, 1.755126953125, 2.05859375, 2.362060546875, 2.66552734375, 2.968994140625, 3.2724609375, 3.575927734375, 3.87939453125, 4.182861328125, 4.486328125, 4.789794921875, 5.09326171875, 5.396728515625, 5.7001953125, 6.003662109375, 6.30712890625, 6.610595703125, 6.9140625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 8.0, 20.0, 45.0, 129.0, 284.0, 279.0, 122.0, 63.0, 26.0, 15.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.472925186157227, -22.416006088256836, -20.359086990356445, -18.302169799804688, -16.245250701904297, -14.18833065032959, -12.131412506103516, -10.074493408203125, -8.017574310302734, -5.960655212402344, -3.9037365913391113, -1.846817970275879, 0.21010112762451172, 2.2670202255249023, 4.323938369750977, 6.380857467651367, 8.437776565551758, 10.494695663452148, 12.551614761352539, 14.608532905578613, 16.665451049804688, 18.722370147705078, 20.77928924560547, 22.83620834350586, 24.89312744140625, 26.95004653930664, 29.00696563720703, 31.063884735107422, 33.12080383300781, 35.1777229309082, 37.234642028808594, 39.29155731201172, 41.348480224609375, 43.405399322509766, 45.462318420410156, 47.51923751831055, 49.57615661621094, 51.63307571411133, 53.68999481201172, 55.746910095214844, 57.8038330078125, 59.86075210571289, 61.91767120361328, 63.97459030151367, 66.03150939941406, 68.08842468261719, 70.14534759521484, 72.20226287841797, 74.25918579101562, 76.31610107421875, 78.3730239868164, 80.42993927001953, 82.48686218261719, 84.54377746582031, 86.60070037841797, 88.6576156616211, 90.71453094482422, 92.77144622802734, 94.828369140625, 96.88528442382812, 98.94220733642578, 100.9991226196289, 103.05604553222656, 105.11296081542969, 107.16988372802734]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 2.0, 6.0, 7.0, 13.0, 5.0, 10.0, 12.0, 17.0, 20.0, 24.0, 37.0, 22.0, 46.0, 36.0, 50.0, 45.0, 55.0, 65.0, 57.0, 60.0, 52.0, 40.0, 32.0, 43.0, 40.0, 34.0, 31.0, 20.0, 23.0, 17.0, 18.0, 10.0, 7.0, 8.0, 6.0, 6.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-23.04619789123535, -22.366579055786133, -21.68695831298828, -21.007339477539062, -20.32771873474121, -19.648099899291992, -18.96847915649414, -18.288860321044922, -17.609241485595703, -16.929622650146484, -16.250001907348633, -15.570383071899414, -14.890762329101562, -14.211143493652344, -13.531523704528809, -12.851903915405273, -12.172283172607422, -11.492663383483887, -10.813043594360352, -10.133424758911133, -9.453804016113281, -8.774185180664062, -8.094565391540527, -7.414945602416992, -6.735325813293457, -6.055706024169922, -5.376086235046387, -4.69646692276001, -4.016847133636475, -3.3372273445129395, -2.6576080322265625, -1.9779882431030273, -1.2983665466308594, -0.6187468767166138, 0.060872793197631836, 0.7404923439025879, 1.420112133026123, 2.099731922149658, 2.779351234436035, 3.4589710235595703, 4.1385908126831055, 4.818210601806641, 5.497830390930176, 6.177449703216553, 6.857069492340088, 7.536689281463623, 8.21630859375, 8.895928382873535, 9.57554817199707, 10.255167961120605, 10.93478775024414, 11.61440658569336, 12.294027328491211, 12.97364616394043, 13.653265953063965, 14.3328857421875, 15.012505531311035, 15.69212532043457, 16.37174415588379, 17.05136489868164, 17.73098373413086, 18.41060447692871, 19.09022331237793, 19.76984405517578, 20.449462890625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 4.0, 18.0, 23.0, 43.0, 104.0, 184.0, 426.0, 886.0, 2241.0, 6163.0, 23677.0, 178958.0, 3811707.0, 139871.0, 20546.0, 5591.0, 2021.0, 833.0, 396.0, 192.0, 134.0, 79.0, 51.0, 34.0, 31.0, 17.0, 16.0, 8.0, 8.0, 6.0, 8.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.321044921875, -7.78271484375, -7.244384765625, -6.7060546875, -6.167724609375, -5.62939453125, -5.091064453125, -4.552734375, -4.014404296875, -3.47607421875, -2.937744140625, -2.3994140625, -1.861083984375, -1.32275390625, -0.784423828125, -0.24609375, 0.292236328125, 0.83056640625, 1.368896484375, 1.9072265625, 2.445556640625, 2.98388671875, 3.522216796875, 4.060546875, 4.598876953125, 5.13720703125, 5.675537109375, 6.2138671875, 6.752197265625, 7.29052734375, 7.828857421875, 8.3671875, 8.905517578125, 9.44384765625, 9.982177734375, 10.5205078125, 11.058837890625, 11.59716796875, 12.135498046875, 12.673828125, 13.212158203125, 13.75048828125, 14.288818359375, 14.8271484375, 15.365478515625, 15.90380859375, 16.442138671875, 16.98046875, 17.518798828125, 18.05712890625, 18.595458984375, 19.1337890625, 19.672119140625, 20.21044921875, 20.748779296875, 21.287109375, 21.825439453125, 22.36376953125, 22.902099609375, 23.4404296875, 23.978759765625, 24.51708984375, 25.055419921875, 25.59375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 0.0, 3.0, 3.0, 12.0, 15.0, 18.0, 17.0, 21.0, 30.0, 29.0, 42.0, 55.0, 56.0, 76.0, 85.0, 66.0, 64.0, 65.0, 56.0, 52.0, 57.0, 31.0, 32.0, 25.0, 28.0, 15.0, 14.0, 7.0, 6.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.408447265625, -0.3925361633300781, -0.37662506103515625, -0.3607139587402344, -0.3448028564453125, -0.3288917541503906, -0.31298065185546875, -0.2970695495605469, -0.281158447265625, -0.2652473449707031, -0.24933624267578125, -0.23342514038085938, -0.2175140380859375, -0.20160293579101562, -0.18569183349609375, -0.16978073120117188, -0.15386962890625, -0.13795852661132812, -0.12204742431640625, -0.10613632202148438, -0.0902252197265625, -0.07431411743164062, -0.05840301513671875, -0.042491912841796875, -0.026580810546875, -0.010669708251953125, 0.00524139404296875, 0.021152496337890625, 0.0370635986328125, 0.052974700927734375, 0.06888580322265625, 0.08479690551757812, 0.1007080078125, 0.11661911010742188, 0.13253021240234375, 0.14844131469726562, 0.1643524169921875, 0.18026351928710938, 0.19617462158203125, 0.21208572387695312, 0.227996826171875, 0.24390792846679688, 0.25981903076171875, 0.2757301330566406, 0.2916412353515625, 0.3075523376464844, 0.32346343994140625, 0.3393745422363281, 0.35528564453125, 0.3711967468261719, 0.38710784912109375, 0.4030189514160156, 0.4189300537109375, 0.4348411560058594, 0.45075225830078125, 0.4666633605957031, 0.482574462890625, 0.4984855651855469, 0.5143966674804688, 0.5303077697753906, 0.5462188720703125, 0.5621299743652344, 0.5780410766601562, 0.5939521789550781, 0.60986328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 10.0, 5.0, 14.0, 24.0, 29.0, 38.0, 65.0, 136.0, 318.0, 978.0, 9819.0, 4011281.0, 167656.0, 2868.0, 597.0, 228.0, 80.0, 47.0, 27.0, 21.0, 5.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.1875, -36.90478515625, -35.6220703125, -34.33935546875, -33.056640625, -31.77392578125, -30.4912109375, -29.20849609375, -27.92578125, -26.64306640625, -25.3603515625, -24.07763671875, -22.794921875, -21.51220703125, -20.2294921875, -18.94677734375, -17.6640625, -16.38134765625, -15.0986328125, -13.81591796875, -12.533203125, -11.25048828125, -9.9677734375, -8.68505859375, -7.40234375, -6.11962890625, -4.8369140625, -3.55419921875, -2.271484375, -0.98876953125, 0.2939453125, 1.57666015625, 2.859375, 4.14208984375, 5.4248046875, 6.70751953125, 7.990234375, 9.27294921875, 10.5556640625, 11.83837890625, 13.12109375, 14.40380859375, 15.6865234375, 16.96923828125, 18.251953125, 19.53466796875, 20.8173828125, 22.10009765625, 23.3828125, 24.66552734375, 25.9482421875, 27.23095703125, 28.513671875, 29.79638671875, 31.0791015625, 32.36181640625, 33.64453125, 34.92724609375, 36.2099609375, 37.49267578125, 38.775390625, 40.05810546875, 41.3408203125, 42.62353515625, 43.90625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 16.0, 30.0, 70.0, 123.0, 255.0, 668.0, 1782.0, 629.0, 224.0, 113.0, 49.0, 33.0, 22.0, 21.0, 10.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5, -2.425384521484375, -2.35076904296875, -2.276153564453125, -2.2015380859375, -2.126922607421875, -2.05230712890625, -1.977691650390625, -1.903076171875, -1.828460693359375, -1.75384521484375, -1.679229736328125, -1.6046142578125, -1.529998779296875, -1.45538330078125, -1.380767822265625, -1.30615234375, -1.231536865234375, -1.15692138671875, -1.082305908203125, -1.0076904296875, -0.933074951171875, -0.85845947265625, -0.783843994140625, -0.709228515625, -0.634613037109375, -0.55999755859375, -0.485382080078125, -0.4107666015625, -0.336151123046875, -0.26153564453125, -0.186920166015625, -0.1123046875, -0.037689208984375, 0.03692626953125, 0.111541748046875, 0.1861572265625, 0.260772705078125, 0.33538818359375, 0.410003662109375, 0.484619140625, 0.559234619140625, 0.63385009765625, 0.708465576171875, 0.7830810546875, 0.857696533203125, 0.93231201171875, 1.006927490234375, 1.08154296875, 1.156158447265625, 1.23077392578125, 1.305389404296875, 1.3800048828125, 1.454620361328125, 1.52923583984375, 1.603851318359375, 1.678466796875, 1.753082275390625, 1.82769775390625, 1.902313232421875, 1.9769287109375, 2.051544189453125, 2.12615966796875, 2.200775146484375, 2.275390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 6.0, 20.0, 47.0, 129.0, 226.0, 281.0, 156.0, 65.0, 33.0, 20.0, 13.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.47102355957031, -37.68798828125, -36.90494918823242, -36.12191390991211, -35.33887481689453, -34.55583953857422, -33.77280044555664, -32.98976516723633, -32.20672607421875, -31.423688888549805, -30.64065170288086, -29.857614517211914, -29.07457733154297, -28.291540145874023, -27.508502960205078, -26.725467681884766, -25.94243049621582, -25.159393310546875, -24.37635612487793, -23.593318939208984, -22.81028175354004, -22.027244567871094, -21.24420928955078, -20.461170196533203, -19.67813491821289, -18.895097732543945, -18.112060546875, -17.329023361206055, -16.54598617553711, -15.762948989868164, -14.979912757873535, -14.19687557220459, -13.413839340209961, -12.630802154541016, -11.84776496887207, -11.064727783203125, -10.28169059753418, -9.498653411865234, -8.715617179870605, -7.93257999420166, -7.149542808532715, -6.3665056228637695, -5.583468437194824, -4.800431728363037, -4.017394542694092, -3.2343573570251465, -2.4513206481933594, -1.668283462524414, -0.8852462768554688, -0.10220921039581299, 0.6808278560638428, 1.463864803314209, 2.2469019889831543, 3.0299391746520996, 3.8129758834838867, 4.596013069152832, 5.379050254821777, 6.162087440490723, 6.945124626159668, 7.728161334991455, 8.511198043823242, 9.294235229492188, 10.077272415161133, 10.860309600830078, 11.643346786499023]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 13.0, 9.0, 14.0, 16.0, 14.0, 31.0, 25.0, 28.0, 27.0, 33.0, 27.0, 37.0, 45.0, 40.0, 39.0, 43.0, 51.0, 52.0, 49.0, 39.0, 34.0, 42.0, 32.0, 31.0, 34.0, 32.0, 26.0, 33.0, 23.0, 17.0, 12.0, 8.0, 10.0, 6.0, 4.0, 4.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.217605590820312, -7.970247268676758, -7.722888946533203, -7.475530624389648, -7.228172302246094, -6.980813980102539, -6.733455657958984, -6.48609733581543, -6.238739013671875, -5.99138069152832, -5.744022369384766, -5.496664047241211, -5.249305725097656, -5.001947402954102, -4.754589080810547, -4.507230758666992, -4.259871959686279, -4.012513637542725, -3.76515531539917, -3.5177969932556152, -3.2704386711120605, -3.023080348968506, -2.775721788406372, -2.5283634662628174, -2.2810051441192627, -2.033646821975708, -1.7862884998321533, -1.538930058479309, -1.2915717363357544, -1.0442134141921997, -0.7968549728393555, -0.5494966506958008, -0.3021388053894043, -0.05478045344352722, 0.19257789850234985, 0.4399362802505493, 0.687294602394104, 0.9346529245376587, 1.182011365890503, 1.4293696880340576, 1.6767280101776123, 1.924086332321167, 2.1714446544647217, 2.4188032150268555, 2.66616153717041, 2.913519859313965, 3.1608781814575195, 3.408236503601074, 3.655594825744629, 3.9029531478881836, 4.150311470031738, 4.397669792175293, 4.645028114318848, 4.892386436462402, 5.139744758605957, 5.387103080749512, 5.634461402893066, 5.881819725036621, 6.129178047180176, 6.3765363693237305, 6.623894691467285, 6.87125301361084, 7.1186113357543945, 7.365969657897949, 7.613328456878662]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 6.0, 9.0, 3.0, 5.0, 7.0, 9.0, 9.0, 11.0, 12.0, 13.0, 14.0, 21.0, 35.0, 58.0, 81.0, 183.0, 463.0, 1476.0, 5335.0, 21748.0, 104779.0, 459458.0, 360068.0, 72870.0, 15862.0, 4076.0, 1148.0, 377.0, 165.0, 64.0, 42.0, 23.0, 21.0, 17.0, 21.0, 9.0, 9.0, 6.0, 8.0, 10.0, 6.0, 4.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.33203125, -7.08673095703125, -6.8414306640625, -6.59613037109375, -6.350830078125, -6.10552978515625, -5.8602294921875, -5.61492919921875, -5.36962890625, -5.12432861328125, -4.8790283203125, -4.63372802734375, -4.388427734375, -4.14312744140625, -3.8978271484375, -3.65252685546875, -3.4072265625, -3.16192626953125, -2.9166259765625, -2.67132568359375, -2.426025390625, -2.18072509765625, -1.9354248046875, -1.69012451171875, -1.44482421875, -1.19952392578125, -0.9542236328125, -0.70892333984375, -0.463623046875, -0.21832275390625, 0.0269775390625, 0.27227783203125, 0.517578125, 0.76287841796875, 1.0081787109375, 1.25347900390625, 1.498779296875, 1.74407958984375, 1.9893798828125, 2.23468017578125, 2.47998046875, 2.72528076171875, 2.9705810546875, 3.21588134765625, 3.461181640625, 3.70648193359375, 3.9517822265625, 4.19708251953125, 4.4423828125, 4.68768310546875, 4.9329833984375, 5.17828369140625, 5.423583984375, 5.66888427734375, 5.9141845703125, 6.15948486328125, 6.40478515625, 6.65008544921875, 6.8953857421875, 7.14068603515625, 7.385986328125, 7.63128662109375, 7.8765869140625, 8.12188720703125, 8.3671875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 15.0, 9.0, 10.0, 24.0, 32.0, 54.0, 51.0, 61.0, 75.0, 83.0, 80.0, 88.0, 75.0, 80.0, 65.0, 58.0, 52.0, 24.0, 23.0, 23.0, 16.0, 4.0, 7.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1274642944335938, -1.1006317138671875, -1.0737991333007812, -1.046966552734375, -1.0201339721679688, -0.9933013916015625, -0.9664688110351562, -0.93963623046875, -0.9128036499023438, -0.8859710693359375, -0.8591384887695312, -0.832305908203125, -0.8054733276367188, -0.7786407470703125, -0.7518081665039062, -0.7249755859375, -0.6981430053710938, -0.6713104248046875, -0.6444778442382812, -0.617645263671875, -0.5908126831054688, -0.5639801025390625, -0.5371475219726562, -0.51031494140625, -0.48348236083984375, -0.4566497802734375, -0.42981719970703125, -0.402984619140625, -0.37615203857421875, -0.3493194580078125, -0.32248687744140625, -0.295654296875, -0.26882171630859375, -0.2419891357421875, -0.21515655517578125, -0.188323974609375, -0.16149139404296875, -0.1346588134765625, -0.10782623291015625, -0.08099365234375, -0.05416107177734375, -0.0273284912109375, -0.00049591064453125, 0.026336669921875, 0.05316925048828125, 0.0800018310546875, 0.10683441162109375, 0.1336669921875, 0.16049957275390625, 0.1873321533203125, 0.21416473388671875, 0.240997314453125, 0.26782989501953125, 0.2946624755859375, 0.32149505615234375, 0.34832763671875, 0.37516021728515625, 0.4019927978515625, 0.42882537841796875, 0.455657958984375, 0.48249053955078125, 0.5093231201171875, 0.5361557006835938, 0.56298828125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 6.0, 4.0, 11.0, 15.0, 17.0, 37.0, 41.0, 66.0, 100.0, 196.0, 298.0, 539.0, 837.0, 1633.0, 3425.0, 8137.0, 22707.0, 69972.0, 223625.0, 406431.0, 210624.0, 64410.0, 20963.0, 7635.0, 3126.0, 1534.0, 840.0, 500.0, 304.0, 187.0, 105.0, 67.0, 45.0, 36.0, 19.0, 19.0, 9.0, 6.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.99609375, -4.81427001953125, -4.6324462890625, -4.45062255859375, -4.268798828125, -4.08697509765625, -3.9051513671875, -3.72332763671875, -3.54150390625, -3.35968017578125, -3.1778564453125, -2.99603271484375, -2.814208984375, -2.63238525390625, -2.4505615234375, -2.26873779296875, -2.0869140625, -1.90509033203125, -1.7232666015625, -1.54144287109375, -1.359619140625, -1.17779541015625, -0.9959716796875, -0.81414794921875, -0.63232421875, -0.45050048828125, -0.2686767578125, -0.08685302734375, 0.094970703125, 0.27679443359375, 0.4586181640625, 0.64044189453125, 0.822265625, 1.00408935546875, 1.1859130859375, 1.36773681640625, 1.549560546875, 1.73138427734375, 1.9132080078125, 2.09503173828125, 2.27685546875, 2.45867919921875, 2.6405029296875, 2.82232666015625, 3.004150390625, 3.18597412109375, 3.3677978515625, 3.54962158203125, 3.7314453125, 3.91326904296875, 4.0950927734375, 4.27691650390625, 4.458740234375, 4.64056396484375, 4.8223876953125, 5.00421142578125, 5.18603515625, 5.36785888671875, 5.5496826171875, 5.73150634765625, 5.913330078125, 6.09515380859375, 6.2769775390625, 6.45880126953125, 6.640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 12.0, 13.0, 17.0, 25.0, 26.0, 42.0, 35.0, 67.0, 44.0, 51.0, 48.0, 62.0, 60.0, 65.0, 66.0, 50.0, 52.0, 42.0, 45.0, 49.0, 29.0, 23.0, 18.0, 16.0, 18.0, 9.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.764862060546875, -3.62152099609375, -3.478179931640625, -3.3348388671875, -3.191497802734375, -3.04815673828125, -2.904815673828125, -2.761474609375, -2.618133544921875, -2.47479248046875, -2.331451416015625, -2.1881103515625, -2.044769287109375, -1.90142822265625, -1.758087158203125, -1.61474609375, -1.471405029296875, -1.32806396484375, -1.184722900390625, -1.0413818359375, -0.898040771484375, -0.75469970703125, -0.611358642578125, -0.468017578125, -0.324676513671875, -0.18133544921875, -0.037994384765625, 0.1053466796875, 0.248687744140625, 0.39202880859375, 0.535369873046875, 0.6787109375, 0.822052001953125, 0.96539306640625, 1.108734130859375, 1.2520751953125, 1.395416259765625, 1.53875732421875, 1.682098388671875, 1.825439453125, 1.968780517578125, 2.11212158203125, 2.255462646484375, 2.3988037109375, 2.542144775390625, 2.68548583984375, 2.828826904296875, 2.97216796875, 3.115509033203125, 3.25885009765625, 3.402191162109375, 3.5455322265625, 3.688873291015625, 3.83221435546875, 3.975555419921875, 4.118896484375, 4.262237548828125, 4.40557861328125, 4.548919677734375, 4.6922607421875, 4.835601806640625, 4.97894287109375, 5.122283935546875, 5.265625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 7.0, 6.0, 3.0, 8.0, 10.0, 14.0, 12.0, 29.0, 37.0, 44.0, 77.0, 86.0, 132.0, 185.0, 311.0, 414.0, 647.0, 1026.0, 1579.0, 2782.0, 4822.0, 9043.0, 21285.0, 81700.0, 483332.0, 349197.0, 56298.0, 16985.0, 7611.0, 4099.0, 2481.0, 1433.0, 907.0, 585.0, 435.0, 257.0, 184.0, 145.0, 112.0, 67.0, 39.0, 34.0, 32.0, 21.0, 11.0, 13.0, 3.0, 2.0, 6.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.40234375, -7.16265869140625, -6.9229736328125, -6.68328857421875, -6.443603515625, -6.20391845703125, -5.9642333984375, -5.72454833984375, -5.48486328125, -5.24517822265625, -5.0054931640625, -4.76580810546875, -4.526123046875, -4.28643798828125, -4.0467529296875, -3.80706787109375, -3.5673828125, -3.32769775390625, -3.0880126953125, -2.84832763671875, -2.608642578125, -2.36895751953125, -2.1292724609375, -1.88958740234375, -1.64990234375, -1.41021728515625, -1.1705322265625, -0.93084716796875, -0.691162109375, -0.45147705078125, -0.2117919921875, 0.02789306640625, 0.267578125, 0.50726318359375, 0.7469482421875, 0.98663330078125, 1.226318359375, 1.46600341796875, 1.7056884765625, 1.94537353515625, 2.18505859375, 2.42474365234375, 2.6644287109375, 2.90411376953125, 3.143798828125, 3.38348388671875, 3.6231689453125, 3.86285400390625, 4.1025390625, 4.34222412109375, 4.5819091796875, 4.82159423828125, 5.061279296875, 5.30096435546875, 5.5406494140625, 5.78033447265625, 6.02001953125, 6.25970458984375, 6.4993896484375, 6.73907470703125, 6.978759765625, 7.21844482421875, 7.4581298828125, 7.69781494140625, 7.9375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 9.0, 11.0, 15.0, 21.0, 27.0, 34.0, 60.0, 51.0, 68.0, 83.0, 84.0, 96.0, 91.0, 71.0, 58.0, 52.0, 31.0, 24.0, 23.0, 18.0, 10.0, 9.0, 13.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00064849853515625, -0.0006305575370788574, -0.0006126165390014648, -0.0005946755409240723, -0.0005767345428466797, -0.0005587935447692871, -0.0005408525466918945, -0.000522911548614502, -0.0005049705505371094, -0.0004870295524597168, -0.0004690885543823242, -0.00045114755630493164, -0.00043320655822753906, -0.0004152655601501465, -0.0003973245620727539, -0.00037938356399536133, -0.00036144256591796875, -0.00034350156784057617, -0.0003255605697631836, -0.000307619571685791, -0.00028967857360839844, -0.00027173757553100586, -0.0002537965774536133, -0.0002358555793762207, -0.00021791458129882812, -0.00019997358322143555, -0.00018203258514404297, -0.0001640915870666504, -0.0001461505889892578, -0.00012820959091186523, -0.00011026859283447266, -9.232759475708008e-05, -7.43865966796875e-05, -5.644559860229492e-05, -3.8504600524902344e-05, -2.0563602447509766e-05, -2.6226043701171875e-06, 1.531839370727539e-05, 3.325939178466797e-05, 5.120038986206055e-05, 6.914138793945312e-05, 8.70823860168457e-05, 0.00010502338409423828, 0.00012296438217163086, 0.00014090538024902344, 0.00015884637832641602, 0.0001767873764038086, 0.00019472837448120117, 0.00021266937255859375, 0.00023061037063598633, 0.0002485513687133789, 0.0002664923667907715, 0.00028443336486816406, 0.00030237436294555664, 0.0003203153610229492, 0.0003382563591003418, 0.0003561973571777344, 0.00037413835525512695, 0.00039207935333251953, 0.0004100203514099121, 0.0004279613494873047, 0.00044590234756469727, 0.00046384334564208984, 0.0004817843437194824, 0.000499725341796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 9.0, 11.0, 10.0, 6.0, 13.0, 31.0, 38.0, 77.0, 144.0, 200.0, 415.0, 678.0, 1337.0, 3559.0, 13378.0, 98418.0, 753875.0, 151628.0, 17240.0, 4375.0, 1623.0, 676.0, 330.0, 201.0, 113.0, 56.0, 43.0, 33.0, 18.0, 10.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1484375, -10.79541015625, -10.4423828125, -10.08935546875, -9.736328125, -9.38330078125, -9.0302734375, -8.67724609375, -8.32421875, -7.97119140625, -7.6181640625, -7.26513671875, -6.912109375, -6.55908203125, -6.2060546875, -5.85302734375, -5.5, -5.14697265625, -4.7939453125, -4.44091796875, -4.087890625, -3.73486328125, -3.3818359375, -3.02880859375, -2.67578125, -2.32275390625, -1.9697265625, -1.61669921875, -1.263671875, -0.91064453125, -0.5576171875, -0.20458984375, 0.1484375, 0.50146484375, 0.8544921875, 1.20751953125, 1.560546875, 1.91357421875, 2.2666015625, 2.61962890625, 2.97265625, 3.32568359375, 3.6787109375, 4.03173828125, 4.384765625, 4.73779296875, 5.0908203125, 5.44384765625, 5.796875, 6.14990234375, 6.5029296875, 6.85595703125, 7.208984375, 7.56201171875, 7.9150390625, 8.26806640625, 8.62109375, 8.97412109375, 9.3271484375, 9.68017578125, 10.033203125, 10.38623046875, 10.7392578125, 11.09228515625, 11.4453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 6.0, 11.0, 13.0, 26.0, 30.0, 54.0, 88.0, 131.0, 151.0, 146.0, 100.0, 73.0, 42.0, 32.0, 23.0, 13.0, 13.0, 8.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.59765625, -6.4273681640625, -6.257080078125, -6.0867919921875, -5.91650390625, -5.7462158203125, -5.575927734375, -5.4056396484375, -5.2353515625, -5.0650634765625, -4.894775390625, -4.7244873046875, -4.55419921875, -4.3839111328125, -4.213623046875, -4.0433349609375, -3.873046875, -3.7027587890625, -3.532470703125, -3.3621826171875, -3.19189453125, -3.0216064453125, -2.851318359375, -2.6810302734375, -2.5107421875, -2.3404541015625, -2.170166015625, -1.9998779296875, -1.82958984375, -1.6593017578125, -1.489013671875, -1.3187255859375, -1.1484375, -0.9781494140625, -0.807861328125, -0.6375732421875, -0.46728515625, -0.2969970703125, -0.126708984375, 0.0435791015625, 0.2138671875, 0.3841552734375, 0.554443359375, 0.7247314453125, 0.89501953125, 1.0653076171875, 1.235595703125, 1.4058837890625, 1.576171875, 1.7464599609375, 1.916748046875, 2.0870361328125, 2.25732421875, 2.4276123046875, 2.597900390625, 2.7681884765625, 2.9384765625, 3.1087646484375, 3.279052734375, 3.4493408203125, 3.61962890625, 3.7899169921875, 3.960205078125, 4.1304931640625, 4.30078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 17.0, 37.0, 56.0, 133.0, 254.0, 285.0, 125.0, 54.0, 16.0, 14.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.52326202392578, -81.89424896240234, -79.26522827148438, -76.63621520996094, -74.0072021484375, -71.37818145751953, -68.7491683959961, -66.12014770507812, -63.49113464355469, -60.862117767333984, -58.23310089111328, -55.604087829589844, -52.97507095336914, -50.34605407714844, -47.717041015625, -45.0880241394043, -42.459007263183594, -39.82999038696289, -37.20097351074219, -34.57196044921875, -31.942943572998047, -29.313926696777344, -26.684911727905273, -24.055896759033203, -21.4268798828125, -18.797863006591797, -16.168848037719727, -13.53983211517334, -10.910816192626953, -8.281800270080566, -5.65278434753418, -3.0237693786621094, -0.3947601318359375, 2.234255790710449, 4.863271713256836, 7.492287635803223, 10.12130355834961, 12.750319480895996, 15.379335403442383, 18.008350372314453, 20.637367248535156, 23.26638412475586, 25.89539909362793, 28.5244140625, 31.153430938720703, 33.782447814941406, 36.411460876464844, 39.04047775268555, 41.66949462890625, 44.29851150512695, 46.927528381347656, 49.556541442871094, 52.1855583190918, 54.8145751953125, 57.44358825683594, 60.07260513305664, 62.701622009277344, 65.33063507080078, 67.95965576171875, 70.58866882324219, 73.21768188476562, 75.8467025756836, 78.47571563720703, 81.104736328125, 83.73374938964844]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 2.0, 12.0, 4.0, 17.0, 14.0, 14.0, 14.0, 25.0, 17.0, 46.0, 34.0, 38.0, 44.0, 62.0, 40.0, 63.0, 63.0, 54.0, 50.0, 47.0, 49.0, 42.0, 37.0, 32.0, 36.0, 29.0, 19.0, 16.0, 20.0, 13.0, 15.0, 10.0, 7.0, 4.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.595651626586914, -23.660932540893555, -22.726213455200195, -21.791492462158203, -20.856773376464844, -19.922054290771484, -18.987335205078125, -18.052616119384766, -17.117897033691406, -16.183177947998047, -15.248457908630371, -14.313738822937012, -13.379018783569336, -12.444299697875977, -11.509580612182617, -10.574861526489258, -9.640140533447266, -8.705421447753906, -7.7707014083862305, -6.835982322692871, -5.9012627601623535, -4.966543197631836, -4.031824111938477, -3.097104549407959, -2.1623849868774414, -1.2276655435562134, -0.29294610023498535, 0.6417732238769531, 1.5764927864074707, 2.5112123489379883, 3.4459314346313477, 4.380650997161865, 5.315372467041016, 6.250092029571533, 7.184811592102051, 8.11953067779541, 9.054250717163086, 9.988969802856445, 10.923688888549805, 11.858407974243164, 12.79312801361084, 13.7278470993042, 14.662567138671875, 15.597286224365234, 16.532005310058594, 17.466724395751953, 18.401443481445312, 19.336164474487305, 20.270883560180664, 21.205602645874023, 22.140321731567383, 23.075042724609375, 24.009761810302734, 24.944480895996094, 25.879199981689453, 26.813919067382812, 27.748638153076172, 28.68335723876953, 29.61807632446289, 30.55279541015625, 31.487516403198242, 32.42223358154297, 33.356956481933594, 34.29167556762695, 35.22639465332031]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 3.0, 5.0, 6.0, 9.0, 11.0, 20.0, 30.0, 34.0, 42.0, 65.0, 135.0, 172.0, 379.0, 917.0, 2506.0, 10690.0, 103494.0, 3975197.0, 88237.0, 9523.0, 1811.0, 496.0, 189.0, 97.0, 44.0, 48.0, 29.0, 27.0, 10.0, 15.0, 8.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.5, -32.629150390625, -31.75830078125, -30.887451171875, -30.0166015625, -29.145751953125, -28.27490234375, -27.404052734375, -26.533203125, -25.662353515625, -24.79150390625, -23.920654296875, -23.0498046875, -22.178955078125, -21.30810546875, -20.437255859375, -19.56640625, -18.695556640625, -17.82470703125, -16.953857421875, -16.0830078125, -15.212158203125, -14.34130859375, -13.470458984375, -12.599609375, -11.728759765625, -10.85791015625, -9.987060546875, -9.1162109375, -8.245361328125, -7.37451171875, -6.503662109375, -5.6328125, -4.761962890625, -3.89111328125, -3.020263671875, -2.1494140625, -1.278564453125, -0.40771484375, 0.463134765625, 1.333984375, 2.204833984375, 3.07568359375, 3.946533203125, 4.8173828125, 5.688232421875, 6.55908203125, 7.429931640625, 8.30078125, 9.171630859375, 10.04248046875, 10.913330078125, 11.7841796875, 12.655029296875, 13.52587890625, 14.396728515625, 15.267578125, 16.138427734375, 17.00927734375, 17.880126953125, 18.7509765625, 19.621826171875, 20.49267578125, 21.363525390625, 22.234375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 6.0, 9.0, 13.0, 12.0, 20.0, 24.0, 37.0, 39.0, 63.0, 67.0, 62.0, 75.0, 61.0, 70.0, 63.0, 55.0, 60.0, 61.0, 38.0, 30.0, 38.0, 26.0, 17.0, 10.0, 9.0, 6.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.158203125, -1.1298141479492188, -1.1014251708984375, -1.0730361938476562, -1.044647216796875, -1.0162582397460938, -0.9878692626953125, -0.9594802856445312, -0.93109130859375, -0.9027023315429688, -0.8743133544921875, -0.8459243774414062, -0.817535400390625, -0.7891464233398438, -0.7607574462890625, -0.7323684692382812, -0.7039794921875, -0.6755905151367188, -0.6472015380859375, -0.6188125610351562, -0.590423583984375, -0.5620346069335938, -0.5336456298828125, -0.5052566528320312, -0.47686767578125, -0.44847869873046875, -0.4200897216796875, -0.39170074462890625, -0.363311767578125, -0.33492279052734375, -0.3065338134765625, -0.27814483642578125, -0.249755859375, -0.22136688232421875, -0.1929779052734375, -0.16458892822265625, -0.136199951171875, -0.10781097412109375, -0.0794219970703125, -0.05103302001953125, -0.02264404296875, 0.00574493408203125, 0.0341339111328125, 0.06252288818359375, 0.090911865234375, 0.11930084228515625, 0.1476898193359375, 0.17607879638671875, 0.2044677734375, 0.23285675048828125, 0.2612457275390625, 0.28963470458984375, 0.318023681640625, 0.34641265869140625, 0.3748016357421875, 0.40319061279296875, 0.43157958984375, 0.45996856689453125, 0.4883575439453125, 0.5167465209960938, 0.545135498046875, 0.5735244750976562, 0.6019134521484375, 0.6303024291992188, 0.65869140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 8.0, 14.0, 20.0, 19.0, 31.0, 42.0, 53.0, 79.0, 93.0, 144.0, 187.0, 274.0, 593.0, 2756.0, 85548.0, 4060529.0, 40091.0, 2200.0, 581.0, 268.0, 188.0, 155.0, 124.0, 90.0, 64.0, 33.0, 31.0, 22.0, 20.0, 13.0, 4.0, 5.0, 0.0, 0.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.375, -40.268798828125, -39.16259765625, -38.056396484375, -36.9501953125, -35.843994140625, -34.73779296875, -33.631591796875, -32.525390625, -31.419189453125, -30.31298828125, -29.206787109375, -28.1005859375, -26.994384765625, -25.88818359375, -24.781982421875, -23.67578125, -22.569580078125, -21.46337890625, -20.357177734375, -19.2509765625, -18.144775390625, -17.03857421875, -15.932373046875, -14.826171875, -13.719970703125, -12.61376953125, -11.507568359375, -10.4013671875, -9.295166015625, -8.18896484375, -7.082763671875, -5.9765625, -4.870361328125, -3.76416015625, -2.657958984375, -1.5517578125, -0.445556640625, 0.66064453125, 1.766845703125, 2.873046875, 3.979248046875, 5.08544921875, 6.191650390625, 7.2978515625, 8.404052734375, 9.51025390625, 10.616455078125, 11.72265625, 12.828857421875, 13.93505859375, 15.041259765625, 16.1474609375, 17.253662109375, 18.35986328125, 19.466064453125, 20.572265625, 21.678466796875, 22.78466796875, 23.890869140625, 24.9970703125, 26.103271484375, 27.20947265625, 28.315673828125, 29.421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 20.0, 62.0, 217.0, 1461.0, 1864.0, 262.0, 98.0, 38.0, 29.0, 12.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.837890625, -3.63671875, -3.435546875, -3.234375, -3.033203125, -2.83203125, -2.630859375, -2.4296875, -2.228515625, -2.02734375, -1.826171875, -1.625, -1.423828125, -1.22265625, -1.021484375, -0.8203125, -0.619140625, -0.41796875, -0.216796875, -0.015625, 0.185546875, 0.38671875, 0.587890625, 0.7890625, 0.990234375, 1.19140625, 1.392578125, 1.59375, 1.794921875, 1.99609375, 2.197265625, 2.3984375, 2.599609375, 2.80078125, 3.001953125, 3.203125, 3.404296875, 3.60546875, 3.806640625, 4.0078125, 4.208984375, 4.41015625, 4.611328125, 4.8125, 5.013671875, 5.21484375, 5.416015625, 5.6171875, 5.818359375, 6.01953125, 6.220703125, 6.421875, 6.623046875, 6.82421875, 7.025390625, 7.2265625, 7.427734375, 7.62890625, 7.830078125, 8.03125, 8.232421875, 8.43359375, 8.634765625, 8.8359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 12.0, 44.0, 110.0, 296.0, 290.0, 166.0, 48.0, 10.0, 11.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.84372329711914, -46.252784729003906, -44.661842346191406, -43.07090377807617, -41.47996520996094, -39.88902282714844, -38.2980842590332, -36.70714569091797, -35.11620330810547, -33.525264739990234, -31.934324264526367, -30.3433837890625, -28.752445220947266, -27.1615047454834, -25.57056427001953, -23.979625701904297, -22.388687133789062, -20.797746658325195, -19.20680809020996, -17.615867614746094, -16.02492904663086, -14.433988571166992, -12.843048095703125, -11.252108573913574, -9.661169052124023, -8.070229530334473, -6.479289531707764, -4.888349533081055, -3.297410011291504, -1.7064704895019531, -0.11553001403808594, 1.4754095077514648, 3.06634521484375, 4.657284736633301, 6.24822473526001, 7.839164733886719, 9.43010425567627, 11.02104377746582, 12.611984252929688, 14.202923774719238, 15.793863296508789, 17.384803771972656, 18.97574234008789, 20.566682815551758, 22.157623291015625, 23.74856185913086, 25.339502334594727, 26.930442810058594, 28.521381378173828, 30.112321853637695, 31.70326042175293, 33.2942008972168, 34.88513946533203, 36.47608184814453, 38.067020416259766, 39.657958984375, 41.2489013671875, 42.839839935302734, 44.430782318115234, 46.02172088623047, 47.6126594543457, 49.20359802246094, 50.79454040527344, 52.38547897338867, 53.976417541503906]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 4.0, 5.0, 18.0, 12.0, 26.0, 27.0, 55.0, 45.0, 61.0, 69.0, 74.0, 79.0, 76.0, 87.0, 58.0, 74.0, 58.0, 42.0, 31.0, 23.0, 18.0, 19.0, 15.0, 7.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.940818786621094, -16.36530876159668, -15.78979778289795, -15.214287757873535, -14.638776779174805, -14.06326675415039, -13.487756729125977, -12.912245750427246, -12.336734771728516, -11.761224746704102, -11.185713768005371, -10.610203742980957, -10.034692764282227, -9.459182739257812, -8.883672714233398, -8.308161735534668, -7.732651710510254, -7.157141208648682, -6.581630706787109, -6.006120681762695, -5.430609703063965, -4.855099678039551, -4.2795891761779785, -3.7040786743164062, -3.128568172454834, -2.5530576705932617, -1.977547287940979, -1.4020369052886963, -0.826526403427124, -0.25101590156555176, 0.3244943618774414, 0.9000048637390137, 1.475515365600586, 2.051025867462158, 2.6265363693237305, 3.2020466327667236, 3.777557134628296, 4.353067398071289, 4.928577899932861, 5.504088401794434, 6.079598903656006, 6.655109405517578, 7.23061990737915, 7.806130409240723, 8.381640434265137, 8.957151412963867, 9.532661437988281, 10.108171463012695, 10.683682441711426, 11.25919246673584, 11.83470344543457, 12.410213470458984, 12.985724449157715, 13.561234474182129, 14.13674545288086, 14.712255477905273, 15.287765502929688, 15.863275527954102, 16.438785552978516, 17.014297485351562, 17.589807510375977, 18.16531753540039, 18.740827560424805, 19.31633758544922, 19.891849517822266]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 6.0, 10.0, 6.0, 9.0, 18.0, 37.0, 42.0, 49.0, 81.0, 143.0, 281.0, 487.0, 1010.0, 2379.0, 7191.0, 30153.0, 162411.0, 506547.0, 268861.0, 51739.0, 10978.0, 3361.0, 1306.0, 622.0, 304.0, 176.0, 85.0, 71.0, 33.0, 31.0, 26.0, 27.0, 16.0, 9.0, 8.0, 6.0, 3.0, 9.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1826171875, -8.873046875, -8.5634765625, -8.25390625, -7.9443359375, -7.634765625, -7.3251953125, -7.015625, -6.7060546875, -6.396484375, -6.0869140625, -5.77734375, -5.4677734375, -5.158203125, -4.8486328125, -4.5390625, -4.2294921875, -3.919921875, -3.6103515625, -3.30078125, -2.9912109375, -2.681640625, -2.3720703125, -2.0625, -1.7529296875, -1.443359375, -1.1337890625, -0.82421875, -0.5146484375, -0.205078125, 0.1044921875, 0.4140625, 0.7236328125, 1.033203125, 1.3427734375, 1.65234375, 1.9619140625, 2.271484375, 2.5810546875, 2.890625, 3.2001953125, 3.509765625, 3.8193359375, 4.12890625, 4.4384765625, 4.748046875, 5.0576171875, 5.3671875, 5.6767578125, 5.986328125, 6.2958984375, 6.60546875, 6.9150390625, 7.224609375, 7.5341796875, 7.84375, 8.1533203125, 8.462890625, 8.7724609375, 9.08203125, 9.3916015625, 9.701171875, 10.0107421875, 10.3203125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 9.0, 19.0, 13.0, 29.0, 27.0, 37.0, 51.0, 58.0, 69.0, 78.0, 92.0, 82.0, 91.0, 74.0, 59.0, 53.0, 46.0, 32.0, 20.0, 14.0, 16.0, 7.0, 8.0, 1.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.326171875, -1.2902679443359375, -1.254364013671875, -1.2184600830078125, -1.18255615234375, -1.1466522216796875, -1.110748291015625, -1.0748443603515625, -1.0389404296875, -1.0030364990234375, -0.967132568359375, -0.9312286376953125, -0.89532470703125, -0.8594207763671875, -0.823516845703125, -0.7876129150390625, -0.751708984375, -0.7158050537109375, -0.679901123046875, -0.6439971923828125, -0.60809326171875, -0.5721893310546875, -0.536285400390625, -0.5003814697265625, -0.4644775390625, -0.4285736083984375, -0.392669677734375, -0.3567657470703125, -0.32086181640625, -0.2849578857421875, -0.249053955078125, -0.2131500244140625, -0.17724609375, -0.1413421630859375, -0.105438232421875, -0.0695343017578125, -0.03363037109375, 0.0022735595703125, 0.038177490234375, 0.0740814208984375, 0.1099853515625, 0.1458892822265625, 0.181793212890625, 0.2176971435546875, 0.25360107421875, 0.2895050048828125, 0.325408935546875, 0.3613128662109375, 0.397216796875, 0.4331207275390625, 0.469024658203125, 0.5049285888671875, 0.54083251953125, 0.5767364501953125, 0.612640380859375, 0.6485443115234375, 0.6844482421875, 0.7203521728515625, 0.756256103515625, 0.7921600341796875, 0.82806396484375, 0.8639678955078125, 0.899871826171875, 0.9357757568359375, 0.9716796875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 18.0, 15.0, 16.0, 47.0, 57.0, 67.0, 104.0, 149.0, 245.0, 306.0, 495.0, 859.0, 1366.0, 2552.0, 4895.0, 11219.0, 28425.0, 78903.0, 207885.0, 337842.0, 227598.0, 88763.0, 31914.0, 12498.0, 5566.0, 2713.0, 1475.0, 854.0, 555.0, 377.0, 262.0, 159.0, 98.0, 78.0, 56.0, 38.0, 26.0, 11.0, 13.0, 12.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.20703125, -5.03662109375, -4.8662109375, -4.69580078125, -4.525390625, -4.35498046875, -4.1845703125, -4.01416015625, -3.84375, -3.67333984375, -3.5029296875, -3.33251953125, -3.162109375, -2.99169921875, -2.8212890625, -2.65087890625, -2.48046875, -2.31005859375, -2.1396484375, -1.96923828125, -1.798828125, -1.62841796875, -1.4580078125, -1.28759765625, -1.1171875, -0.94677734375, -0.7763671875, -0.60595703125, -0.435546875, -0.26513671875, -0.0947265625, 0.07568359375, 0.24609375, 0.41650390625, 0.5869140625, 0.75732421875, 0.927734375, 1.09814453125, 1.2685546875, 1.43896484375, 1.609375, 1.77978515625, 1.9501953125, 2.12060546875, 2.291015625, 2.46142578125, 2.6318359375, 2.80224609375, 2.97265625, 3.14306640625, 3.3134765625, 3.48388671875, 3.654296875, 3.82470703125, 3.9951171875, 4.16552734375, 4.3359375, 4.50634765625, 4.6767578125, 4.84716796875, 5.017578125, 5.18798828125, 5.3583984375, 5.52880859375, 5.69921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 9.0, 6.0, 10.0, 12.0, 15.0, 20.0, 28.0, 28.0, 33.0, 31.0, 43.0, 56.0, 50.0, 43.0, 43.0, 50.0, 59.0, 46.0, 53.0, 50.0, 58.0, 36.0, 42.0, 23.0, 17.0, 19.0, 20.0, 23.0, 19.0, 18.0, 12.0, 8.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.08984375, -4.94091796875, -4.7919921875, -4.64306640625, -4.494140625, -4.34521484375, -4.1962890625, -4.04736328125, -3.8984375, -3.74951171875, -3.6005859375, -3.45166015625, -3.302734375, -3.15380859375, -3.0048828125, -2.85595703125, -2.70703125, -2.55810546875, -2.4091796875, -2.26025390625, -2.111328125, -1.96240234375, -1.8134765625, -1.66455078125, -1.515625, -1.36669921875, -1.2177734375, -1.06884765625, -0.919921875, -0.77099609375, -0.6220703125, -0.47314453125, -0.32421875, -0.17529296875, -0.0263671875, 0.12255859375, 0.271484375, 0.42041015625, 0.5693359375, 0.71826171875, 0.8671875, 1.01611328125, 1.1650390625, 1.31396484375, 1.462890625, 1.61181640625, 1.7607421875, 1.90966796875, 2.05859375, 2.20751953125, 2.3564453125, 2.50537109375, 2.654296875, 2.80322265625, 2.9521484375, 3.10107421875, 3.25, 3.39892578125, 3.5478515625, 3.69677734375, 3.845703125, 3.99462890625, 4.1435546875, 4.29248046875, 4.44140625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 3.0, 8.0, 9.0, 19.0, 18.0, 37.0, 41.0, 55.0, 101.0, 182.0, 233.0, 392.0, 686.0, 1242.0, 2705.0, 6547.0, 20806.0, 103301.0, 549399.0, 296961.0, 45564.0, 11826.0, 4201.0, 1868.0, 930.0, 515.0, 299.0, 202.0, 128.0, 79.0, 56.0, 36.0, 29.0, 19.0, 14.0, 9.0, 9.0, 9.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.10546875, -5.87738037109375, -5.6492919921875, -5.42120361328125, -5.193115234375, -4.96502685546875, -4.7369384765625, -4.50885009765625, -4.28076171875, -4.05267333984375, -3.8245849609375, -3.59649658203125, -3.368408203125, -3.14031982421875, -2.9122314453125, -2.68414306640625, -2.4560546875, -2.22796630859375, -1.9998779296875, -1.77178955078125, -1.543701171875, -1.31561279296875, -1.0875244140625, -0.85943603515625, -0.63134765625, -0.40325927734375, -0.1751708984375, 0.05291748046875, 0.281005859375, 0.50909423828125, 0.7371826171875, 0.96527099609375, 1.193359375, 1.42144775390625, 1.6495361328125, 1.87762451171875, 2.105712890625, 2.33380126953125, 2.5618896484375, 2.78997802734375, 3.01806640625, 3.24615478515625, 3.4742431640625, 3.70233154296875, 3.930419921875, 4.15850830078125, 4.3865966796875, 4.61468505859375, 4.8427734375, 5.07086181640625, 5.2989501953125, 5.52703857421875, 5.755126953125, 5.98321533203125, 6.2113037109375, 6.43939208984375, 6.66748046875, 6.89556884765625, 7.1236572265625, 7.35174560546875, 7.579833984375, 7.80792236328125, 8.0360107421875, 8.26409912109375, 8.4921875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 11.0, 6.0, 11.0, 10.0, 28.0, 19.0, 29.0, 31.0, 36.0, 64.0, 47.0, 63.0, 84.0, 73.0, 73.0, 78.0, 37.0, 49.0, 55.0, 25.0, 38.0, 33.0, 23.0, 15.0, 9.0, 8.0, 12.0, 9.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005536079406738281, -0.0005367398262023926, -0.000519871711730957, -0.0005030035972595215, -0.00048613548278808594, -0.0004692673683166504, -0.00045239925384521484, -0.0004355311393737793, -0.00041866302490234375, -0.0004017949104309082, -0.00038492679595947266, -0.0003680586814880371, -0.00035119056701660156, -0.000334322452545166, -0.00031745433807373047, -0.0003005862236022949, -0.0002837181091308594, -0.00026684999465942383, -0.0002499818801879883, -0.00023311376571655273, -0.0002162456512451172, -0.00019937753677368164, -0.0001825094223022461, -0.00016564130783081055, -0.000148773193359375, -0.00013190507888793945, -0.0001150369644165039, -9.816884994506836e-05, -8.130073547363281e-05, -6.443262100219727e-05, -4.756450653076172e-05, -3.069639205932617e-05, -1.3828277587890625e-05, 3.039836883544922e-06, 1.990795135498047e-05, 3.6776065826416016e-05, 5.364418029785156e-05, 7.051229476928711e-05, 8.738040924072266e-05, 0.0001042485237121582, 0.00012111663818359375, 0.0001379847526550293, 0.00015485286712646484, 0.0001717209815979004, 0.00018858909606933594, 0.00020545721054077148, 0.00022232532501220703, 0.00023919343948364258, 0.0002560615539550781, 0.00027292966842651367, 0.0002897977828979492, 0.00030666589736938477, 0.0003235340118408203, 0.00034040212631225586, 0.0003572702407836914, 0.00037413835525512695, 0.0003910064697265625, 0.00040787458419799805, 0.0004247426986694336, 0.00044161081314086914, 0.0004584789276123047, 0.00047534704208374023, 0.0004922151565551758, 0.0005090832710266113, 0.0005259513854980469]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 11.0, 25.0, 28.0, 38.0, 91.0, 148.0, 287.0, 617.0, 1685.0, 5495.0, 25249.0, 229429.0, 659467.0, 105218.0, 14623.0, 3801.0, 1266.0, 503.0, 240.0, 132.0, 76.0, 38.0, 30.0, 23.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.0291748046875, -7.745849609375, -7.4625244140625, -7.17919921875, -6.8958740234375, -6.612548828125, -6.3292236328125, -6.0458984375, -5.7625732421875, -5.479248046875, -5.1959228515625, -4.91259765625, -4.6292724609375, -4.345947265625, -4.0626220703125, -3.779296875, -3.4959716796875, -3.212646484375, -2.9293212890625, -2.64599609375, -2.3626708984375, -2.079345703125, -1.7960205078125, -1.5126953125, -1.2293701171875, -0.946044921875, -0.6627197265625, -0.37939453125, -0.0960693359375, 0.187255859375, 0.4705810546875, 0.75390625, 1.0372314453125, 1.320556640625, 1.6038818359375, 1.88720703125, 2.1705322265625, 2.453857421875, 2.7371826171875, 3.0205078125, 3.3038330078125, 3.587158203125, 3.8704833984375, 4.15380859375, 4.4371337890625, 4.720458984375, 5.0037841796875, 5.287109375, 5.5704345703125, 5.853759765625, 6.1370849609375, 6.42041015625, 6.7037353515625, 6.987060546875, 7.2703857421875, 7.5537109375, 7.8370361328125, 8.120361328125, 8.4036865234375, 8.68701171875, 8.9703369140625, 9.253662109375, 9.5369873046875, 9.8203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 8.0, 11.0, 16.0, 19.0, 20.0, 32.0, 22.0, 43.0, 53.0, 51.0, 81.0, 70.0, 87.0, 85.0, 72.0, 66.0, 46.0, 37.0, 40.0, 39.0, 22.0, 13.0, 12.0, 16.0, 5.0, 5.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.66015625, -2.563690185546875, -2.46722412109375, -2.370758056640625, -2.2742919921875, -2.177825927734375, -2.08135986328125, -1.984893798828125, -1.888427734375, -1.791961669921875, -1.69549560546875, -1.599029541015625, -1.5025634765625, -1.406097412109375, -1.30963134765625, -1.213165283203125, -1.11669921875, -1.020233154296875, -0.92376708984375, -0.827301025390625, -0.7308349609375, -0.634368896484375, -0.53790283203125, -0.441436767578125, -0.344970703125, -0.248504638671875, -0.15203857421875, -0.055572509765625, 0.0408935546875, 0.137359619140625, 0.23382568359375, 0.330291748046875, 0.4267578125, 0.523223876953125, 0.61968994140625, 0.716156005859375, 0.8126220703125, 0.909088134765625, 1.00555419921875, 1.102020263671875, 1.198486328125, 1.294952392578125, 1.39141845703125, 1.487884521484375, 1.5843505859375, 1.680816650390625, 1.77728271484375, 1.873748779296875, 1.97021484375, 2.066680908203125, 2.16314697265625, 2.259613037109375, 2.3560791015625, 2.452545166015625, 2.54901123046875, 2.645477294921875, 2.741943359375, 2.838409423828125, 2.93487548828125, 3.031341552734375, 3.1278076171875, 3.224273681640625, 3.32073974609375, 3.417205810546875, 3.513671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 10.0, 23.0, 49.0, 139.0, 251.0, 263.0, 171.0, 58.0, 21.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.72164916992188, -78.82286834716797, -75.92408752441406, -73.02530670166016, -70.12652587890625, -67.22773742675781, -64.3289566040039, -61.43017578125, -58.531394958496094, -55.63261413574219, -52.73383331298828, -49.83504867553711, -46.9362678527832, -44.0374870300293, -41.138702392578125, -38.23992156982422, -35.34114074707031, -32.442359924316406, -29.543577194213867, -26.644794464111328, -23.746013641357422, -20.847232818603516, -17.948450088500977, -15.049667358398438, -12.150886535644531, -9.252104759216309, -6.353322982788086, -3.4545412063598633, -0.5557594299316406, 2.343022346496582, 5.241804122924805, 8.140586853027344, 11.039375305175781, 13.938157081604004, 16.836938858032227, 19.735721588134766, 22.634502410888672, 25.533283233642578, 28.432065963745117, 31.330848693847656, 34.22962951660156, 37.12841033935547, 40.027191162109375, 42.92597579956055, 45.82475662231445, 48.72353744506836, 51.62232208251953, 54.52110290527344, 57.419883728027344, 60.31866455078125, 63.217445373535156, 66.11622619628906, 69.0150146484375, 71.9137954711914, 74.81257629394531, 77.71135711669922, 80.61013793945312, 83.50891876220703, 86.40769958496094, 89.30648040771484, 92.20526123046875, 95.10404968261719, 98.0028305053711, 100.901611328125, 103.8003921508789]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 1.0, 4.0, 6.0, 11.0, 15.0, 10.0, 20.0, 17.0, 18.0, 17.0, 17.0, 28.0, 30.0, 39.0, 45.0, 33.0, 45.0, 50.0, 41.0, 45.0, 44.0, 38.0, 51.0, 60.0, 34.0, 36.0, 31.0, 31.0, 29.0, 22.0, 23.0, 18.0, 22.0, 9.0, 19.0, 8.0, 6.0, 7.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.534027099609375, -24.625118255615234, -23.716209411621094, -22.80729866027832, -21.89838981628418, -20.98948097229004, -20.080570220947266, -19.171661376953125, -18.262752532958984, -17.353843688964844, -16.444934844970703, -15.53602409362793, -14.627115249633789, -13.718206405639648, -12.809296607971191, -11.900386810302734, -10.991477966308594, -10.082569122314453, -9.173659324645996, -8.264749526977539, -7.355840682983398, -6.4469313621521, -5.538022041320801, -4.629112720489502, -3.720203399658203, -2.8112940788269043, -1.9023847579956055, -0.9934754371643066, -0.08456611633300781, 0.824343204498291, 1.7332525253295898, 2.6421618461608887, 3.5510711669921875, 4.459980487823486, 5.368889808654785, 6.277799129486084, 7.186708450317383, 8.095617294311523, 9.00452709197998, 9.913436889648438, 10.822345733642578, 11.731254577636719, 12.640164375305176, 13.549074172973633, 14.457983016967773, 15.366891860961914, 16.275802612304688, 17.184711456298828, 18.09362030029297, 19.00252914428711, 19.91143798828125, 20.820348739624023, 21.729257583618164, 22.638166427612305, 23.547077178955078, 24.45598602294922, 25.36489486694336, 26.2738037109375, 27.18271255493164, 28.091623306274414, 29.000532150268555, 29.909440994262695, 30.81835174560547, 31.72726058959961, 32.63616943359375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 11.0, 14.0, 14.0, 14.0, 34.0, 32.0, 56.0, 83.0, 122.0, 166.0, 323.0, 633.0, 1424.0, 3629.0, 11716.0, 58756.0, 3202576.0, 859507.0, 40310.0, 9386.0, 3074.0, 1222.0, 518.0, 252.0, 138.0, 96.0, 63.0, 32.0, 25.0, 13.0, 10.0, 10.0, 8.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-17.859375, -17.33251953125, -16.8056640625, -16.27880859375, -15.751953125, -15.22509765625, -14.6982421875, -14.17138671875, -13.64453125, -13.11767578125, -12.5908203125, -12.06396484375, -11.537109375, -11.01025390625, -10.4833984375, -9.95654296875, -9.4296875, -8.90283203125, -8.3759765625, -7.84912109375, -7.322265625, -6.79541015625, -6.2685546875, -5.74169921875, -5.21484375, -4.68798828125, -4.1611328125, -3.63427734375, -3.107421875, -2.58056640625, -2.0537109375, -1.52685546875, -1.0, -0.47314453125, 0.0537109375, 0.58056640625, 1.107421875, 1.63427734375, 2.1611328125, 2.68798828125, 3.21484375, 3.74169921875, 4.2685546875, 4.79541015625, 5.322265625, 5.84912109375, 6.3759765625, 6.90283203125, 7.4296875, 7.95654296875, 8.4833984375, 9.01025390625, 9.537109375, 10.06396484375, 10.5908203125, 11.11767578125, 11.64453125, 12.17138671875, 12.6982421875, 13.22509765625, 13.751953125, 14.27880859375, 14.8056640625, 15.33251953125, 15.859375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 5.0, 6.0, 10.0, 6.0, 20.0, 23.0, 23.0, 17.0, 24.0, 30.0, 44.0, 42.0, 65.0, 47.0, 53.0, 59.0, 58.0, 57.0, 45.0, 53.0, 37.0, 46.0, 42.0, 30.0, 31.0, 26.0, 30.0, 20.0, 5.0, 17.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -0.9984588623046875, -0.966644287109375, -0.9348297119140625, -0.90301513671875, -0.8712005615234375, -0.839385986328125, -0.8075714111328125, -0.7757568359375, -0.7439422607421875, -0.712127685546875, -0.6803131103515625, -0.64849853515625, -0.6166839599609375, -0.584869384765625, -0.5530548095703125, -0.521240234375, -0.4894256591796875, -0.457611083984375, -0.4257965087890625, -0.39398193359375, -0.3621673583984375, -0.330352783203125, -0.2985382080078125, -0.2667236328125, -0.2349090576171875, -0.203094482421875, -0.1712799072265625, -0.13946533203125, -0.1076507568359375, -0.075836181640625, -0.0440216064453125, -0.01220703125, 0.0196075439453125, 0.051422119140625, 0.0832366943359375, 0.11505126953125, 0.1468658447265625, 0.178680419921875, 0.2104949951171875, 0.2423095703125, 0.2741241455078125, 0.305938720703125, 0.3377532958984375, 0.36956787109375, 0.4013824462890625, 0.433197021484375, 0.4650115966796875, 0.496826171875, 0.5286407470703125, 0.560455322265625, 0.5922698974609375, 0.62408447265625, 0.6558990478515625, 0.687713623046875, 0.7195281982421875, 0.7513427734375, 0.7831573486328125, 0.814971923828125, 0.8467864990234375, 0.87860107421875, 0.9104156494140625, 0.942230224609375, 0.9740447998046875, 1.005859375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 19.0, 24.0, 60.0, 83.0, 101.0, 167.0, 292.0, 747.0, 2232.0, 22650.0, 4031163.0, 130689.0, 4261.0, 991.0, 361.0, 156.0, 91.0, 63.0, 46.0, 27.0, 12.0, 8.0, 5.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-44.71875, -43.671142578125, -42.62353515625, -41.575927734375, -40.5283203125, -39.480712890625, -38.43310546875, -37.385498046875, -36.337890625, -35.290283203125, -34.24267578125, -33.195068359375, -32.1474609375, -31.099853515625, -30.05224609375, -29.004638671875, -27.95703125, -26.909423828125, -25.86181640625, -24.814208984375, -23.7666015625, -22.718994140625, -21.67138671875, -20.623779296875, -19.576171875, -18.528564453125, -17.48095703125, -16.433349609375, -15.3857421875, -14.338134765625, -13.29052734375, -12.242919921875, -11.1953125, -10.147705078125, -9.10009765625, -8.052490234375, -7.0048828125, -5.957275390625, -4.90966796875, -3.862060546875, -2.814453125, -1.766845703125, -0.71923828125, 0.328369140625, 1.3759765625, 2.423583984375, 3.47119140625, 4.518798828125, 5.56640625, 6.614013671875, 7.66162109375, 8.709228515625, 9.7568359375, 10.804443359375, 11.85205078125, 12.899658203125, 13.947265625, 14.994873046875, 16.04248046875, 17.090087890625, 18.1376953125, 19.185302734375, 20.23291015625, 21.280517578125, 22.328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 14.0, 32.0, 100.0, 344.0, 2008.0, 1172.0, 233.0, 87.0, 35.0, 17.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.890625, -8.708526611328125, -8.52642822265625, -8.344329833984375, -8.1622314453125, -7.980133056640625, -7.79803466796875, -7.615936279296875, -7.433837890625, -7.251739501953125, -7.06964111328125, -6.887542724609375, -6.7054443359375, -6.523345947265625, -6.34124755859375, -6.159149169921875, -5.97705078125, -5.794952392578125, -5.61285400390625, -5.430755615234375, -5.2486572265625, -5.066558837890625, -4.88446044921875, -4.702362060546875, -4.520263671875, -4.338165283203125, -4.15606689453125, -3.973968505859375, -3.7918701171875, -3.609771728515625, -3.42767333984375, -3.245574951171875, -3.0634765625, -2.881378173828125, -2.69927978515625, -2.517181396484375, -2.3350830078125, -2.152984619140625, -1.97088623046875, -1.788787841796875, -1.606689453125, -1.424591064453125, -1.24249267578125, -1.060394287109375, -0.8782958984375, -0.696197509765625, -0.51409912109375, -0.332000732421875, -0.14990234375, 0.032196044921875, 0.21429443359375, 0.396392822265625, 0.5784912109375, 0.760589599609375, 0.94268798828125, 1.124786376953125, 1.306884765625, 1.488983154296875, 1.67108154296875, 1.853179931640625, 2.0352783203125, 2.217376708984375, 2.39947509765625, 2.581573486328125, 2.763671875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 9.0, 12.0, 7.0, 21.0, 60.0, 104.0, 147.0, 198.0, 169.0, 113.0, 78.0, 31.0, 18.0, 12.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.525768280029297, -28.75773048400879, -27.98969268798828, -27.221656799316406, -26.4536190032959, -25.68558120727539, -24.917543411254883, -24.149505615234375, -23.3814697265625, -22.613431930541992, -21.845394134521484, -21.07735824584961, -20.3093204498291, -19.541282653808594, -18.773244857788086, -18.005207061767578, -17.23716926574707, -16.469131469726562, -15.701094627380371, -14.933056831359863, -14.165019989013672, -13.396982192993164, -12.628944396972656, -11.860906600952148, -11.092869758605957, -10.32483196258545, -9.556795120239258, -8.78875732421875, -8.020719528198242, -7.252682685852051, -6.484644889831543, -5.716607570648193, -4.948572158813477, -4.180534839630127, -3.4124972820281982, -2.6444597244262695, -1.87642240524292, -1.1083850860595703, -0.3403472900390625, 0.4276900291442871, 1.1957273483276367, 1.9637647867202759, 2.731802225112915, 3.4998397827148438, 4.267877101898193, 5.035914421081543, 5.803952217102051, 6.5719895362854, 7.34002685546875, 8.108064651489258, 8.87610149383545, 9.644139289855957, 10.412176132202148, 11.180213928222656, 11.948251724243164, 12.716289520263672, 13.484326362609863, 14.252364158630371, 15.020401000976562, 15.78843879699707, 16.556476593017578, 17.324512481689453, 18.092552185058594, 18.86058807373047, 19.628625869750977]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 7.0, 8.0, 9.0, 22.0, 32.0, 35.0, 37.0, 42.0, 70.0, 87.0, 89.0, 93.0, 97.0, 66.0, 63.0, 59.0, 53.0, 35.0, 30.0, 28.0, 14.0, 9.0, 13.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.939380645751953, -20.400766372680664, -19.862152099609375, -19.323537826538086, -18.784923553466797, -18.246309280395508, -17.70769500732422, -17.16908073425293, -16.63046646118164, -16.09185218811035, -15.553237915039062, -15.014623641967773, -14.476009368896484, -13.937395095825195, -13.398780822753906, -12.860166549682617, -12.321553230285645, -11.782938957214355, -11.244324684143066, -10.705710411071777, -10.167096138000488, -9.6284818649292, -9.089868545532227, -8.551254272460938, -8.012639999389648, -7.474025726318359, -6.93541145324707, -6.396797180175781, -5.858182907104492, -5.319568634033203, -4.780954837799072, -4.242340564727783, -3.703725814819336, -3.165111541748047, -2.626497268676758, -2.087883234024048, -1.5492689609527588, -1.0106546878814697, -0.47204065322875977, 0.0665736198425293, 0.6051878929138184, 1.1438021659851074, 1.682416319847107, 2.2210304737091064, 2.7596447467803955, 3.2982590198516846, 3.8368730545043945, 4.375487327575684, 4.914101600646973, 5.452715873718262, 5.991330146789551, 6.52994441986084, 7.068558692932129, 7.607172966003418, 8.14578628540039, 8.68440055847168, 9.223014831542969, 9.761629104614258, 10.300243377685547, 10.838857650756836, 11.377471923828125, 11.916086196899414, 12.454700469970703, 12.993314743041992, 13.531929016113281]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 2.0, 8.0, 9.0, 18.0, 22.0, 25.0, 35.0, 54.0, 70.0, 120.0, 153.0, 261.0, 471.0, 851.0, 1672.0, 3609.0, 8844.0, 24967.0, 75779.0, 216904.0, 367680.0, 224744.0, 79226.0, 26052.0, 9435.0, 3682.0, 1700.0, 878.0, 458.0, 272.0, 176.0, 123.0, 67.0, 61.0, 37.0, 17.0, 12.0, 13.0, 3.0, 10.0, 10.0, 6.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.50390625, -6.30987548828125, -6.1158447265625, -5.92181396484375, -5.727783203125, -5.53375244140625, -5.3397216796875, -5.14569091796875, -4.95166015625, -4.75762939453125, -4.5635986328125, -4.36956787109375, -4.175537109375, -3.98150634765625, -3.7874755859375, -3.59344482421875, -3.3994140625, -3.20538330078125, -3.0113525390625, -2.81732177734375, -2.623291015625, -2.42926025390625, -2.2352294921875, -2.04119873046875, -1.84716796875, -1.65313720703125, -1.4591064453125, -1.26507568359375, -1.071044921875, -0.87701416015625, -0.6829833984375, -0.48895263671875, -0.294921875, -0.10089111328125, 0.0931396484375, 0.28717041015625, 0.481201171875, 0.67523193359375, 0.8692626953125, 1.06329345703125, 1.25732421875, 1.45135498046875, 1.6453857421875, 1.83941650390625, 2.033447265625, 2.22747802734375, 2.4215087890625, 2.61553955078125, 2.8095703125, 3.00360107421875, 3.1976318359375, 3.39166259765625, 3.585693359375, 3.77972412109375, 3.9737548828125, 4.16778564453125, 4.36181640625, 4.55584716796875, 4.7498779296875, 4.94390869140625, 5.137939453125, 5.33197021484375, 5.5260009765625, 5.72003173828125, 5.9140625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 7.0, 8.0, 12.0, 13.0, 20.0, 18.0, 30.0, 37.0, 44.0, 44.0, 57.0, 64.0, 68.0, 62.0, 71.0, 57.0, 60.0, 54.0, 49.0, 53.0, 44.0, 25.0, 30.0, 20.0, 15.0, 14.0, 3.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.123046875, -1.0868682861328125, -1.050689697265625, -1.0145111083984375, -0.97833251953125, -0.9421539306640625, -0.905975341796875, -0.8697967529296875, -0.8336181640625, -0.7974395751953125, -0.761260986328125, -0.7250823974609375, -0.68890380859375, -0.6527252197265625, -0.616546630859375, -0.5803680419921875, -0.544189453125, -0.5080108642578125, -0.471832275390625, -0.4356536865234375, -0.39947509765625, -0.3632965087890625, -0.327117919921875, -0.2909393310546875, -0.2547607421875, -0.2185821533203125, -0.182403564453125, -0.1462249755859375, -0.11004638671875, -0.0738677978515625, -0.037689208984375, -0.0015106201171875, 0.03466796875, 0.0708465576171875, 0.107025146484375, 0.1432037353515625, 0.17938232421875, 0.2155609130859375, 0.251739501953125, 0.2879180908203125, 0.3240966796875, 0.3602752685546875, 0.396453857421875, 0.4326324462890625, 0.46881103515625, 0.5049896240234375, 0.541168212890625, 0.5773468017578125, 0.613525390625, 0.6497039794921875, 0.685882568359375, 0.7220611572265625, 0.75823974609375, 0.7944183349609375, 0.830596923828125, 0.8667755126953125, 0.9029541015625, 0.9391326904296875, 0.975311279296875, 1.0114898681640625, 1.04766845703125, 1.0838470458984375, 1.120025634765625, 1.1562042236328125, 1.1923828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 10.0, 17.0, 21.0, 34.0, 39.0, 74.0, 118.0, 163.0, 267.0, 404.0, 815.0, 1590.0, 3660.0, 9557.0, 29672.0, 103162.0, 320288.0, 377294.0, 140276.0, 39762.0, 12511.0, 4613.0, 1963.0, 905.0, 532.0, 301.0, 161.0, 105.0, 72.0, 45.0, 36.0, 23.0, 14.0, 12.0, 12.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.10546875, -5.90277099609375, -5.7000732421875, -5.49737548828125, -5.294677734375, -5.09197998046875, -4.8892822265625, -4.68658447265625, -4.48388671875, -4.28118896484375, -4.0784912109375, -3.87579345703125, -3.673095703125, -3.47039794921875, -3.2677001953125, -3.06500244140625, -2.8623046875, -2.65960693359375, -2.4569091796875, -2.25421142578125, -2.051513671875, -1.84881591796875, -1.6461181640625, -1.44342041015625, -1.24072265625, -1.03802490234375, -0.8353271484375, -0.63262939453125, -0.429931640625, -0.22723388671875, -0.0245361328125, 0.17816162109375, 0.380859375, 0.58355712890625, 0.7862548828125, 0.98895263671875, 1.191650390625, 1.39434814453125, 1.5970458984375, 1.79974365234375, 2.00244140625, 2.20513916015625, 2.4078369140625, 2.61053466796875, 2.813232421875, 3.01593017578125, 3.2186279296875, 3.42132568359375, 3.6240234375, 3.82672119140625, 4.0294189453125, 4.23211669921875, 4.434814453125, 4.63751220703125, 4.8402099609375, 5.04290771484375, 5.24560546875, 5.44830322265625, 5.6510009765625, 5.85369873046875, 6.056396484375, 6.25909423828125, 6.4617919921875, 6.66448974609375, 6.8671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 3.0, 2.0, 5.0, 7.0, 5.0, 4.0, 14.0, 7.0, 16.0, 13.0, 20.0, 20.0, 22.0, 32.0, 29.0, 28.0, 29.0, 40.0, 37.0, 29.0, 35.0, 42.0, 39.0, 43.0, 46.0, 43.0, 34.0, 43.0, 43.0, 31.0, 32.0, 22.0, 17.0, 15.0, 23.0, 14.0, 15.0, 18.0, 12.0, 13.0, 10.0, 11.0, 6.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.2421875, -4.117218017578125, -3.99224853515625, -3.867279052734375, -3.7423095703125, -3.617340087890625, -3.49237060546875, -3.367401123046875, -3.242431640625, -3.117462158203125, -2.99249267578125, -2.867523193359375, -2.7425537109375, -2.617584228515625, -2.49261474609375, -2.367645263671875, -2.24267578125, -2.117706298828125, -1.99273681640625, -1.867767333984375, -1.7427978515625, -1.617828369140625, -1.49285888671875, -1.367889404296875, -1.242919921875, -1.117950439453125, -0.99298095703125, -0.868011474609375, -0.7430419921875, -0.618072509765625, -0.49310302734375, -0.368133544921875, -0.2431640625, -0.118194580078125, 0.00677490234375, 0.131744384765625, 0.2567138671875, 0.381683349609375, 0.50665283203125, 0.631622314453125, 0.756591796875, 0.881561279296875, 1.00653076171875, 1.131500244140625, 1.2564697265625, 1.381439208984375, 1.50640869140625, 1.631378173828125, 1.75634765625, 1.881317138671875, 2.00628662109375, 2.131256103515625, 2.2562255859375, 2.381195068359375, 2.50616455078125, 2.631134033203125, 2.756103515625, 2.881072998046875, 3.00604248046875, 3.131011962890625, 3.2559814453125, 3.380950927734375, 3.50592041015625, 3.630889892578125, 3.755859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 8.0, 14.0, 19.0, 19.0, 54.0, 64.0, 102.0, 171.0, 313.0, 685.0, 1984.0, 6804.0, 30728.0, 185613.0, 567290.0, 209332.0, 34107.0, 7528.0, 2166.0, 762.0, 348.0, 192.0, 90.0, 63.0, 33.0, 19.0, 16.0, 12.0, 5.0, 2.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.48175048828125, -4.3189697265625, -4.15618896484375, -3.993408203125, -3.83062744140625, -3.6678466796875, -3.50506591796875, -3.34228515625, -3.17950439453125, -3.0167236328125, -2.85394287109375, -2.691162109375, -2.52838134765625, -2.3656005859375, -2.20281982421875, -2.0400390625, -1.87725830078125, -1.7144775390625, -1.55169677734375, -1.388916015625, -1.22613525390625, -1.0633544921875, -0.90057373046875, -0.73779296875, -0.57501220703125, -0.4122314453125, -0.24945068359375, -0.086669921875, 0.07611083984375, 0.2388916015625, 0.40167236328125, 0.564453125, 0.72723388671875, 0.8900146484375, 1.05279541015625, 1.215576171875, 1.37835693359375, 1.5411376953125, 1.70391845703125, 1.86669921875, 2.02947998046875, 2.1922607421875, 2.35504150390625, 2.517822265625, 2.68060302734375, 2.8433837890625, 3.00616455078125, 3.1689453125, 3.33172607421875, 3.4945068359375, 3.65728759765625, 3.820068359375, 3.98284912109375, 4.1456298828125, 4.30841064453125, 4.47119140625, 4.63397216796875, 4.7967529296875, 4.95953369140625, 5.122314453125, 5.28509521484375, 5.4478759765625, 5.61065673828125, 5.7734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 3.0, 8.0, 9.0, 12.0, 15.0, 16.0, 24.0, 34.0, 31.0, 48.0, 46.0, 74.0, 74.0, 84.0, 61.0, 91.0, 65.0, 60.0, 51.0, 36.0, 37.0, 33.0, 15.0, 17.0, 16.0, 8.0, 5.0, 12.0, 2.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004973411560058594, -0.00048185139894485474, -0.0004663616418838501, -0.00045087188482284546, -0.0004353821277618408, -0.0004198923707008362, -0.00040440261363983154, -0.0003889128565788269, -0.00037342309951782227, -0.0003579333424568176, -0.000342443585395813, -0.00032695382833480835, -0.0003114640712738037, -0.00029597431421279907, -0.00028048455715179443, -0.0002649948000907898, -0.00024950504302978516, -0.00023401528596878052, -0.00021852552890777588, -0.00020303577184677124, -0.0001875460147857666, -0.00017205625772476196, -0.00015656650066375732, -0.00014107674360275269, -0.00012558698654174805, -0.00011009722948074341, -9.460747241973877e-05, -7.911771535873413e-05, -6.362795829772949e-05, -4.8138201236724854e-05, -3.2648444175720215e-05, -1.7158687114715576e-05, -1.6689300537109375e-06, 1.3820827007293701e-05, 2.931058406829834e-05, 4.480034112930298e-05, 6.029009819030762e-05, 7.577985525131226e-05, 9.12696123123169e-05, 0.00010675936937332153, 0.00012224912643432617, 0.0001377388834953308, 0.00015322864055633545, 0.0001687183976173401, 0.00018420815467834473, 0.00019969791173934937, 0.000215187668800354, 0.00023067742586135864, 0.0002461671829223633, 0.0002616569399833679, 0.00027714669704437256, 0.0002926364541053772, 0.00030812621116638184, 0.0003236159682273865, 0.0003391057252883911, 0.00035459548234939575, 0.0003700852394104004, 0.00038557499647140503, 0.00040106475353240967, 0.0004165545105934143, 0.00043204426765441895, 0.0004475340247154236, 0.0004630237817764282, 0.00047851353883743286, 0.0004940032958984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 7.0, 3.0, 9.0, 13.0, 26.0, 21.0, 39.0, 65.0, 97.0, 136.0, 220.0, 382.0, 698.0, 1262.0, 2715.0, 6640.0, 19380.0, 77796.0, 330011.0, 437918.0, 125941.0, 29040.0, 9021.0, 3443.0, 1586.0, 828.0, 487.0, 261.0, 191.0, 103.0, 74.0, 27.0, 37.0, 27.0, 16.0, 11.0, 9.0, 4.0, 1.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9140625, -4.7742919921875, -4.634521484375, -4.4947509765625, -4.35498046875, -4.2152099609375, -4.075439453125, -3.9356689453125, -3.7958984375, -3.6561279296875, -3.516357421875, -3.3765869140625, -3.23681640625, -3.0970458984375, -2.957275390625, -2.8175048828125, -2.677734375, -2.5379638671875, -2.398193359375, -2.2584228515625, -2.11865234375, -1.9788818359375, -1.839111328125, -1.6993408203125, -1.5595703125, -1.4197998046875, -1.280029296875, -1.1402587890625, -1.00048828125, -0.8607177734375, -0.720947265625, -0.5811767578125, -0.44140625, -0.3016357421875, -0.161865234375, -0.0220947265625, 0.11767578125, 0.2574462890625, 0.397216796875, 0.5369873046875, 0.6767578125, 0.8165283203125, 0.956298828125, 1.0960693359375, 1.23583984375, 1.3756103515625, 1.515380859375, 1.6551513671875, 1.794921875, 1.9346923828125, 2.074462890625, 2.2142333984375, 2.35400390625, 2.4937744140625, 2.633544921875, 2.7733154296875, 2.9130859375, 3.0528564453125, 3.192626953125, 3.3323974609375, 3.47216796875, 3.6119384765625, 3.751708984375, 3.8914794921875, 4.03125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 6.0, 19.0, 17.0, 26.0, 33.0, 47.0, 49.0, 57.0, 73.0, 76.0, 89.0, 81.0, 62.0, 69.0, 52.0, 45.0, 45.0, 31.0, 16.0, 15.0, 13.0, 17.0, 11.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.2421875, -3.1595458984375, -3.076904296875, -2.9942626953125, -2.91162109375, -2.8289794921875, -2.746337890625, -2.6636962890625, -2.5810546875, -2.4984130859375, -2.415771484375, -2.3331298828125, -2.25048828125, -2.1678466796875, -2.085205078125, -2.0025634765625, -1.919921875, -1.8372802734375, -1.754638671875, -1.6719970703125, -1.58935546875, -1.5067138671875, -1.424072265625, -1.3414306640625, -1.2587890625, -1.1761474609375, -1.093505859375, -1.0108642578125, -0.92822265625, -0.8455810546875, -0.762939453125, -0.6802978515625, -0.59765625, -0.5150146484375, -0.432373046875, -0.3497314453125, -0.26708984375, -0.1844482421875, -0.101806640625, -0.0191650390625, 0.0634765625, 0.1461181640625, 0.228759765625, 0.3114013671875, 0.39404296875, 0.4766845703125, 0.559326171875, 0.6419677734375, 0.724609375, 0.8072509765625, 0.889892578125, 0.9725341796875, 1.05517578125, 1.1378173828125, 1.220458984375, 1.3031005859375, 1.3857421875, 1.4683837890625, 1.551025390625, 1.6336669921875, 1.71630859375, 1.7989501953125, 1.881591796875, 1.9642333984375, 2.046875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 6.0, 5.0, 7.0, 9.0, 32.0, 33.0, 66.0, 65.0, 97.0, 106.0, 109.0, 112.0, 91.0, 86.0, 53.0, 37.0, 28.0, 17.0, 14.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.335386276245117, -24.24995994567871, -23.164535522460938, -22.07910919189453, -20.993682861328125, -19.90825843811035, -18.822832107543945, -17.737407684326172, -16.651981353759766, -15.566555976867676, -14.481130599975586, -13.39570426940918, -12.31027889251709, -11.224853515625, -10.139427185058594, -9.054001808166504, -7.968576431274414, -6.883151054382324, -5.797725200653076, -4.712299346923828, -3.6268739700317383, -2.5414485931396484, -1.4560227394104004, -0.37059688568115234, 0.7148284912109375, 1.8002541065216064, 2.8856797218322754, 3.9711053371429443, 5.056530952453613, 6.141956329345703, 7.227382183074951, 8.3128080368042, 9.398235321044922, 10.483660697937012, 11.569086074829102, 12.654512405395508, 13.739937782287598, 14.825363159179688, 15.910789489746094, 16.9962158203125, 18.081640243530273, 19.16706657409668, 20.252490997314453, 21.33791732788086, 22.423343658447266, 23.50876808166504, 24.594194412231445, 25.67961883544922, 26.765045166015625, 27.85047149658203, 28.935895919799805, 30.02132225036621, 31.106746673583984, 32.19217300415039, 33.2775993347168, 34.3630256652832, 35.448448181152344, 36.53387451171875, 37.619300842285156, 38.7047233581543, 39.7901496887207, 40.87557601928711, 41.961002349853516, 43.04642868041992, 44.13185501098633]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 8.0, 11.0, 12.0, 19.0, 18.0, 16.0, 28.0, 34.0, 29.0, 41.0, 43.0, 70.0, 64.0, 50.0, 52.0, 63.0, 43.0, 57.0, 43.0, 44.0, 52.0, 27.0, 36.0, 31.0, 20.0, 9.0, 13.0, 12.0, 13.0, 9.0, 7.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.236547470092773, -30.21830177307129, -29.200056076049805, -28.181808471679688, -27.163562774658203, -26.14531707763672, -25.127071380615234, -24.10882568359375, -23.090579986572266, -22.07233428955078, -21.054088592529297, -20.035842895507812, -19.017595291137695, -17.99934959411621, -16.981103897094727, -15.962858200073242, -14.944610595703125, -13.92636489868164, -12.90811824798584, -11.889872550964355, -10.871625900268555, -9.85338020324707, -8.835134506225586, -7.816888332366943, -6.798642158508301, -5.780395984649658, -4.762149810791016, -3.7439041137695312, -2.7256579399108887, -1.707411766052246, -0.6891660690307617, 0.32908010482788086, 1.3473281860351562, 2.365574359893799, 3.3838202953338623, 4.402066230773926, 5.420312404632568, 6.438558578491211, 7.456804275512695, 8.47504997253418, 9.49329662322998, 10.511542320251465, 11.529788970947266, 12.54803466796875, 13.566280364990234, 14.584527015686035, 15.60277271270752, 16.62101936340332, 17.639265060424805, 18.65751075744629, 19.675756454467773, 20.69400405883789, 21.712249755859375, 22.73049545288086, 23.748741149902344, 24.766986846923828, 25.785232543945312, 26.803478240966797, 27.82172393798828, 28.839969635009766, 29.858217239379883, 30.876462936401367, 31.89470863342285, 32.91295623779297, 33.93120193481445]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 6.0, 0.0, 3.0, 7.0, 10.0, 16.0, 17.0, 24.0, 30.0, 48.0, 55.0, 65.0, 73.0, 140.0, 219.0, 347.0, 611.0, 1020.0, 2182.0, 5349.0, 16607.0, 81158.0, 3234237.0, 782470.0, 49430.0, 12125.0, 4129.0, 1858.0, 861.0, 461.0, 277.0, 146.0, 95.0, 72.0, 38.0, 29.0, 22.0, 8.0, 11.0, 10.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.03125, -11.7135009765625, -11.395751953125, -11.0780029296875, -10.76025390625, -10.4425048828125, -10.124755859375, -9.8070068359375, -9.4892578125, -9.1715087890625, -8.853759765625, -8.5360107421875, -8.21826171875, -7.9005126953125, -7.582763671875, -7.2650146484375, -6.947265625, -6.6295166015625, -6.311767578125, -5.9940185546875, -5.67626953125, -5.3585205078125, -5.040771484375, -4.7230224609375, -4.4052734375, -4.0875244140625, -3.769775390625, -3.4520263671875, -3.13427734375, -2.8165283203125, -2.498779296875, -2.1810302734375, -1.86328125, -1.5455322265625, -1.227783203125, -0.9100341796875, -0.59228515625, -0.2745361328125, 0.043212890625, 0.3609619140625, 0.6787109375, 0.9964599609375, 1.314208984375, 1.6319580078125, 1.94970703125, 2.2674560546875, 2.585205078125, 2.9029541015625, 3.220703125, 3.5384521484375, 3.856201171875, 4.1739501953125, 4.49169921875, 4.8094482421875, 5.127197265625, 5.4449462890625, 5.7626953125, 6.0804443359375, 6.398193359375, 6.7159423828125, 7.03369140625, 7.3514404296875, 7.669189453125, 7.9869384765625, 8.3046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 6.0, 6.0, 10.0, 16.0, 19.0, 29.0, 29.0, 52.0, 54.0, 56.0, 55.0, 66.0, 76.0, 63.0, 77.0, 71.0, 69.0, 51.0, 50.0, 35.0, 22.0, 27.0, 18.0, 19.0, 9.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.39453125, -1.35260009765625, -1.3106689453125, -1.26873779296875, -1.226806640625, -1.18487548828125, -1.1429443359375, -1.10101318359375, -1.05908203125, -1.01715087890625, -0.9752197265625, -0.93328857421875, -0.891357421875, -0.84942626953125, -0.8074951171875, -0.76556396484375, -0.7236328125, -0.68170166015625, -0.6397705078125, -0.59783935546875, -0.555908203125, -0.51397705078125, -0.4720458984375, -0.43011474609375, -0.38818359375, -0.34625244140625, -0.3043212890625, -0.26239013671875, -0.220458984375, -0.17852783203125, -0.1365966796875, -0.09466552734375, -0.052734375, -0.01080322265625, 0.0311279296875, 0.07305908203125, 0.114990234375, 0.15692138671875, 0.1988525390625, 0.24078369140625, 0.28271484375, 0.32464599609375, 0.3665771484375, 0.40850830078125, 0.450439453125, 0.49237060546875, 0.5343017578125, 0.57623291015625, 0.6181640625, 0.66009521484375, 0.7020263671875, 0.74395751953125, 0.785888671875, 0.82781982421875, 0.8697509765625, 0.91168212890625, 0.95361328125, 0.99554443359375, 1.0374755859375, 1.07940673828125, 1.121337890625, 1.16326904296875, 1.2052001953125, 1.24713134765625, 1.2890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 14.0, 13.0, 39.0, 34.0, 50.0, 70.0, 131.0, 164.0, 363.0, 1314.0, 18001.0, 4046622.0, 123616.0, 2758.0, 561.0, 215.0, 118.0, 75.0, 49.0, 33.0, 18.0, 19.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.625, -38.71826171875, -37.8115234375, -36.90478515625, -35.998046875, -35.09130859375, -34.1845703125, -33.27783203125, -32.37109375, -31.46435546875, -30.5576171875, -29.65087890625, -28.744140625, -27.83740234375, -26.9306640625, -26.02392578125, -25.1171875, -24.21044921875, -23.3037109375, -22.39697265625, -21.490234375, -20.58349609375, -19.6767578125, -18.77001953125, -17.86328125, -16.95654296875, -16.0498046875, -15.14306640625, -14.236328125, -13.32958984375, -12.4228515625, -11.51611328125, -10.609375, -9.70263671875, -8.7958984375, -7.88916015625, -6.982421875, -6.07568359375, -5.1689453125, -4.26220703125, -3.35546875, -2.44873046875, -1.5419921875, -0.63525390625, 0.271484375, 1.17822265625, 2.0849609375, 2.99169921875, 3.8984375, 4.80517578125, 5.7119140625, 6.61865234375, 7.525390625, 8.43212890625, 9.3388671875, 10.24560546875, 11.15234375, 12.05908203125, 12.9658203125, 13.87255859375, 14.779296875, 15.68603515625, 16.5927734375, 17.49951171875, 18.40625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 11.0, 10.0, 16.0, 44.0, 84.0, 193.0, 670.0, 2019.0, 714.0, 186.0, 67.0, 31.0, 17.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.31640625, -6.183441162109375, -6.05047607421875, -5.917510986328125, -5.7845458984375, -5.651580810546875, -5.51861572265625, -5.385650634765625, -5.252685546875, -5.119720458984375, -4.98675537109375, -4.853790283203125, -4.7208251953125, -4.587860107421875, -4.45489501953125, -4.321929931640625, -4.18896484375, -4.055999755859375, -3.92303466796875, -3.790069580078125, -3.6571044921875, -3.524139404296875, -3.39117431640625, -3.258209228515625, -3.125244140625, -2.992279052734375, -2.85931396484375, -2.726348876953125, -2.5933837890625, -2.460418701171875, -2.32745361328125, -2.194488525390625, -2.0615234375, -1.928558349609375, -1.79559326171875, -1.662628173828125, -1.5296630859375, -1.396697998046875, -1.26373291015625, -1.130767822265625, -0.997802734375, -0.864837646484375, -0.73187255859375, -0.598907470703125, -0.4659423828125, -0.332977294921875, -0.20001220703125, -0.067047119140625, 0.06591796875, 0.198883056640625, 0.33184814453125, 0.464813232421875, 0.5977783203125, 0.730743408203125, 0.86370849609375, 0.996673583984375, 1.129638671875, 1.262603759765625, 1.39556884765625, 1.528533935546875, 1.6614990234375, 1.794464111328125, 1.92742919921875, 2.060394287109375, 2.193359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 10.0, 12.0, 59.0, 217.0, 379.0, 225.0, 78.0, 12.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.93046569824219, -54.700653076171875, -53.4708366394043, -52.241024017333984, -51.01121139526367, -49.781394958496094, -48.55158233642578, -47.32176971435547, -46.091957092285156, -44.862144470214844, -43.632328033447266, -42.40251541137695, -41.17270278930664, -39.94288635253906, -38.71307373046875, -37.48326110839844, -36.25344467163086, -35.02363204956055, -33.79381561279297, -32.564002990722656, -31.334190368652344, -30.1043758392334, -28.874561309814453, -27.64474868774414, -26.414934158325195, -25.18511962890625, -23.955307006835938, -22.725492477416992, -21.495677947998047, -20.265865325927734, -19.03605079650879, -17.806236267089844, -16.576419830322266, -15.346606254577637, -14.116792678833008, -12.886978149414062, -11.657164573669434, -10.427350997924805, -9.19753646850586, -7.9677228927612305, -6.737909317016602, -5.508095741271973, -4.2782816886901855, -3.0484678745269775, -1.8186540603637695, -0.5888404846191406, 0.6409735679626465, 1.8707876205444336, 3.1006011962890625, 4.330414772033691, 5.5602288246154785, 6.790042877197266, 8.019856452941895, 9.249670028686523, 10.479484558105469, 11.709298133850098, 12.939111709594727, 14.168925285339355, 15.398738861083984, 16.62855339050293, 17.858367919921875, 19.088180541992188, 20.317995071411133, 21.547809600830078, 22.77762222290039]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 12.0, 15.0, 27.0, 37.0, 56.0, 61.0, 88.0, 91.0, 95.0, 94.0, 101.0, 83.0, 64.0, 60.0, 48.0, 26.0, 17.0, 8.0, 13.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1952543258667, -13.685111999511719, -13.174970626831055, -12.664828300476074, -12.154685974121094, -11.644543647766113, -11.134401321411133, -10.624259948730469, -10.114117622375488, -9.603975296020508, -9.093833923339844, -8.583691596984863, -8.073549270629883, -7.563406944274902, -7.05326509475708, -6.543123245239258, -6.032980918884277, -5.522838592529297, -5.012696743011475, -4.502554893493652, -3.992412567138672, -3.4822704792022705, -2.972128391265869, -2.4619863033294678, -1.9518442153930664, -1.441702127456665, -0.9315600395202637, -0.4214179515838623, 0.08872413635253906, 0.5988662242889404, 1.1090083122253418, 1.6191504001617432, 2.129291534423828, 2.6394336223602295, 3.149575710296631, 3.6597177982330322, 4.169859886169434, 4.680002212524414, 5.190144062042236, 5.700285911560059, 6.210428237915039, 6.7205705642700195, 7.230712413787842, 7.740854263305664, 8.250996589660645, 8.761138916015625, 9.271280288696289, 9.78142261505127, 10.29156494140625, 10.80170726776123, 11.311849594116211, 11.821990966796875, 12.332133293151855, 12.842275619506836, 13.3524169921875, 13.86255931854248, 14.372701644897461, 14.882843971252441, 15.392986297607422, 15.903127670288086, 16.41326904296875, 16.923412322998047, 17.43355369567871, 17.943696975708008, 18.453838348388672]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 13.0, 10.0, 24.0, 39.0, 54.0, 89.0, 133.0, 250.0, 456.0, 809.0, 1679.0, 3829.0, 10796.0, 37315.0, 140184.0, 374884.0, 327032.0, 107368.0, 28710.0, 8689.0, 3173.0, 1378.0, 677.0, 394.0, 206.0, 130.0, 71.0, 58.0, 22.0, 24.0, 20.0, 12.0, 11.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-7.8203125, -7.61395263671875, -7.4075927734375, -7.20123291015625, -6.994873046875, -6.78851318359375, -6.5821533203125, -6.37579345703125, -6.16943359375, -5.96307373046875, -5.7567138671875, -5.55035400390625, -5.343994140625, -5.13763427734375, -4.9312744140625, -4.72491455078125, -4.5185546875, -4.31219482421875, -4.1058349609375, -3.89947509765625, -3.693115234375, -3.48675537109375, -3.2803955078125, -3.07403564453125, -2.86767578125, -2.66131591796875, -2.4549560546875, -2.24859619140625, -2.042236328125, -1.83587646484375, -1.6295166015625, -1.42315673828125, -1.216796875, -1.01043701171875, -0.8040771484375, -0.59771728515625, -0.391357421875, -0.18499755859375, 0.0213623046875, 0.22772216796875, 0.43408203125, 0.64044189453125, 0.8468017578125, 1.05316162109375, 1.259521484375, 1.46588134765625, 1.6722412109375, 1.87860107421875, 2.0849609375, 2.29132080078125, 2.4976806640625, 2.70404052734375, 2.910400390625, 3.11676025390625, 3.3231201171875, 3.52947998046875, 3.73583984375, 3.94219970703125, 4.1485595703125, 4.35491943359375, 4.561279296875, 4.76763916015625, 4.9739990234375, 5.18035888671875, 5.38671875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 3.0, 8.0, 12.0, 12.0, 21.0, 37.0, 42.0, 43.0, 46.0, 66.0, 62.0, 81.0, 70.0, 83.0, 64.0, 66.0, 54.0, 61.0, 42.0, 38.0, 23.0, 17.0, 17.0, 7.0, 5.0, 9.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.53125, -1.4858856201171875, -1.440521240234375, -1.3951568603515625, -1.34979248046875, -1.3044281005859375, -1.259063720703125, -1.2136993408203125, -1.1683349609375, -1.1229705810546875, -1.077606201171875, -1.0322418212890625, -0.98687744140625, -0.9415130615234375, -0.896148681640625, -0.8507843017578125, -0.805419921875, -0.7600555419921875, -0.714691162109375, -0.6693267822265625, -0.62396240234375, -0.5785980224609375, -0.533233642578125, -0.4878692626953125, -0.4425048828125, -0.3971405029296875, -0.351776123046875, -0.3064117431640625, -0.26104736328125, -0.2156829833984375, -0.170318603515625, -0.1249542236328125, -0.07958984375, -0.0342254638671875, 0.011138916015625, 0.0565032958984375, 0.10186767578125, 0.1472320556640625, 0.192596435546875, 0.2379608154296875, 0.2833251953125, 0.3286895751953125, 0.374053955078125, 0.4194183349609375, 0.46478271484375, 0.5101470947265625, 0.555511474609375, 0.6008758544921875, 0.646240234375, 0.6916046142578125, 0.736968994140625, 0.7823333740234375, 0.82769775390625, 0.8730621337890625, 0.918426513671875, 0.9637908935546875, 1.0091552734375, 1.0545196533203125, 1.099884033203125, 1.1452484130859375, 1.19061279296875, 1.2359771728515625, 1.281341552734375, 1.3267059326171875, 1.3720703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 8.0, 3.0, 5.0, 5.0, 14.0, 19.0, 25.0, 34.0, 40.0, 78.0, 124.0, 218.0, 320.0, 539.0, 1063.0, 2310.0, 6247.0, 19631.0, 79013.0, 300475.0, 427653.0, 156265.0, 37185.0, 10315.0, 3560.0, 1546.0, 796.0, 394.0, 244.0, 155.0, 76.0, 74.0, 43.0, 22.0, 22.0, 9.0, 11.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.390625, -6.18603515625, -5.9814453125, -5.77685546875, -5.572265625, -5.36767578125, -5.1630859375, -4.95849609375, -4.75390625, -4.54931640625, -4.3447265625, -4.14013671875, -3.935546875, -3.73095703125, -3.5263671875, -3.32177734375, -3.1171875, -2.91259765625, -2.7080078125, -2.50341796875, -2.298828125, -2.09423828125, -1.8896484375, -1.68505859375, -1.48046875, -1.27587890625, -1.0712890625, -0.86669921875, -0.662109375, -0.45751953125, -0.2529296875, -0.04833984375, 0.15625, 0.36083984375, 0.5654296875, 0.77001953125, 0.974609375, 1.17919921875, 1.3837890625, 1.58837890625, 1.79296875, 1.99755859375, 2.2021484375, 2.40673828125, 2.611328125, 2.81591796875, 3.0205078125, 3.22509765625, 3.4296875, 3.63427734375, 3.8388671875, 4.04345703125, 4.248046875, 4.45263671875, 4.6572265625, 4.86181640625, 5.06640625, 5.27099609375, 5.4755859375, 5.68017578125, 5.884765625, 6.08935546875, 6.2939453125, 6.49853515625, 6.703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 7.0, 0.0, 14.0, 8.0, 15.0, 14.0, 14.0, 26.0, 20.0, 37.0, 31.0, 34.0, 31.0, 41.0, 38.0, 48.0, 36.0, 42.0, 49.0, 47.0, 48.0, 40.0, 48.0, 39.0, 33.0, 47.0, 30.0, 23.0, 14.0, 17.0, 16.0, 18.0, 14.0, 13.0, 12.0, 7.0, 5.0, 5.0, 4.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.68359375, -4.54010009765625, -4.3966064453125, -4.25311279296875, -4.109619140625, -3.96612548828125, -3.8226318359375, -3.67913818359375, -3.53564453125, -3.39215087890625, -3.2486572265625, -3.10516357421875, -2.961669921875, -2.81817626953125, -2.6746826171875, -2.53118896484375, -2.3876953125, -2.24420166015625, -2.1007080078125, -1.95721435546875, -1.813720703125, -1.67022705078125, -1.5267333984375, -1.38323974609375, -1.23974609375, -1.09625244140625, -0.9527587890625, -0.80926513671875, -0.665771484375, -0.52227783203125, -0.3787841796875, -0.23529052734375, -0.091796875, 0.05169677734375, 0.1951904296875, 0.33868408203125, 0.482177734375, 0.62567138671875, 0.7691650390625, 0.91265869140625, 1.05615234375, 1.19964599609375, 1.3431396484375, 1.48663330078125, 1.630126953125, 1.77362060546875, 1.9171142578125, 2.06060791015625, 2.2041015625, 2.34759521484375, 2.4910888671875, 2.63458251953125, 2.778076171875, 2.92156982421875, 3.0650634765625, 3.20855712890625, 3.35205078125, 3.49554443359375, 3.6390380859375, 3.78253173828125, 3.926025390625, 4.06951904296875, 4.2130126953125, 4.35650634765625, 4.5]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 11.0, 9.0, 19.0, 24.0, 28.0, 38.0, 65.0, 111.0, 183.0, 388.0, 791.0, 1924.0, 5638.0, 23445.0, 172230.0, 647833.0, 164337.0, 22544.0, 5340.0, 1868.0, 779.0, 369.0, 206.0, 108.0, 75.0, 42.0, 37.0, 20.0, 12.0, 12.0, 15.0, 9.0, 6.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.578125, -5.41156005859375, -5.2449951171875, -5.07843017578125, -4.911865234375, -4.74530029296875, -4.5787353515625, -4.41217041015625, -4.24560546875, -4.07904052734375, -3.9124755859375, -3.74591064453125, -3.579345703125, -3.41278076171875, -3.2462158203125, -3.07965087890625, -2.9130859375, -2.74652099609375, -2.5799560546875, -2.41339111328125, -2.246826171875, -2.08026123046875, -1.9136962890625, -1.74713134765625, -1.58056640625, -1.41400146484375, -1.2474365234375, -1.08087158203125, -0.914306640625, -0.74774169921875, -0.5811767578125, -0.41461181640625, -0.248046875, -0.08148193359375, 0.0850830078125, 0.25164794921875, 0.418212890625, 0.58477783203125, 0.7513427734375, 0.91790771484375, 1.08447265625, 1.25103759765625, 1.4176025390625, 1.58416748046875, 1.750732421875, 1.91729736328125, 2.0838623046875, 2.25042724609375, 2.4169921875, 2.58355712890625, 2.7501220703125, 2.91668701171875, 3.083251953125, 3.24981689453125, 3.4163818359375, 3.58294677734375, 3.74951171875, 3.91607666015625, 4.0826416015625, 4.24920654296875, 4.415771484375, 4.58233642578125, 4.7489013671875, 4.91546630859375, 5.08203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 5.0, 7.0, 11.0, 11.0, 15.0, 18.0, 24.0, 28.0, 25.0, 31.0, 45.0, 60.0, 73.0, 89.0, 103.0, 90.0, 63.0, 53.0, 38.0, 39.0, 36.0, 28.0, 24.0, 11.0, 15.0, 10.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0005054473876953125, -0.0004906728863716125, -0.0004758983850479126, -0.00046112388372421265, -0.0004463493824005127, -0.00043157488107681274, -0.0004168003797531128, -0.00040202587842941284, -0.0003872513771057129, -0.00037247687578201294, -0.000357702374458313, -0.00034292787313461304, -0.0003281533718109131, -0.00031337887048721313, -0.0002986043691635132, -0.00028382986783981323, -0.0002690553665161133, -0.00025428086519241333, -0.00023950636386871338, -0.00022473186254501343, -0.00020995736122131348, -0.00019518285989761353, -0.00018040835857391357, -0.00016563385725021362, -0.00015085935592651367, -0.00013608485460281372, -0.00012131035327911377, -0.00010653585195541382, -9.176135063171387e-05, -7.698684930801392e-05, -6.221234798431396e-05, -4.7437846660614014e-05, -3.266334533691406e-05, -1.788884401321411e-05, -3.11434268951416e-06, 1.1660158634185791e-05, 2.6434659957885742e-05, 4.120916128158569e-05, 5.5983662605285645e-05, 7.07581639289856e-05, 8.553266525268555e-05, 0.0001003071665763855, 0.00011508166790008545, 0.0001298561692237854, 0.00014463067054748535, 0.0001594051718711853, 0.00017417967319488525, 0.0001889541745185852, 0.00020372867584228516, 0.0002185031771659851, 0.00023327767848968506, 0.000248052179813385, 0.00026282668113708496, 0.0002776011824607849, 0.00029237568378448486, 0.0003071501851081848, 0.00032192468643188477, 0.0003366991877555847, 0.00035147368907928467, 0.0003662481904029846, 0.00038102269172668457, 0.0003957971930503845, 0.00041057169437408447, 0.0004253461956977844, 0.0004401206970214844]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 4.0, 11.0, 20.0, 22.0, 36.0, 67.0, 95.0, 179.0, 297.0, 597.0, 1319.0, 3322.0, 13132.0, 128591.0, 775383.0, 108106.0, 11648.0, 3198.0, 1216.0, 536.0, 272.0, 186.0, 115.0, 55.0, 41.0, 31.0, 21.0, 15.0, 17.0, 2.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.5164794921875, -8.282958984375, -8.0494384765625, -7.81591796875, -7.5823974609375, -7.348876953125, -7.1153564453125, -6.8818359375, -6.6483154296875, -6.414794921875, -6.1812744140625, -5.94775390625, -5.7142333984375, -5.480712890625, -5.2471923828125, -5.013671875, -4.7801513671875, -4.546630859375, -4.3131103515625, -4.07958984375, -3.8460693359375, -3.612548828125, -3.3790283203125, -3.1455078125, -2.9119873046875, -2.678466796875, -2.4449462890625, -2.21142578125, -1.9779052734375, -1.744384765625, -1.5108642578125, -1.27734375, -1.0438232421875, -0.810302734375, -0.5767822265625, -0.34326171875, -0.1097412109375, 0.123779296875, 0.3572998046875, 0.5908203125, 0.8243408203125, 1.057861328125, 1.2913818359375, 1.52490234375, 1.7584228515625, 1.991943359375, 2.2254638671875, 2.458984375, 2.6925048828125, 2.926025390625, 3.1595458984375, 3.39306640625, 3.6265869140625, 3.860107421875, 4.0936279296875, 4.3271484375, 4.5606689453125, 4.794189453125, 5.0277099609375, 5.26123046875, 5.4947509765625, 5.728271484375, 5.9617919921875, 6.1953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 21.0, 42.0, 85.0, 146.0, 180.0, 196.0, 144.0, 65.0, 37.0, 22.0, 12.0, 10.0, 4.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.2421875, -7.05120849609375, -6.8602294921875, -6.66925048828125, -6.478271484375, -6.28729248046875, -6.0963134765625, -5.90533447265625, -5.71435546875, -5.52337646484375, -5.3323974609375, -5.14141845703125, -4.950439453125, -4.75946044921875, -4.5684814453125, -4.37750244140625, -4.1865234375, -3.99554443359375, -3.8045654296875, -3.61358642578125, -3.422607421875, -3.23162841796875, -3.0406494140625, -2.84967041015625, -2.65869140625, -2.46771240234375, -2.2767333984375, -2.08575439453125, -1.894775390625, -1.70379638671875, -1.5128173828125, -1.32183837890625, -1.130859375, -0.93988037109375, -0.7489013671875, -0.55792236328125, -0.366943359375, -0.17596435546875, 0.0150146484375, 0.20599365234375, 0.39697265625, 0.58795166015625, 0.7789306640625, 0.96990966796875, 1.160888671875, 1.35186767578125, 1.5428466796875, 1.73382568359375, 1.9248046875, 2.11578369140625, 2.3067626953125, 2.49774169921875, 2.688720703125, 2.87969970703125, 3.0706787109375, 3.26165771484375, 3.45263671875, 3.64361572265625, 3.8345947265625, 4.02557373046875, 4.216552734375, 4.40753173828125, 4.5985107421875, 4.78948974609375, 4.98046875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 23.0, 25.0, 44.0, 96.0, 129.0, 180.0, 171.0, 104.0, 90.0, 51.0, 39.0, 16.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.99909210205078, -68.32417297363281, -66.64925384521484, -64.97433471679688, -63.29941940307617, -61.62450408935547, -59.9495849609375, -58.27466583251953, -56.59974670410156, -54.924827575683594, -53.24991226196289, -51.57499313354492, -49.90007400512695, -48.22515869140625, -46.55023956298828, -44.87532043457031, -43.20040512084961, -41.52548599243164, -39.85057067871094, -38.17565155029297, -36.500732421875, -34.82581329345703, -33.15089797973633, -31.47597885131836, -29.801061630249023, -28.126144409179688, -26.45122528076172, -24.776308059692383, -23.101390838623047, -21.426471710205078, -19.751554489135742, -18.076637268066406, -16.401714324951172, -14.72679615020752, -13.051877975463867, -11.376960754394531, -9.702042579650879, -8.027124404907227, -6.352207183837891, -4.677289009094238, -3.002370834350586, -1.3274528980255127, 0.34746503829956055, 2.0223827362060547, 3.697300910949707, 5.372219085693359, 7.047136306762695, 8.722054481506348, 10.39697265625, 12.071890830993652, 13.746809005737305, 15.42172622680664, 17.09664535522461, 18.771562576293945, 20.44647979736328, 22.12139892578125, 23.796316146850586, 25.471233367919922, 27.14615249633789, 28.821069717407227, 30.495986938476562, 32.17090606689453, 33.8458251953125, 35.5207405090332, 37.19565963745117]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 9.0, 3.0, 2.0, 4.0, 9.0, 6.0, 6.0, 15.0, 17.0, 11.0, 25.0, 19.0, 29.0, 27.0, 29.0, 27.0, 43.0, 34.0, 28.0, 33.0, 51.0, 48.0, 48.0, 34.0, 43.0, 51.0, 44.0, 40.0, 25.0, 27.0, 29.0, 25.0, 28.0, 27.0, 15.0, 17.0, 15.0, 9.0, 5.0, 11.0, 8.0, 9.0, 5.0, 4.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.178316116333008, -24.424631118774414, -23.67094612121582, -22.917261123657227, -22.163576126098633, -21.40989112854004, -20.656208038330078, -19.902523040771484, -19.14883804321289, -18.395153045654297, -17.641468048095703, -16.88778305053711, -16.134098052978516, -15.380413055419922, -14.626729011535645, -13.87304401397705, -13.11935806274414, -12.365673065185547, -11.611988067626953, -10.85830307006836, -10.104618072509766, -9.350933074951172, -8.597249031066895, -7.843564033508301, -7.089879035949707, -6.336194038391113, -5.5825090408325195, -4.828824520111084, -4.07513952255249, -3.3214545249938965, -2.567770004272461, -1.8140850067138672, -1.0604019165039062, -0.30671703815460205, 0.44696784019470215, 1.2006525993347168, 1.9543375968933105, 2.7080225944519043, 3.46170711517334, 4.215392112731934, 4.969077110290527, 5.722762107849121, 6.476447105407715, 7.23013162612915, 7.983816623687744, 8.73750114440918, 9.491186141967773, 10.244871139526367, 10.998556137084961, 11.752241134643555, 12.505926132202148, 13.259611129760742, 14.013296127319336, 14.76698112487793, 15.520665168762207, 16.274349212646484, 17.028034210205078, 17.781719207763672, 18.535404205322266, 19.28908920288086, 20.042774200439453, 20.796459197998047, 21.55014419555664, 22.303829193115234, 23.057514190673828]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 13.0, 19.0, 21.0, 39.0, 61.0, 74.0, 145.0, 186.0, 404.0, 619.0, 1265.0, 2908.0, 7725.0, 27402.0, 177429.0, 3560322.0, 358058.0, 40729.0, 10222.0, 3595.0, 1482.0, 698.0, 332.0, 221.0, 111.0, 57.0, 38.0, 21.0, 18.0, 14.0, 9.0, 7.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.5703125, -12.2530517578125, -11.935791015625, -11.6185302734375, -11.30126953125, -10.9840087890625, -10.666748046875, -10.3494873046875, -10.0322265625, -9.7149658203125, -9.397705078125, -9.0804443359375, -8.76318359375, -8.4459228515625, -8.128662109375, -7.8114013671875, -7.494140625, -7.1768798828125, -6.859619140625, -6.5423583984375, -6.22509765625, -5.9078369140625, -5.590576171875, -5.2733154296875, -4.9560546875, -4.6387939453125, -4.321533203125, -4.0042724609375, -3.68701171875, -3.3697509765625, -3.052490234375, -2.7352294921875, -2.41796875, -2.1007080078125, -1.783447265625, -1.4661865234375, -1.14892578125, -0.8316650390625, -0.514404296875, -0.1971435546875, 0.1201171875, 0.4373779296875, 0.754638671875, 1.0718994140625, 1.38916015625, 1.7064208984375, 2.023681640625, 2.3409423828125, 2.658203125, 2.9754638671875, 3.292724609375, 3.6099853515625, 3.92724609375, 4.2445068359375, 4.561767578125, 4.8790283203125, 5.1962890625, 5.5135498046875, 5.830810546875, 6.1480712890625, 6.46533203125, 6.7825927734375, 7.099853515625, 7.4171142578125, 7.734375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 7.0, 8.0, 9.0, 14.0, 18.0, 23.0, 30.0, 31.0, 45.0, 46.0, 77.0, 78.0, 72.0, 73.0, 86.0, 71.0, 67.0, 63.0, 44.0, 44.0, 31.0, 9.0, 21.0, 12.0, 7.0, 9.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.541015625, -1.4920501708984375, -1.443084716796875, -1.3941192626953125, -1.34515380859375, -1.2961883544921875, -1.247222900390625, -1.1982574462890625, -1.1492919921875, -1.1003265380859375, -1.051361083984375, -1.0023956298828125, -0.95343017578125, -0.9044647216796875, -0.855499267578125, -0.8065338134765625, -0.757568359375, -0.7086029052734375, -0.659637451171875, -0.6106719970703125, -0.56170654296875, -0.5127410888671875, -0.463775634765625, -0.4148101806640625, -0.3658447265625, -0.3168792724609375, -0.267913818359375, -0.2189483642578125, -0.16998291015625, -0.1210174560546875, -0.072052001953125, -0.0230865478515625, 0.02587890625, 0.0748443603515625, 0.123809814453125, 0.1727752685546875, 0.22174072265625, 0.2707061767578125, 0.319671630859375, 0.3686370849609375, 0.4176025390625, 0.4665679931640625, 0.515533447265625, 0.5644989013671875, 0.61346435546875, 0.6624298095703125, 0.711395263671875, 0.7603607177734375, 0.809326171875, 0.8582916259765625, 0.907257080078125, 0.9562225341796875, 1.00518798828125, 1.0541534423828125, 1.103118896484375, 1.1520843505859375, 1.2010498046875, 1.2500152587890625, 1.298980712890625, 1.3479461669921875, 1.39691162109375, 1.4458770751953125, 1.494842529296875, 1.5438079833984375, 1.5927734375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 19.0, 40.0, 70.0, 93.0, 220.0, 487.0, 10194.0, 4179131.0, 3088.0, 410.0, 207.0, 135.0, 96.0, 42.0, 23.0, 14.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.3125, -35.6494140625, -32.986328125, -30.3232421875, -27.66015625, -24.9970703125, -22.333984375, -19.6708984375, -17.0078125, -14.3447265625, -11.681640625, -9.0185546875, -6.35546875, -3.6923828125, -1.029296875, 1.6337890625, 4.296875, 6.9599609375, 9.623046875, 12.2861328125, 14.94921875, 17.6123046875, 20.275390625, 22.9384765625, 25.6015625, 28.2646484375, 30.927734375, 33.5908203125, 36.25390625, 38.9169921875, 41.580078125, 44.2431640625, 46.90625, 49.5693359375, 52.232421875, 54.8955078125, 57.55859375, 60.2216796875, 62.884765625, 65.5478515625, 68.2109375, 70.8740234375, 73.537109375, 76.2001953125, 78.86328125, 81.5263671875, 84.189453125, 86.8525390625, 89.515625, 92.1787109375, 94.841796875, 97.5048828125, 100.16796875, 102.8310546875, 105.494140625, 108.1572265625, 110.8203125, 113.4833984375, 116.146484375, 118.8095703125, 121.47265625, 124.1357421875, 126.798828125, 129.4619140625, 132.125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 7.0, 7.0, 29.0, 97.0, 1101.0, 2603.0, 198.0, 29.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.0546875, -8.5823974609375, -8.110107421875, -7.6378173828125, -7.16552734375, -6.6932373046875, -6.220947265625, -5.7486572265625, -5.2763671875, -4.8040771484375, -4.331787109375, -3.8594970703125, -3.38720703125, -2.9149169921875, -2.442626953125, -1.9703369140625, -1.498046875, -1.0257568359375, -0.553466796875, -0.0811767578125, 0.39111328125, 0.8634033203125, 1.335693359375, 1.8079833984375, 2.2802734375, 2.7525634765625, 3.224853515625, 3.6971435546875, 4.16943359375, 4.6417236328125, 5.114013671875, 5.5863037109375, 6.05859375, 6.5308837890625, 7.003173828125, 7.4754638671875, 7.94775390625, 8.4200439453125, 8.892333984375, 9.3646240234375, 9.8369140625, 10.3092041015625, 10.781494140625, 11.2537841796875, 11.72607421875, 12.1983642578125, 12.670654296875, 13.1429443359375, 13.615234375, 14.0875244140625, 14.559814453125, 15.0321044921875, 15.50439453125, 15.9766845703125, 16.448974609375, 16.9212646484375, 17.3935546875, 17.8658447265625, 18.338134765625, 18.8104248046875, 19.28271484375, 19.7550048828125, 20.227294921875, 20.6995849609375, 21.171875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 11.0, 18.0, 132.0, 429.0, 294.0, 87.0, 15.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-148.68505859375, -145.81625366210938, -142.9474639892578, -140.0786590576172, -137.20986938476562, -134.341064453125, -131.47225952148438, -128.6034698486328, -125.73467254638672, -122.86587524414062, -119.99707794189453, -117.12828063964844, -114.25947570800781, -111.39067840576172, -108.52188110351562, -105.65308380126953, -102.78428649902344, -99.91548919677734, -97.04669189453125, -94.17788696289062, -91.30908966064453, -88.44029235839844, -85.57149505615234, -82.70269775390625, -79.83389282226562, -76.96509552001953, -74.09629821777344, -71.22749328613281, -68.35869598388672, -65.48989868164062, -62.62110137939453, -59.75230407714844, -56.88351058959961, -54.014713287353516, -51.145912170410156, -48.27711486816406, -45.40831756591797, -42.539520263671875, -39.670719146728516, -36.80192184448242, -33.93312072753906, -31.064321517944336, -28.195524215698242, -25.326725006103516, -22.457927703857422, -19.589128494262695, -16.72032928466797, -13.851531982421875, -10.982734680175781, -8.113936424255371, -5.245137691497803, -2.3763389587402344, 0.4924592971801758, 3.361257553100586, 6.2300567626953125, 9.098854064941406, 11.967653274536133, 14.836451530456543, 17.705249786376953, 20.57404899597168, 23.442848205566406, 26.3116455078125, 29.180444717407227, 32.04924011230469, 34.91804122924805]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 10.0, 16.0, 19.0, 30.0, 37.0, 53.0, 68.0, 87.0, 86.0, 96.0, 110.0, 87.0, 60.0, 67.0, 57.0, 28.0, 25.0, 21.0, 11.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.165000915527344, -30.171253204345703, -29.177507400512695, -28.183759689331055, -27.190011978149414, -26.196266174316406, -25.202518463134766, -24.208770751953125, -23.215024948120117, -22.221277236938477, -21.22753143310547, -20.233783721923828, -19.240036010742188, -18.24629020690918, -17.25254249572754, -16.25879669189453, -15.265048027038574, -14.27130126953125, -13.27755355834961, -12.283806800842285, -11.290060043334961, -10.29631233215332, -9.302565574645996, -8.308818817138672, -7.3150715827941895, -6.321324348449707, -5.327577590942383, -4.3338303565979, -3.340083360671997, -2.3463363647460938, -1.3525891304016113, -0.3588423728942871, 0.6349048614501953, 1.6286518573760986, 2.622398853302002, 3.6161460876464844, 4.609892845153809, 5.603640079498291, 6.597387313842773, 7.591134071350098, 8.584880828857422, 9.578627586364746, 10.572375297546387, 11.566122055053711, 12.559868812561035, 13.55361557006836, 14.54736328125, 15.541110038757324, 16.53485870361328, 17.528606414794922, 18.52235221862793, 19.51609992980957, 20.50984764099121, 21.50359344482422, 22.49734115600586, 23.4910888671875, 24.484834671020508, 25.47858238220215, 26.472328186035156, 27.466075897216797, 28.459823608398438, 29.453569412231445, 30.447317123413086, 31.441062927246094, 32.434810638427734]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 3.0, 12.0, 9.0, 13.0, 29.0, 41.0, 58.0, 103.0, 134.0, 205.0, 275.0, 414.0, 582.0, 887.0, 1459.0, 2502.0, 4868.0, 10568.0, 26440.0, 70312.0, 191053.0, 364098.0, 230750.0, 86231.0, 31741.0, 12661.0, 5664.0, 2857.0, 1560.0, 990.0, 630.0, 449.0, 285.0, 206.0, 144.0, 110.0, 61.0, 40.0, 31.0, 27.0, 13.0, 9.0, 10.0, 7.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.46484375, -6.26654052734375, -6.0682373046875, -5.86993408203125, -5.671630859375, -5.47332763671875, -5.2750244140625, -5.07672119140625, -4.87841796875, -4.68011474609375, -4.4818115234375, -4.28350830078125, -4.085205078125, -3.88690185546875, -3.6885986328125, -3.49029541015625, -3.2919921875, -3.09368896484375, -2.8953857421875, -2.69708251953125, -2.498779296875, -2.30047607421875, -2.1021728515625, -1.90386962890625, -1.70556640625, -1.50726318359375, -1.3089599609375, -1.11065673828125, -0.912353515625, -0.71405029296875, -0.5157470703125, -0.31744384765625, -0.119140625, 0.07916259765625, 0.2774658203125, 0.47576904296875, 0.674072265625, 0.87237548828125, 1.0706787109375, 1.26898193359375, 1.46728515625, 1.66558837890625, 1.8638916015625, 2.06219482421875, 2.260498046875, 2.45880126953125, 2.6571044921875, 2.85540771484375, 3.0537109375, 3.25201416015625, 3.4503173828125, 3.64862060546875, 3.846923828125, 4.04522705078125, 4.2435302734375, 4.44183349609375, 4.64013671875, 4.83843994140625, 5.0367431640625, 5.23504638671875, 5.433349609375, 5.63165283203125, 5.8299560546875, 6.02825927734375, 6.2265625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 8.0, 10.0, 7.0, 20.0, 23.0, 41.0, 27.0, 50.0, 46.0, 50.0, 68.0, 78.0, 61.0, 64.0, 66.0, 63.0, 59.0, 49.0, 44.0, 41.0, 38.0, 20.0, 15.0, 8.0, 14.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.751953125, -1.70025634765625, -1.6485595703125, -1.59686279296875, -1.545166015625, -1.49346923828125, -1.4417724609375, -1.39007568359375, -1.33837890625, -1.28668212890625, -1.2349853515625, -1.18328857421875, -1.131591796875, -1.07989501953125, -1.0281982421875, -0.97650146484375, -0.9248046875, -0.87310791015625, -0.8214111328125, -0.76971435546875, -0.718017578125, -0.66632080078125, -0.6146240234375, -0.56292724609375, -0.51123046875, -0.45953369140625, -0.4078369140625, -0.35614013671875, -0.304443359375, -0.25274658203125, -0.2010498046875, -0.14935302734375, -0.09765625, -0.04595947265625, 0.0057373046875, 0.05743408203125, 0.109130859375, 0.16082763671875, 0.2125244140625, 0.26422119140625, 0.31591796875, 0.36761474609375, 0.4193115234375, 0.47100830078125, 0.522705078125, 0.57440185546875, 0.6260986328125, 0.67779541015625, 0.7294921875, 0.78118896484375, 0.8328857421875, 0.88458251953125, 0.936279296875, 0.98797607421875, 1.0396728515625, 1.09136962890625, 1.14306640625, 1.19476318359375, 1.2464599609375, 1.29815673828125, 1.349853515625, 1.40155029296875, 1.4532470703125, 1.50494384765625, 1.556640625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 3.0, 12.0, 10.0, 25.0, 34.0, 54.0, 66.0, 115.0, 150.0, 248.0, 473.0, 839.0, 1840.0, 4313.0, 11413.0, 35377.0, 118909.0, 330556.0, 351283.0, 131796.0, 39559.0, 12685.0, 4646.0, 1924.0, 938.0, 496.0, 266.0, 160.0, 114.0, 91.0, 45.0, 22.0, 19.0, 14.0, 12.0, 8.0, 10.0, 5.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.1015625, -4.9317626953125, -4.761962890625, -4.5921630859375, -4.42236328125, -4.2525634765625, -4.082763671875, -3.9129638671875, -3.7431640625, -3.5733642578125, -3.403564453125, -3.2337646484375, -3.06396484375, -2.8941650390625, -2.724365234375, -2.5545654296875, -2.384765625, -2.2149658203125, -2.045166015625, -1.8753662109375, -1.70556640625, -1.5357666015625, -1.365966796875, -1.1961669921875, -1.0263671875, -0.8565673828125, -0.686767578125, -0.5169677734375, -0.34716796875, -0.1773681640625, -0.007568359375, 0.1622314453125, 0.33203125, 0.5018310546875, 0.671630859375, 0.8414306640625, 1.01123046875, 1.1810302734375, 1.350830078125, 1.5206298828125, 1.6904296875, 1.8602294921875, 2.030029296875, 2.1998291015625, 2.36962890625, 2.5394287109375, 2.709228515625, 2.8790283203125, 3.048828125, 3.2186279296875, 3.388427734375, 3.5582275390625, 3.72802734375, 3.8978271484375, 4.067626953125, 4.2374267578125, 4.4072265625, 4.5770263671875, 4.746826171875, 4.9166259765625, 5.08642578125, 5.2562255859375, 5.426025390625, 5.5958251953125, 5.765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 12.0, 9.0, 14.0, 11.0, 10.0, 13.0, 20.0, 26.0, 20.0, 24.0, 42.0, 50.0, 54.0, 46.0, 62.0, 51.0, 42.0, 52.0, 58.0, 50.0, 46.0, 33.0, 39.0, 39.0, 31.0, 23.0, 30.0, 17.0, 17.0, 15.0, 11.0, 9.0, 10.0, 4.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.0625, -5.89349365234375, -5.7244873046875, -5.55548095703125, -5.386474609375, -5.21746826171875, -5.0484619140625, -4.87945556640625, -4.71044921875, -4.54144287109375, -4.3724365234375, -4.20343017578125, -4.034423828125, -3.86541748046875, -3.6964111328125, -3.52740478515625, -3.3583984375, -3.18939208984375, -3.0203857421875, -2.85137939453125, -2.682373046875, -2.51336669921875, -2.3443603515625, -2.17535400390625, -2.00634765625, -1.83734130859375, -1.6683349609375, -1.49932861328125, -1.330322265625, -1.16131591796875, -0.9923095703125, -0.82330322265625, -0.654296875, -0.48529052734375, -0.3162841796875, -0.14727783203125, 0.021728515625, 0.19073486328125, 0.3597412109375, 0.52874755859375, 0.69775390625, 0.86676025390625, 1.0357666015625, 1.20477294921875, 1.373779296875, 1.54278564453125, 1.7117919921875, 1.88079833984375, 2.0498046875, 2.21881103515625, 2.3878173828125, 2.55682373046875, 2.725830078125, 2.89483642578125, 3.0638427734375, 3.23284912109375, 3.40185546875, 3.57086181640625, 3.7398681640625, 3.90887451171875, 4.077880859375, 4.24688720703125, 4.4158935546875, 4.58489990234375, 4.75390625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 6.0, 9.0, 8.0, 16.0, 14.0, 9.0, 19.0, 42.0, 60.0, 90.0, 165.0, 248.0, 529.0, 1029.0, 2082.0, 5158.0, 22039.0, 294473.0, 658785.0, 49746.0, 8250.0, 2963.0, 1276.0, 659.0, 338.0, 203.0, 105.0, 61.0, 41.0, 24.0, 24.0, 20.0, 7.0, 8.0, 5.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.27734375, -7.04400634765625, -6.8106689453125, -6.57733154296875, -6.343994140625, -6.11065673828125, -5.8773193359375, -5.64398193359375, -5.41064453125, -5.17730712890625, -4.9439697265625, -4.71063232421875, -4.477294921875, -4.24395751953125, -4.0106201171875, -3.77728271484375, -3.5439453125, -3.31060791015625, -3.0772705078125, -2.84393310546875, -2.610595703125, -2.37725830078125, -2.1439208984375, -1.91058349609375, -1.67724609375, -1.44390869140625, -1.2105712890625, -0.97723388671875, -0.743896484375, -0.51055908203125, -0.2772216796875, -0.04388427734375, 0.189453125, 0.42279052734375, 0.6561279296875, 0.88946533203125, 1.122802734375, 1.35614013671875, 1.5894775390625, 1.82281494140625, 2.05615234375, 2.28948974609375, 2.5228271484375, 2.75616455078125, 2.989501953125, 3.22283935546875, 3.4561767578125, 3.68951416015625, 3.9228515625, 4.15618896484375, 4.3895263671875, 4.62286376953125, 4.856201171875, 5.08953857421875, 5.3228759765625, 5.55621337890625, 5.78955078125, 6.02288818359375, 6.2562255859375, 6.48956298828125, 6.722900390625, 6.95623779296875, 7.1895751953125, 7.42291259765625, 7.65625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0, 4.0, 7.0, 9.0, 9.0, 9.0, 13.0, 17.0, 29.0, 42.0, 61.0, 96.0, 122.0, 169.0, 119.0, 91.0, 66.0, 34.0, 40.0, 16.0, 19.0, 10.0, 4.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000652313232421875, -0.0006286203861236572, -0.0006049275398254395, -0.0005812346935272217, -0.0005575418472290039, -0.0005338490009307861, -0.0005101561546325684, -0.0004864633083343506, -0.0004627704620361328, -0.00043907761573791504, -0.00041538476943969727, -0.0003916919231414795, -0.0003679990768432617, -0.00034430623054504395, -0.00032061338424682617, -0.0002969205379486084, -0.0002732276916503906, -0.00024953484535217285, -0.00022584199905395508, -0.0002021491527557373, -0.00017845630645751953, -0.00015476346015930176, -0.00013107061386108398, -0.00010737776756286621, -8.368492126464844e-05, -5.9992074966430664e-05, -3.629922866821289e-05, -1.2606382369995117e-05, 1.1086463928222656e-05, 3.477931022644043e-05, 5.84721565246582e-05, 8.216500282287598e-05, 0.00010585784912109375, 0.00012955069541931152, 0.0001532435417175293, 0.00017693638801574707, 0.00020062923431396484, 0.00022432208061218262, 0.0002480149269104004, 0.00027170777320861816, 0.00029540061950683594, 0.0003190934658050537, 0.0003427863121032715, 0.00036647915840148926, 0.00039017200469970703, 0.0004138648509979248, 0.0004375576972961426, 0.00046125054359436035, 0.0004849433898925781, 0.0005086362361907959, 0.0005323290824890137, 0.0005560219287872314, 0.0005797147750854492, 0.000603407621383667, 0.0006271004676818848, 0.0006507933139801025, 0.0006744861602783203, 0.0006981790065765381, 0.0007218718528747559, 0.0007455646991729736, 0.0007692575454711914, 0.0007929503917694092, 0.000816643238067627, 0.0008403360843658447, 0.0008640289306640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 6.0, 12.0, 18.0, 27.0, 32.0, 59.0, 134.0, 223.0, 467.0, 1062.0, 2768.0, 9161.0, 132892.0, 861297.0, 31555.0, 5445.0, 1820.0, 782.0, 349.0, 185.0, 102.0, 64.0, 27.0, 19.0, 12.0, 13.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.754150390625, -9.38330078125, -9.012451171875, -8.6416015625, -8.270751953125, -7.89990234375, -7.529052734375, -7.158203125, -6.787353515625, -6.41650390625, -6.045654296875, -5.6748046875, -5.303955078125, -4.93310546875, -4.562255859375, -4.19140625, -3.820556640625, -3.44970703125, -3.078857421875, -2.7080078125, -2.337158203125, -1.96630859375, -1.595458984375, -1.224609375, -0.853759765625, -0.48291015625, -0.112060546875, 0.2587890625, 0.629638671875, 1.00048828125, 1.371337890625, 1.7421875, 2.113037109375, 2.48388671875, 2.854736328125, 3.2255859375, 3.596435546875, 3.96728515625, 4.338134765625, 4.708984375, 5.079833984375, 5.45068359375, 5.821533203125, 6.1923828125, 6.563232421875, 6.93408203125, 7.304931640625, 7.67578125, 8.046630859375, 8.41748046875, 8.788330078125, 9.1591796875, 9.530029296875, 9.90087890625, 10.271728515625, 10.642578125, 11.013427734375, 11.38427734375, 11.755126953125, 12.1259765625, 12.496826171875, 12.86767578125, 13.238525390625, 13.609375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 8.0, 17.0, 26.0, 66.0, 126.0, 210.0, 210.0, 167.0, 70.0, 47.0, 12.0, 9.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.1484375, -7.922607421875, -7.69677734375, -7.470947265625, -7.2451171875, -7.019287109375, -6.79345703125, -6.567626953125, -6.341796875, -6.115966796875, -5.89013671875, -5.664306640625, -5.4384765625, -5.212646484375, -4.98681640625, -4.760986328125, -4.53515625, -4.309326171875, -4.08349609375, -3.857666015625, -3.6318359375, -3.406005859375, -3.18017578125, -2.954345703125, -2.728515625, -2.502685546875, -2.27685546875, -2.051025390625, -1.8251953125, -1.599365234375, -1.37353515625, -1.147705078125, -0.921875, -0.696044921875, -0.47021484375, -0.244384765625, -0.0185546875, 0.207275390625, 0.43310546875, 0.658935546875, 0.884765625, 1.110595703125, 1.33642578125, 1.562255859375, 1.7880859375, 2.013916015625, 2.23974609375, 2.465576171875, 2.69140625, 2.917236328125, 3.14306640625, 3.368896484375, 3.5947265625, 3.820556640625, 4.04638671875, 4.272216796875, 4.498046875, 4.723876953125, 4.94970703125, 5.175537109375, 5.4013671875, 5.627197265625, 5.85302734375, 6.078857421875, 6.3046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 7.0, 16.0, 25.0, 55.0, 170.0, 243.0, 226.0, 162.0, 52.0, 29.0, 11.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-106.92169952392578, -104.16947937011719, -101.4172592163086, -98.6650390625, -95.9128189086914, -93.16059875488281, -90.40837097167969, -87.6561508178711, -84.9039306640625, -82.1517105102539, -79.39949035644531, -76.64727020263672, -73.89505004882812, -71.142822265625, -68.39060974121094, -65.63838195800781, -62.886165618896484, -60.13394546508789, -57.3817253112793, -54.62950134277344, -51.877281188964844, -49.12506103515625, -46.372840881347656, -43.62062072753906, -40.86840057373047, -38.116180419921875, -35.36396026611328, -32.61174011230469, -29.859516143798828, -27.107295989990234, -24.35507583618164, -21.602853775024414, -18.850631713867188, -16.098411560058594, -13.346189498901367, -10.593969345092773, -7.841748237609863, -5.089527130126953, -2.3373069763183594, 0.4149150848388672, 3.167135238647461, 5.919356346130371, 8.671577453613281, 11.423797607421875, 14.176018714904785, 16.928239822387695, 19.68045997619629, 22.432682037353516, 25.18490219116211, 27.937122344970703, 30.68934440612793, 33.441566467285156, 36.19378662109375, 38.946006774902344, 41.69822692871094, 44.45044708251953, 47.202667236328125, 49.95488739013672, 52.70710754394531, 55.459327697753906, 58.211551666259766, 60.96377182006836, 63.71599197387695, 66.46821594238281, 69.2204360961914]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 0.0, 2.0, 1.0, 7.0, 9.0, 11.0, 8.0, 13.0, 15.0, 18.0, 23.0, 33.0, 29.0, 45.0, 41.0, 49.0, 44.0, 45.0, 40.0, 62.0, 65.0, 45.0, 49.0, 50.0, 48.0, 45.0, 33.0, 25.0, 34.0, 23.0, 19.0, 17.0, 15.0, 12.0, 6.0, 7.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.707359313964844, -33.5610466003418, -32.41473388671875, -31.26841926574707, -30.12210464477539, -28.975791931152344, -27.829479217529297, -26.68316650390625, -25.53685188293457, -24.390539169311523, -23.244224548339844, -22.097911834716797, -20.95159912109375, -19.80528450012207, -18.658971786499023, -17.512657165527344, -16.366344451904297, -15.220030784606934, -14.07371711730957, -12.927404403686523, -11.78109073638916, -10.634777069091797, -9.48846435546875, -8.342150688171387, -7.195837020874023, -6.04952335357666, -4.903210163116455, -3.756896734237671, -2.6105833053588867, -1.4642696380615234, -0.31795644760131836, 0.8283567428588867, 1.97467041015625, 3.120983839035034, 4.267297267913818, 5.413610458374023, 6.559924125671387, 7.70623779296875, 8.852550506591797, 9.99886417388916, 11.145177841186523, 12.291491508483887, 13.43780517578125, 14.584117889404297, 15.73043155670166, 16.876745223999023, 18.02305793762207, 19.16937255859375, 20.315685272216797, 21.461997985839844, 22.608312606811523, 23.75462532043457, 24.90093994140625, 26.047252655029297, 27.193565368652344, 28.33987808227539, 29.48619270324707, 30.632505416870117, 31.778820037841797, 32.925132751464844, 34.07144546508789, 35.21775817871094, 36.36407470703125, 37.5103874206543, 38.656700134277344]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 7.0, 9.0, 15.0, 8.0, 11.0, 17.0, 30.0, 42.0, 49.0, 78.0, 105.0, 161.0, 259.0, 431.0, 838.0, 1671.0, 4081.0, 11278.0, 48358.0, 1170546.0, 2872714.0, 61727.0, 13463.0, 4577.0, 1793.0, 896.0, 434.0, 269.0, 145.0, 88.0, 70.0, 29.0, 21.0, 21.0, 9.0, 11.0, 10.0, 1.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8515625, -11.5135498046875, -11.175537109375, -10.8375244140625, -10.49951171875, -10.1614990234375, -9.823486328125, -9.4854736328125, -9.1474609375, -8.8094482421875, -8.471435546875, -8.1334228515625, -7.79541015625, -7.4573974609375, -7.119384765625, -6.7813720703125, -6.443359375, -6.1053466796875, -5.767333984375, -5.4293212890625, -5.09130859375, -4.7532958984375, -4.415283203125, -4.0772705078125, -3.7392578125, -3.4012451171875, -3.063232421875, -2.7252197265625, -2.38720703125, -2.0491943359375, -1.711181640625, -1.3731689453125, -1.03515625, -0.6971435546875, -0.359130859375, -0.0211181640625, 0.31689453125, 0.6549072265625, 0.992919921875, 1.3309326171875, 1.6689453125, 2.0069580078125, 2.344970703125, 2.6829833984375, 3.02099609375, 3.3590087890625, 3.697021484375, 4.0350341796875, 4.373046875, 4.7110595703125, 5.049072265625, 5.3870849609375, 5.72509765625, 6.0631103515625, 6.401123046875, 6.7391357421875, 7.0771484375, 7.4151611328125, 7.753173828125, 8.0911865234375, 8.42919921875, 8.7672119140625, 9.105224609375, 9.4432373046875, 9.78125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 12.0, 12.0, 14.0, 22.0, 18.0, 26.0, 29.0, 38.0, 48.0, 42.0, 79.0, 66.0, 80.0, 74.0, 55.0, 63.0, 57.0, 52.0, 45.0, 43.0, 30.0, 20.0, 19.0, 17.0, 10.0, 7.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.939453125, -1.885650634765625, -1.83184814453125, -1.778045654296875, -1.7242431640625, -1.670440673828125, -1.61663818359375, -1.562835693359375, -1.509033203125, -1.455230712890625, -1.40142822265625, -1.347625732421875, -1.2938232421875, -1.240020751953125, -1.18621826171875, -1.132415771484375, -1.07861328125, -1.024810791015625, -0.97100830078125, -0.917205810546875, -0.8634033203125, -0.809600830078125, -0.75579833984375, -0.701995849609375, -0.648193359375, -0.594390869140625, -0.54058837890625, -0.486785888671875, -0.4329833984375, -0.379180908203125, -0.32537841796875, -0.271575927734375, -0.2177734375, -0.163970947265625, -0.11016845703125, -0.056365966796875, -0.0025634765625, 0.051239013671875, 0.10504150390625, 0.158843994140625, 0.212646484375, 0.266448974609375, 0.32025146484375, 0.374053955078125, 0.4278564453125, 0.481658935546875, 0.53546142578125, 0.589263916015625, 0.64306640625, 0.696868896484375, 0.75067138671875, 0.804473876953125, 0.8582763671875, 0.912078857421875, 0.96588134765625, 1.019683837890625, 1.073486328125, 1.127288818359375, 1.18109130859375, 1.234893798828125, 1.2886962890625, 1.342498779296875, 1.39630126953125, 1.450103759765625, 1.50390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 9.0, 7.0, 22.0, 39.0, 59.0, 81.0, 177.0, 638.0, 3425033.0, 767177.0, 598.0, 169.0, 105.0, 69.0, 40.0, 27.0, 13.0, 11.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.921875, -27.923095703125, -25.92431640625, -23.925537109375, -21.9267578125, -19.927978515625, -17.92919921875, -15.930419921875, -13.931640625, -11.932861328125, -9.93408203125, -7.935302734375, -5.9365234375, -3.937744140625, -1.93896484375, 0.059814453125, 2.05859375, 4.057373046875, 6.05615234375, 8.054931640625, 10.0537109375, 12.052490234375, 14.05126953125, 16.050048828125, 18.048828125, 20.047607421875, 22.04638671875, 24.045166015625, 26.0439453125, 28.042724609375, 30.04150390625, 32.040283203125, 34.0390625, 36.037841796875, 38.03662109375, 40.035400390625, 42.0341796875, 44.032958984375, 46.03173828125, 48.030517578125, 50.029296875, 52.028076171875, 54.02685546875, 56.025634765625, 58.0244140625, 60.023193359375, 62.02197265625, 64.020751953125, 66.01953125, 68.018310546875, 70.01708984375, 72.015869140625, 74.0146484375, 76.013427734375, 78.01220703125, 80.010986328125, 82.009765625, 84.008544921875, 86.00732421875, 88.006103515625, 90.0048828125, 92.003662109375, 94.00244140625, 96.001220703125, 98.0]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 10.0, 28.0, 71.0, 395.0, 3010.0, 468.0, 68.0, 24.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.412109375, -3.087799072265625, -2.76348876953125, -2.439178466796875, -2.1148681640625, -1.790557861328125, -1.46624755859375, -1.141937255859375, -0.817626953125, -0.493316650390625, -0.16900634765625, 0.155303955078125, 0.4796142578125, 0.803924560546875, 1.12823486328125, 1.452545166015625, 1.77685546875, 2.101165771484375, 2.42547607421875, 2.749786376953125, 3.0740966796875, 3.398406982421875, 3.72271728515625, 4.047027587890625, 4.371337890625, 4.695648193359375, 5.01995849609375, 5.344268798828125, 5.6685791015625, 5.992889404296875, 6.31719970703125, 6.641510009765625, 6.9658203125, 7.290130615234375, 7.61444091796875, 7.938751220703125, 8.2630615234375, 8.587371826171875, 8.91168212890625, 9.235992431640625, 9.560302734375, 9.884613037109375, 10.20892333984375, 10.533233642578125, 10.8575439453125, 11.181854248046875, 11.50616455078125, 11.830474853515625, 12.15478515625, 12.479095458984375, 12.80340576171875, 13.127716064453125, 13.4520263671875, 13.776336669921875, 14.10064697265625, 14.424957275390625, 14.749267578125, 15.073577880859375, 15.39788818359375, 15.722198486328125, 16.0465087890625, 16.370819091796875, 16.69512939453125, 17.019439697265625, 17.34375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 14.0, 53.0, 131.0, 245.0, 283.0, 150.0, 57.0, 33.0, 15.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.94773864746094, -54.585166931152344, -53.222591400146484, -51.86001968383789, -50.4974479675293, -49.1348762512207, -47.772300720214844, -46.40972900390625, -45.047157287597656, -43.68458557128906, -42.3220100402832, -40.95943832397461, -39.596866607666016, -38.23429489135742, -36.87171936035156, -35.50914764404297, -34.146575927734375, -32.78400421142578, -31.421430587768555, -30.058856964111328, -28.696285247802734, -27.333711624145508, -25.97113800048828, -24.608566284179688, -23.245990753173828, -21.8834171295166, -20.520845413208008, -19.15827178955078, -17.795700073242188, -16.43312644958496, -15.07055377960205, -13.70798110961914, -12.345407485961914, -10.982834815979004, -9.620262145996094, -8.257688522338867, -6.895116329193115, -5.532543659210205, -4.169970512390137, -2.8073978424072266, -1.4448251724243164, -0.0822523832321167, 1.280320405960083, 2.6428933143615723, 4.005465984344482, 5.368038654327393, 6.730611801147461, 8.093184471130371, 9.455757141113281, 10.818329811096191, 12.180902481079102, 13.543476104736328, 14.906047821044922, 16.26862144470215, 17.631195068359375, 18.99376678466797, 20.356338500976562, 21.71891212463379, 23.081483840942383, 24.44405746459961, 25.806629180908203, 27.16920280456543, 28.531776428222656, 29.89434814453125, 31.256921768188477]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 4.0, 13.0, 21.0, 49.0, 56.0, 79.0, 109.0, 132.0, 127.0, 114.0, 91.0, 73.0, 60.0, 37.0, 20.0, 8.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.86408996582031, -33.90414810180664, -32.944210052490234, -31.984268188476562, -31.024328231811523, -30.06438636779785, -29.104446411132812, -28.14450454711914, -27.1845645904541, -26.224624633789062, -25.26468276977539, -24.30474281311035, -23.344802856445312, -22.38486099243164, -21.4249210357666, -20.464981079101562, -19.50503921508789, -18.54509925842285, -17.58515739440918, -16.62521743774414, -15.665276527404785, -14.70533561706543, -13.74539566040039, -12.785454750061035, -11.825515747070312, -10.865574836730957, -9.905634880065918, -8.945693969726562, -7.985753059387207, -7.02581262588501, -6.0658721923828125, -5.105931282043457, -4.145990371704102, -3.186049699783325, -2.226109027862549, -1.2661685943603516, -0.3062279224395752, 0.6537127494812012, 1.6136531829833984, 2.573594093322754, 3.533534526824951, 4.493474960327148, 5.453415870666504, 6.413356304168701, 7.373296737670898, 8.333237648010254, 9.29317855834961, 10.253118515014648, 11.213059425354004, 12.17300033569336, 13.132940292358398, 14.092881202697754, 15.05282211303711, 16.01276206970215, 16.972702026367188, 17.93264389038086, 18.8925838470459, 19.852523803710938, 20.81246566772461, 21.77240562438965, 22.732345581054688, 23.69228744506836, 24.6522274017334, 25.612167358398438, 26.57210922241211]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 12.0, 14.0, 21.0, 41.0, 53.0, 87.0, 155.0, 247.0, 408.0, 748.0, 1358.0, 2781.0, 6685.0, 20038.0, 72567.0, 291754.0, 457892.0, 139321.0, 35310.0, 10737.0, 4079.0, 1857.0, 1001.0, 544.0, 287.0, 197.0, 124.0, 80.0, 50.0, 34.0, 20.0, 15.0, 8.0, 11.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.7109375, -11.3785400390625, -11.046142578125, -10.7137451171875, -10.38134765625, -10.0489501953125, -9.716552734375, -9.3841552734375, -9.0517578125, -8.7193603515625, -8.386962890625, -8.0545654296875, -7.72216796875, -7.3897705078125, -7.057373046875, -6.7249755859375, -6.392578125, -6.0601806640625, -5.727783203125, -5.3953857421875, -5.06298828125, -4.7305908203125, -4.398193359375, -4.0657958984375, -3.7333984375, -3.4010009765625, -3.068603515625, -2.7362060546875, -2.40380859375, -2.0714111328125, -1.739013671875, -1.4066162109375, -1.07421875, -0.7418212890625, -0.409423828125, -0.0770263671875, 0.25537109375, 0.5877685546875, 0.920166015625, 1.2525634765625, 1.5849609375, 1.9173583984375, 2.249755859375, 2.5821533203125, 2.91455078125, 3.2469482421875, 3.579345703125, 3.9117431640625, 4.244140625, 4.5765380859375, 4.908935546875, 5.2413330078125, 5.57373046875, 5.9061279296875, 6.238525390625, 6.5709228515625, 6.9033203125, 7.2357177734375, 7.568115234375, 7.9005126953125, 8.23291015625, 8.5653076171875, 8.897705078125, 9.2301025390625, 9.5625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 2.0, 9.0, 14.0, 16.0, 14.0, 37.0, 30.0, 33.0, 43.0, 55.0, 67.0, 64.0, 81.0, 61.0, 76.0, 79.0, 58.0, 47.0, 41.0, 40.0, 34.0, 24.0, 22.0, 14.0, 8.0, 6.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-2.39453125, -2.331817626953125, -2.26910400390625, -2.206390380859375, -2.1436767578125, -2.080963134765625, -2.01824951171875, -1.955535888671875, -1.892822265625, -1.830108642578125, -1.76739501953125, -1.704681396484375, -1.6419677734375, -1.579254150390625, -1.51654052734375, -1.453826904296875, -1.39111328125, -1.328399658203125, -1.26568603515625, -1.202972412109375, -1.1402587890625, -1.077545166015625, -1.01483154296875, -0.952117919921875, -0.889404296875, -0.826690673828125, -0.76397705078125, -0.701263427734375, -0.6385498046875, -0.575836181640625, -0.51312255859375, -0.450408935546875, -0.3876953125, -0.324981689453125, -0.26226806640625, -0.199554443359375, -0.1368408203125, -0.074127197265625, -0.01141357421875, 0.051300048828125, 0.114013671875, 0.176727294921875, 0.23944091796875, 0.302154541015625, 0.3648681640625, 0.427581787109375, 0.49029541015625, 0.553009033203125, 0.61572265625, 0.678436279296875, 0.74114990234375, 0.803863525390625, 0.8665771484375, 0.929290771484375, 0.99200439453125, 1.054718017578125, 1.117431640625, 1.180145263671875, 1.24285888671875, 1.305572509765625, 1.3682861328125, 1.430999755859375, 1.49371337890625, 1.556427001953125, 1.619140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 11.0, 10.0, 14.0, 19.0, 29.0, 37.0, 62.0, 100.0, 106.0, 139.0, 193.0, 243.0, 408.0, 725.0, 1250.0, 2656.0, 6739.0, 19749.0, 68608.0, 243339.0, 434350.0, 191038.0, 52410.0, 15709.0, 5292.0, 2301.0, 1058.0, 645.0, 375.0, 276.0, 156.0, 111.0, 98.0, 71.0, 60.0, 27.0, 40.0, 19.0, 15.0, 14.0, 12.0, 13.0, 7.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.9609375, -5.76483154296875, -5.5687255859375, -5.37261962890625, -5.176513671875, -4.98040771484375, -4.7843017578125, -4.58819580078125, -4.39208984375, -4.19598388671875, -3.9998779296875, -3.80377197265625, -3.607666015625, -3.41156005859375, -3.2154541015625, -3.01934814453125, -2.8232421875, -2.62713623046875, -2.4310302734375, -2.23492431640625, -2.038818359375, -1.84271240234375, -1.6466064453125, -1.45050048828125, -1.25439453125, -1.05828857421875, -0.8621826171875, -0.66607666015625, -0.469970703125, -0.27386474609375, -0.0777587890625, 0.11834716796875, 0.314453125, 0.51055908203125, 0.7066650390625, 0.90277099609375, 1.098876953125, 1.29498291015625, 1.4910888671875, 1.68719482421875, 1.88330078125, 2.07940673828125, 2.2755126953125, 2.47161865234375, 2.667724609375, 2.86383056640625, 3.0599365234375, 3.25604248046875, 3.4521484375, 3.64825439453125, 3.8443603515625, 4.04046630859375, 4.236572265625, 4.43267822265625, 4.6287841796875, 4.82489013671875, 5.02099609375, 5.21710205078125, 5.4132080078125, 5.60931396484375, 5.805419921875, 6.00152587890625, 6.1976318359375, 6.39373779296875, 6.58984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 7.0, 5.0, 9.0, 6.0, 12.0, 5.0, 15.0, 18.0, 19.0, 19.0, 17.0, 18.0, 35.0, 31.0, 37.0, 45.0, 32.0, 39.0, 50.0, 51.0, 30.0, 38.0, 50.0, 41.0, 40.0, 35.0, 34.0, 33.0, 28.0, 30.0, 20.0, 22.0, 17.0, 16.0, 22.0, 13.0, 12.0, 15.0, 4.0, 7.0, 3.0, 6.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.87890625, -4.7215576171875, -4.564208984375, -4.4068603515625, -4.24951171875, -4.0921630859375, -3.934814453125, -3.7774658203125, -3.6201171875, -3.4627685546875, -3.305419921875, -3.1480712890625, -2.99072265625, -2.8333740234375, -2.676025390625, -2.5186767578125, -2.361328125, -2.2039794921875, -2.046630859375, -1.8892822265625, -1.73193359375, -1.5745849609375, -1.417236328125, -1.2598876953125, -1.1025390625, -0.9451904296875, -0.787841796875, -0.6304931640625, -0.47314453125, -0.3157958984375, -0.158447265625, -0.0010986328125, 0.15625, 0.3135986328125, 0.470947265625, 0.6282958984375, 0.78564453125, 0.9429931640625, 1.100341796875, 1.2576904296875, 1.4150390625, 1.5723876953125, 1.729736328125, 1.8870849609375, 2.04443359375, 2.2017822265625, 2.359130859375, 2.5164794921875, 2.673828125, 2.8311767578125, 2.988525390625, 3.1458740234375, 3.30322265625, 3.4605712890625, 3.617919921875, 3.7752685546875, 3.9326171875, 4.0899658203125, 4.247314453125, 4.4046630859375, 4.56201171875, 4.7193603515625, 4.876708984375, 5.0340576171875, 5.19140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 3.0, 4.0, 8.0, 14.0, 14.0, 31.0, 34.0, 57.0, 96.0, 139.0, 236.0, 368.0, 595.0, 1079.0, 2014.0, 4345.0, 10659.0, 33051.0, 163973.0, 576626.0, 195680.0, 38006.0, 11811.0, 4599.0, 2258.0, 1136.0, 657.0, 364.0, 242.0, 150.0, 85.0, 63.0, 51.0, 34.0, 23.0, 12.0, 10.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.046875, -4.88690185546875, -4.7269287109375, -4.56695556640625, -4.406982421875, -4.24700927734375, -4.0870361328125, -3.92706298828125, -3.76708984375, -3.60711669921875, -3.4471435546875, -3.28717041015625, -3.127197265625, -2.96722412109375, -2.8072509765625, -2.64727783203125, -2.4873046875, -2.32733154296875, -2.1673583984375, -2.00738525390625, -1.847412109375, -1.68743896484375, -1.5274658203125, -1.36749267578125, -1.20751953125, -1.04754638671875, -0.8875732421875, -0.72760009765625, -0.567626953125, -0.40765380859375, -0.2476806640625, -0.08770751953125, 0.072265625, 0.23223876953125, 0.3922119140625, 0.55218505859375, 0.712158203125, 0.87213134765625, 1.0321044921875, 1.19207763671875, 1.35205078125, 1.51202392578125, 1.6719970703125, 1.83197021484375, 1.991943359375, 2.15191650390625, 2.3118896484375, 2.47186279296875, 2.6318359375, 2.79180908203125, 2.9517822265625, 3.11175537109375, 3.271728515625, 3.43170166015625, 3.5916748046875, 3.75164794921875, 3.91162109375, 4.07159423828125, 4.2315673828125, 4.39154052734375, 4.551513671875, 4.71148681640625, 4.8714599609375, 5.03143310546875, 5.19140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 3.0, 6.0, 6.0, 7.0, 13.0, 17.0, 29.0, 27.0, 49.0, 68.0, 108.0, 119.0, 129.0, 95.0, 78.0, 58.0, 53.0, 42.0, 23.0, 22.0, 8.0, 5.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.000911712646484375, -0.0008886009454727173, -0.0008654892444610596, -0.0008423775434494019, -0.0008192658424377441, -0.0007961541414260864, -0.0007730424404144287, -0.000749930739402771, -0.0007268190383911133, -0.0007037073373794556, -0.0006805956363677979, -0.0006574839353561401, -0.0006343722343444824, -0.0006112605333328247, -0.000588148832321167, -0.0005650371313095093, -0.0005419254302978516, -0.0005188137292861938, -0.0004957020282745361, -0.0004725903272628784, -0.0004494786262512207, -0.000426366925239563, -0.0004032552242279053, -0.00038014352321624756, -0.00035703182220458984, -0.00033392012119293213, -0.0003108084201812744, -0.0002876967191696167, -0.000264585018157959, -0.00024147331714630127, -0.00021836161613464355, -0.00019524991512298584, -0.00017213821411132812, -0.0001490265130996704, -0.0001259148120880127, -0.00010280311107635498, -7.969141006469727e-05, -5.657970905303955e-05, -3.3468008041381836e-05, -1.0356307029724121e-05, 1.2755393981933594e-05, 3.586709499359131e-05, 5.8978796005249023e-05, 8.209049701690674e-05, 0.00010520219802856445, 0.00012831389904022217, 0.00015142560005187988, 0.0001745373010635376, 0.0001976490020751953, 0.00022076070308685303, 0.00024387240409851074, 0.00026698410511016846, 0.00029009580612182617, 0.0003132075071334839, 0.0003363192081451416, 0.0003594309091567993, 0.00038254261016845703, 0.00040565431118011475, 0.00042876601219177246, 0.0004518777132034302, 0.0004749894142150879, 0.0004981011152267456, 0.0005212128162384033, 0.000544324517250061, 0.0005674362182617188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 6.0, 8.0, 13.0, 19.0, 32.0, 63.0, 66.0, 133.0, 271.0, 594.0, 1339.0, 3613.0, 13562.0, 87372.0, 768203.0, 147253.0, 18396.0, 4600.0, 1561.0, 711.0, 331.0, 152.0, 94.0, 41.0, 40.0, 21.0, 8.0, 10.0, 10.0, 8.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.9140625, -8.640625, -8.3671875, -8.09375, -7.8203125, -7.546875, -7.2734375, -7.0, -6.7265625, -6.453125, -6.1796875, -5.90625, -5.6328125, -5.359375, -5.0859375, -4.8125, -4.5390625, -4.265625, -3.9921875, -3.71875, -3.4453125, -3.171875, -2.8984375, -2.625, -2.3515625, -2.078125, -1.8046875, -1.53125, -1.2578125, -0.984375, -0.7109375, -0.4375, -0.1640625, 0.109375, 0.3828125, 0.65625, 0.9296875, 1.203125, 1.4765625, 1.75, 2.0234375, 2.296875, 2.5703125, 2.84375, 3.1171875, 3.390625, 3.6640625, 3.9375, 4.2109375, 4.484375, 4.7578125, 5.03125, 5.3046875, 5.578125, 5.8515625, 6.125, 6.3984375, 6.671875, 6.9453125, 7.21875, 7.4921875, 7.765625, 8.0390625, 8.3125, 8.5859375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 13.0, 13.0, 17.0, 31.0, 57.0, 85.0, 143.0, 195.0, 149.0, 108.0, 74.0, 38.0, 22.0, 17.0, 9.0, 9.0, 5.0, 0.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.99609375, -5.77130126953125, -5.5465087890625, -5.32171630859375, -5.096923828125, -4.87213134765625, -4.6473388671875, -4.42254638671875, -4.19775390625, -3.97296142578125, -3.7481689453125, -3.52337646484375, -3.298583984375, -3.07379150390625, -2.8489990234375, -2.62420654296875, -2.3994140625, -2.17462158203125, -1.9498291015625, -1.72503662109375, -1.500244140625, -1.27545166015625, -1.0506591796875, -0.82586669921875, -0.60107421875, -0.37628173828125, -0.1514892578125, 0.07330322265625, 0.298095703125, 0.52288818359375, 0.7476806640625, 0.97247314453125, 1.197265625, 1.42205810546875, 1.6468505859375, 1.87164306640625, 2.096435546875, 2.32122802734375, 2.5460205078125, 2.77081298828125, 2.99560546875, 3.22039794921875, 3.4451904296875, 3.66998291015625, 3.894775390625, 4.11956787109375, 4.3443603515625, 4.56915283203125, 4.7939453125, 5.01873779296875, 5.2435302734375, 5.46832275390625, 5.693115234375, 5.91790771484375, 6.1427001953125, 6.36749267578125, 6.59228515625, 6.81707763671875, 7.0418701171875, 7.26666259765625, 7.491455078125, 7.71624755859375, 7.9410400390625, 8.16583251953125, 8.390625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 28.0, 63.0, 181.0, 344.0, 230.0, 108.0, 23.0, 13.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.39596557617188, -84.50086212158203, -80.60575866699219, -76.71065521240234, -72.8155517578125, -68.92044067382812, -65.02534484863281, -61.13023376464844, -57.235130310058594, -53.34002685546875, -49.444923400878906, -45.54981994628906, -41.65471267700195, -37.75960922241211, -33.864505767822266, -29.96940040588379, -26.074298858642578, -22.179195404052734, -18.284090042114258, -14.388986587524414, -10.493882179260254, -6.598777770996094, -2.70367431640625, 1.1914310455322266, 5.08653450012207, 8.98163890838623, 12.87674331665039, 16.771846771240234, 20.666950225830078, 24.562055587768555, 28.4571590423584, 32.352264404296875, 36.24736785888672, 40.14247131347656, 44.037574768066406, 47.93267822265625, 51.82778549194336, 55.7228889465332, 59.61799240112305, 63.513099670410156, 67.408203125, 71.30330657958984, 75.19841003417969, 79.09351348876953, 82.98861694335938, 86.88372802734375, 90.77882385253906, 94.67393493652344, 98.56903076171875, 102.4641342163086, 106.35923767089844, 110.25434112548828, 114.14944458007812, 118.0445556640625, 121.93965148925781, 125.83476257324219, 129.72987365722656, 133.62498474121094, 137.52008056640625, 141.41519165039062, 145.31028747558594, 149.2053985595703, 153.10049438476562, 156.99560546875, 160.8907012939453]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 6.0, 7.0, 13.0, 13.0, 14.0, 14.0, 21.0, 22.0, 24.0, 39.0, 28.0, 40.0, 41.0, 38.0, 46.0, 48.0, 43.0, 38.0, 38.0, 46.0, 67.0, 56.0, 42.0, 29.0, 35.0, 34.0, 26.0, 21.0, 20.0, 26.0, 12.0, 6.0, 10.0, 15.0, 2.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-39.394832611083984, -38.283363342285156, -37.17189407348633, -36.0604248046875, -34.94895553588867, -33.837486267089844, -32.726016998291016, -31.614547729492188, -30.50307846069336, -29.39160919189453, -28.280139923095703, -27.168670654296875, -26.057201385498047, -24.94573211669922, -23.83426284790039, -22.722793579101562, -21.611326217651367, -20.49985694885254, -19.38838768005371, -18.276918411254883, -17.165449142456055, -16.053979873657227, -14.942511558532715, -13.831042289733887, -12.719573020935059, -11.60810375213623, -10.496634483337402, -9.38516616821289, -8.273696899414062, -7.162227153778076, -6.050758361816406, -4.939289093017578, -3.82781982421875, -2.716350555419922, -1.6048815250396729, -0.49341249465942383, 0.6180567741394043, 1.7295260429382324, 2.8409948348999023, 3.9524641036987305, 5.063933372497559, 6.175402641296387, 7.286871910095215, 8.398340225219727, 9.509809494018555, 10.621278762817383, 11.732748031616211, 12.844217300415039, 13.955686569213867, 15.067155838012695, 16.178625106811523, 17.29009437561035, 18.40156364440918, 19.513032913208008, 20.624500274658203, 21.73596954345703, 22.84743881225586, 23.958908081054688, 25.070377349853516, 26.181846618652344, 27.293315887451172, 28.40478515625, 29.516254425048828, 30.627723693847656, 31.739192962646484]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 9.0, 5.0, 15.0, 16.0, 27.0, 26.0, 61.0, 55.0, 94.0, 113.0, 153.0, 243.0, 379.0, 578.0, 1070.0, 2238.0, 5168.0, 14351.0, 57291.0, 757678.0, 3215096.0, 104361.0, 21766.0, 7176.0, 2967.0, 1427.0, 801.0, 405.0, 254.0, 178.0, 86.0, 57.0, 44.0, 23.0, 14.0, 10.0, 12.0, 6.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-14.2421875, -13.8875732421875, -13.532958984375, -13.1783447265625, -12.82373046875, -12.4691162109375, -12.114501953125, -11.7598876953125, -11.4052734375, -11.0506591796875, -10.696044921875, -10.3414306640625, -9.98681640625, -9.6322021484375, -9.277587890625, -8.9229736328125, -8.568359375, -8.2137451171875, -7.859130859375, -7.5045166015625, -7.14990234375, -6.7952880859375, -6.440673828125, -6.0860595703125, -5.7314453125, -5.3768310546875, -5.022216796875, -4.6676025390625, -4.31298828125, -3.9583740234375, -3.603759765625, -3.2491455078125, -2.89453125, -2.5399169921875, -2.185302734375, -1.8306884765625, -1.47607421875, -1.1214599609375, -0.766845703125, -0.4122314453125, -0.0576171875, 0.2969970703125, 0.651611328125, 1.0062255859375, 1.36083984375, 1.7154541015625, 2.070068359375, 2.4246826171875, 2.779296875, 3.1339111328125, 3.488525390625, 3.8431396484375, 4.19775390625, 4.5523681640625, 4.906982421875, 5.2615966796875, 5.6162109375, 5.9708251953125, 6.325439453125, 6.6800537109375, 7.03466796875, 7.3892822265625, 7.743896484375, 8.0985107421875, 8.453125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 14.0, 14.0, 18.0, 21.0, 37.0, 28.0, 45.0, 41.0, 52.0, 64.0, 63.0, 79.0, 84.0, 60.0, 64.0, 56.0, 40.0, 44.0, 35.0, 32.0, 24.0, 17.0, 11.0, 10.0, 16.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.36328125, -2.299224853515625, -2.23516845703125, -2.171112060546875, -2.1070556640625, -2.042999267578125, -1.97894287109375, -1.914886474609375, -1.850830078125, -1.786773681640625, -1.72271728515625, -1.658660888671875, -1.5946044921875, -1.530548095703125, -1.46649169921875, -1.402435302734375, -1.33837890625, -1.274322509765625, -1.21026611328125, -1.146209716796875, -1.0821533203125, -1.018096923828125, -0.95404052734375, -0.889984130859375, -0.825927734375, -0.761871337890625, -0.69781494140625, -0.633758544921875, -0.5697021484375, -0.505645751953125, -0.44158935546875, -0.377532958984375, -0.3134765625, -0.249420166015625, -0.18536376953125, -0.121307373046875, -0.0572509765625, 0.006805419921875, 0.07086181640625, 0.134918212890625, 0.198974609375, 0.263031005859375, 0.32708740234375, 0.391143798828125, 0.4552001953125, 0.519256591796875, 0.58331298828125, 0.647369384765625, 0.71142578125, 0.775482177734375, 0.83953857421875, 0.903594970703125, 0.9676513671875, 1.031707763671875, 1.09576416015625, 1.159820556640625, 1.223876953125, 1.287933349609375, 1.35198974609375, 1.416046142578125, 1.4801025390625, 1.544158935546875, 1.60821533203125, 1.672271728515625, 1.736328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 4.0, 5.0, 15.0, 12.0, 15.0, 31.0, 49.0, 103.0, 200.0, 475.0, 1432.0, 4843.0, 21374.0, 164179.0, 3575683.0, 381431.0, 34166.0, 7121.0, 1955.0, 645.0, 261.0, 105.0, 59.0, 34.0, 22.0, 12.0, 9.0, 8.0, 2.0, 2.0, 2.0, 2.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9453125, -10.599365234375, -10.25341796875, -9.907470703125, -9.5615234375, -9.215576171875, -8.86962890625, -8.523681640625, -8.177734375, -7.831787109375, -7.48583984375, -7.139892578125, -6.7939453125, -6.447998046875, -6.10205078125, -5.756103515625, -5.41015625, -5.064208984375, -4.71826171875, -4.372314453125, -4.0263671875, -3.680419921875, -3.33447265625, -2.988525390625, -2.642578125, -2.296630859375, -1.95068359375, -1.604736328125, -1.2587890625, -0.912841796875, -0.56689453125, -0.220947265625, 0.125, 0.470947265625, 0.81689453125, 1.162841796875, 1.5087890625, 1.854736328125, 2.20068359375, 2.546630859375, 2.892578125, 3.238525390625, 3.58447265625, 3.930419921875, 4.2763671875, 4.622314453125, 4.96826171875, 5.314208984375, 5.66015625, 6.006103515625, 6.35205078125, 6.697998046875, 7.0439453125, 7.389892578125, 7.73583984375, 8.081787109375, 8.427734375, 8.773681640625, 9.11962890625, 9.465576171875, 9.8115234375, 10.157470703125, 10.50341796875, 10.849365234375, 11.1953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 7.0, 6.0, 10.0, 18.0, 25.0, 32.0, 47.0, 48.0, 89.0, 155.0, 245.0, 488.0, 1048.0, 893.0, 381.0, 214.0, 119.0, 71.0, 55.0, 26.0, 22.0, 11.0, 14.0, 17.0, 5.0, 7.0, 2.0, 0.0, 2.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.826171875, -2.728118896484375, -2.63006591796875, -2.532012939453125, -2.4339599609375, -2.335906982421875, -2.23785400390625, -2.139801025390625, -2.041748046875, -1.943695068359375, -1.84564208984375, -1.747589111328125, -1.6495361328125, -1.551483154296875, -1.45343017578125, -1.355377197265625, -1.25732421875, -1.159271240234375, -1.06121826171875, -0.963165283203125, -0.8651123046875, -0.767059326171875, -0.66900634765625, -0.570953369140625, -0.472900390625, -0.374847412109375, -0.27679443359375, -0.178741455078125, -0.0806884765625, 0.017364501953125, 0.11541748046875, 0.213470458984375, 0.3115234375, 0.409576416015625, 0.50762939453125, 0.605682373046875, 0.7037353515625, 0.801788330078125, 0.89984130859375, 0.997894287109375, 1.095947265625, 1.194000244140625, 1.29205322265625, 1.390106201171875, 1.4881591796875, 1.586212158203125, 1.68426513671875, 1.782318115234375, 1.88037109375, 1.978424072265625, 2.07647705078125, 2.174530029296875, 2.2725830078125, 2.370635986328125, 2.46868896484375, 2.566741943359375, 2.664794921875, 2.762847900390625, 2.86090087890625, 2.958953857421875, 3.0570068359375, 3.155059814453125, 3.25311279296875, 3.351165771484375, 3.44921875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 12.0, 20.0, 28.0, 56.0, 63.0, 112.0, 147.0, 157.0, 100.0, 100.0, 70.0, 57.0, 27.0, 11.0, 8.0, 7.0, 4.0, 7.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.24801254272461, -18.523685455322266, -17.799358367919922, -17.075031280517578, -16.350704193115234, -15.626378059387207, -14.902050971984863, -14.177724838256836, -13.453397750854492, -12.729070663452148, -12.004743576049805, -11.280416488647461, -10.556090354919434, -9.83176326751709, -9.107436180114746, -8.383110046386719, -7.658782005310059, -6.934454917907715, -6.210128307342529, -5.4858012199401855, -4.761474609375, -4.037147521972656, -3.3128204345703125, -2.588493824005127, -1.8641667366027832, -1.1398398876190186, -0.41551291942596436, 0.30881404876708984, 1.0331408977508545, 1.7574677467346191, 2.481794834136963, 3.2061214447021484, 3.930448532104492, 4.654775619506836, 5.3791022300720215, 6.103429317474365, 6.827755928039551, 7.5520830154418945, 8.276410102844238, 9.000736236572266, 9.72506332397461, 10.449390411376953, 11.173717498779297, 11.89804458618164, 12.622370719909668, 13.346697807312012, 14.071024894714355, 14.795351028442383, 15.519679069519043, 16.24400520324707, 16.968332290649414, 17.692659378051758, 18.4169864654541, 19.141313552856445, 19.86564064025879, 20.589967727661133, 21.314294815063477, 22.03862190246582, 22.762948989868164, 23.487276077270508, 24.21160316467285, 24.935928344726562, 25.660255432128906, 26.38458251953125, 27.108909606933594]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 9.0, 10.0, 7.0, 14.0, 10.0, 17.0, 27.0, 27.0, 24.0, 43.0, 40.0, 37.0, 46.0, 61.0, 33.0, 55.0, 47.0, 52.0, 39.0, 56.0, 38.0, 41.0, 45.0, 30.0, 41.0, 25.0, 18.0, 22.0, 13.0, 19.0, 12.0, 13.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.535513877868652, -12.176068305969238, -11.816621780395508, -11.457176208496094, -11.09773063659668, -10.738285064697266, -10.378838539123535, -10.019392967224121, -9.65994644165039, -9.300500869750977, -8.941054344177246, -8.581608772277832, -8.222163200378418, -7.862717151641846, -7.503271102905273, -7.143825531005859, -6.784379959106445, -6.424933910369873, -6.065488338470459, -5.706042289733887, -5.346596717834473, -4.9871506690979, -4.627704620361328, -4.268259048461914, -3.908812999725342, -3.5493671894073486, -3.1899213790893555, -2.830475330352783, -2.47102952003479, -2.111583709716797, -1.7521376609802246, -1.3926918506622314, -1.0332469940185547, -0.6738011240959167, -0.3143552541732788, 0.045090675354003906, 0.40453648567199707, 0.7639822959899902, 1.1234283447265625, 1.4828741550445557, 1.8423199653625488, 2.201765775680542, 2.561211585998535, 2.9206576347351074, 3.2801034450531006, 3.6395492553710938, 3.998995304107666, 4.358441352844238, 4.717886924743652, 5.077332973480225, 5.436778545379639, 5.796224594116211, 6.155670166015625, 6.515116214752197, 6.8745622634887695, 7.234007835388184, 7.593453884124756, 7.952899932861328, 8.312345504760742, 8.671791076660156, 9.031237602233887, 9.3906831741333, 9.750129699707031, 10.109575271606445, 10.46902084350586]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 1.0, 4.0, 4.0, 12.0, 20.0, 18.0, 26.0, 24.0, 27.0, 55.0, 78.0, 105.0, 127.0, 245.0, 327.0, 565.0, 896.0, 1470.0, 2619.0, 5071.0, 10313.0, 23477.0, 58333.0, 159023.0, 422619.0, 227257.0, 77943.0, 30897.0, 13009.0, 6061.0, 3151.0, 1806.0, 1086.0, 644.0, 384.0, 276.0, 166.0, 98.0, 86.0, 64.0, 54.0, 20.0, 19.0, 21.0, 11.0, 11.0, 13.0, 9.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.4921875, -6.2803955078125, -6.068603515625, -5.8568115234375, -5.64501953125, -5.4332275390625, -5.221435546875, -5.0096435546875, -4.7978515625, -4.5860595703125, -4.374267578125, -4.1624755859375, -3.95068359375, -3.7388916015625, -3.527099609375, -3.3153076171875, -3.103515625, -2.8917236328125, -2.679931640625, -2.4681396484375, -2.25634765625, -2.0445556640625, -1.832763671875, -1.6209716796875, -1.4091796875, -1.1973876953125, -0.985595703125, -0.7738037109375, -0.56201171875, -0.3502197265625, -0.138427734375, 0.0733642578125, 0.28515625, 0.4969482421875, 0.708740234375, 0.9205322265625, 1.13232421875, 1.3441162109375, 1.555908203125, 1.7677001953125, 1.9794921875, 2.1912841796875, 2.403076171875, 2.6148681640625, 2.82666015625, 3.0384521484375, 3.250244140625, 3.4620361328125, 3.673828125, 3.8856201171875, 4.097412109375, 4.3092041015625, 4.52099609375, 4.7327880859375, 4.944580078125, 5.1563720703125, 5.3681640625, 5.5799560546875, 5.791748046875, 6.0035400390625, 6.21533203125, 6.4271240234375, 6.638916015625, 6.8507080078125, 7.0625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 14.0, 15.0, 20.0, 22.0, 26.0, 36.0, 41.0, 59.0, 48.0, 64.0, 75.0, 61.0, 84.0, 65.0, 67.0, 56.0, 49.0, 40.0, 27.0, 26.0, 25.0, 14.0, 14.0, 13.0, 8.0, 4.0, 5.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.345703125, -2.2800750732421875, -2.214447021484375, -2.1488189697265625, -2.08319091796875, -2.0175628662109375, -1.951934814453125, -1.8863067626953125, -1.8206787109375, -1.7550506591796875, -1.689422607421875, -1.6237945556640625, -1.55816650390625, -1.4925384521484375, -1.426910400390625, -1.3612823486328125, -1.295654296875, -1.2300262451171875, -1.164398193359375, -1.0987701416015625, -1.03314208984375, -0.9675140380859375, -0.901885986328125, -0.8362579345703125, -0.7706298828125, -0.7050018310546875, -0.639373779296875, -0.5737457275390625, -0.50811767578125, -0.4424896240234375, -0.376861572265625, -0.3112335205078125, -0.24560546875, -0.1799774169921875, -0.114349365234375, -0.0487213134765625, 0.01690673828125, 0.0825347900390625, 0.148162841796875, 0.2137908935546875, 0.2794189453125, 0.3450469970703125, 0.410675048828125, 0.4763031005859375, 0.54193115234375, 0.6075592041015625, 0.673187255859375, 0.7388153076171875, 0.804443359375, 0.8700714111328125, 0.935699462890625, 1.0013275146484375, 1.06695556640625, 1.1325836181640625, 1.198211669921875, 1.2638397216796875, 1.3294677734375, 1.3950958251953125, 1.460723876953125, 1.5263519287109375, 1.59197998046875, 1.6576080322265625, 1.723236083984375, 1.7888641357421875, 1.8544921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 7.0, 3.0, 10.0, 9.0, 14.0, 31.0, 23.0, 36.0, 49.0, 71.0, 82.0, 126.0, 142.0, 170.0, 256.0, 417.0, 609.0, 1109.0, 2288.0, 5245.0, 14995.0, 46905.0, 162637.0, 493848.0, 224350.0, 62630.0, 19495.0, 6886.0, 2590.0, 1235.0, 719.0, 422.0, 309.0, 202.0, 142.0, 112.0, 101.0, 75.0, 58.0, 43.0, 21.0, 25.0, 15.0, 15.0, 6.0, 12.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.77734375, -6.57574462890625, -6.3741455078125, -6.17254638671875, -5.970947265625, -5.76934814453125, -5.5677490234375, -5.36614990234375, -5.16455078125, -4.96295166015625, -4.7613525390625, -4.55975341796875, -4.358154296875, -4.15655517578125, -3.9549560546875, -3.75335693359375, -3.5517578125, -3.35015869140625, -3.1485595703125, -2.94696044921875, -2.745361328125, -2.54376220703125, -2.3421630859375, -2.14056396484375, -1.93896484375, -1.73736572265625, -1.5357666015625, -1.33416748046875, -1.132568359375, -0.93096923828125, -0.7293701171875, -0.52777099609375, -0.326171875, -0.12457275390625, 0.0770263671875, 0.27862548828125, 0.480224609375, 0.68182373046875, 0.8834228515625, 1.08502197265625, 1.28662109375, 1.48822021484375, 1.6898193359375, 1.89141845703125, 2.093017578125, 2.29461669921875, 2.4962158203125, 2.69781494140625, 2.8994140625, 3.10101318359375, 3.3026123046875, 3.50421142578125, 3.705810546875, 3.90740966796875, 4.1090087890625, 4.31060791015625, 4.51220703125, 4.71380615234375, 4.9154052734375, 5.11700439453125, 5.318603515625, 5.52020263671875, 5.7218017578125, 5.92340087890625, 6.125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 4.0, 6.0, 8.0, 4.0, 10.0, 15.0, 8.0, 22.0, 20.0, 29.0, 21.0, 29.0, 28.0, 36.0, 43.0, 49.0, 40.0, 46.0, 41.0, 46.0, 45.0, 44.0, 45.0, 45.0, 36.0, 35.0, 38.0, 31.0, 25.0, 27.0, 30.0, 21.0, 19.0, 11.0, 8.0, 5.0, 8.0, 11.0, 4.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.453125, -6.26788330078125, -6.0826416015625, -5.89739990234375, -5.712158203125, -5.52691650390625, -5.3416748046875, -5.15643310546875, -4.97119140625, -4.78594970703125, -4.6007080078125, -4.41546630859375, -4.230224609375, -4.04498291015625, -3.8597412109375, -3.67449951171875, -3.4892578125, -3.30401611328125, -3.1187744140625, -2.93353271484375, -2.748291015625, -2.56304931640625, -2.3778076171875, -2.19256591796875, -2.00732421875, -1.82208251953125, -1.6368408203125, -1.45159912109375, -1.266357421875, -1.08111572265625, -0.8958740234375, -0.71063232421875, -0.525390625, -0.34014892578125, -0.1549072265625, 0.03033447265625, 0.215576171875, 0.40081787109375, 0.5860595703125, 0.77130126953125, 0.95654296875, 1.14178466796875, 1.3270263671875, 1.51226806640625, 1.697509765625, 1.88275146484375, 2.0679931640625, 2.25323486328125, 2.4384765625, 2.62371826171875, 2.8089599609375, 2.99420166015625, 3.179443359375, 3.36468505859375, 3.5499267578125, 3.73516845703125, 3.92041015625, 4.10565185546875, 4.2908935546875, 4.47613525390625, 4.661376953125, 4.84661865234375, 5.0318603515625, 5.21710205078125, 5.40234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 6.0, 5.0, 9.0, 6.0, 14.0, 25.0, 35.0, 26.0, 58.0, 85.0, 160.0, 269.0, 552.0, 1249.0, 3739.0, 14176.0, 79325.0, 808676.0, 114859.0, 17867.0, 4562.0, 1531.0, 590.0, 286.0, 162.0, 89.0, 49.0, 40.0, 22.0, 31.0, 18.0, 11.0, 7.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.22265625, -6.97845458984375, -6.7342529296875, -6.49005126953125, -6.245849609375, -6.00164794921875, -5.7574462890625, -5.51324462890625, -5.26904296875, -5.02484130859375, -4.7806396484375, -4.53643798828125, -4.292236328125, -4.04803466796875, -3.8038330078125, -3.55963134765625, -3.3154296875, -3.07122802734375, -2.8270263671875, -2.58282470703125, -2.338623046875, -2.09442138671875, -1.8502197265625, -1.60601806640625, -1.36181640625, -1.11761474609375, -0.8734130859375, -0.62921142578125, -0.385009765625, -0.14080810546875, 0.1033935546875, 0.34759521484375, 0.591796875, 0.83599853515625, 1.0802001953125, 1.32440185546875, 1.568603515625, 1.81280517578125, 2.0570068359375, 2.30120849609375, 2.54541015625, 2.78961181640625, 3.0338134765625, 3.27801513671875, 3.522216796875, 3.76641845703125, 4.0106201171875, 4.25482177734375, 4.4990234375, 4.74322509765625, 4.9874267578125, 5.23162841796875, 5.475830078125, 5.72003173828125, 5.9642333984375, 6.20843505859375, 6.45263671875, 6.69683837890625, 6.9410400390625, 7.18524169921875, 7.429443359375, 7.67364501953125, 7.9178466796875, 8.16204833984375, 8.40625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 7.0, 13.0, 16.0, 11.0, 21.0, 29.0, 35.0, 58.0, 116.0, 277.0, 169.0, 67.0, 39.0, 24.0, 32.0, 25.0, 11.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007114410400390625, -0.0006826817989349365, -0.0006539225578308105, -0.0006251633167266846, -0.0005964040756225586, -0.0005676448345184326, -0.0005388855934143066, -0.0005101263523101807, -0.0004813671112060547, -0.0004526078701019287, -0.00042384862899780273, -0.00039508938789367676, -0.0003663301467895508, -0.0003375709056854248, -0.00030881166458129883, -0.00028005242347717285, -0.0002512931823730469, -0.0002225339412689209, -0.00019377470016479492, -0.00016501545906066895, -0.00013625621795654297, -0.00010749697685241699, -7.873773574829102e-05, -4.997849464416504e-05, -2.1219253540039062e-05, 7.539987564086914e-06, 3.629922866821289e-05, 6.505846977233887e-05, 9.381771087646484e-05, 0.00012257695198059082, 0.0001513361930847168, 0.00018009543418884277, 0.00020885467529296875, 0.00023761391639709473, 0.0002663731575012207, 0.0002951323986053467, 0.00032389163970947266, 0.00035265088081359863, 0.0003814101219177246, 0.0004101693630218506, 0.00043892860412597656, 0.00046768784523010254, 0.0004964470863342285, 0.0005252063274383545, 0.0005539655685424805, 0.0005827248096466064, 0.0006114840507507324, 0.0006402432918548584, 0.0006690025329589844, 0.0006977617740631104, 0.0007265210151672363, 0.0007552802562713623, 0.0007840394973754883, 0.0008127987384796143, 0.0008415579795837402, 0.0008703172206878662, 0.0008990764617919922, 0.0009278357028961182, 0.0009565949440002441, 0.0009853541851043701, 0.001014113426208496, 0.001042872667312622, 0.001071631908416748, 0.001100391149520874, 0.001129150390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 11.0, 7.0, 4.0, 9.0, 15.0, 29.0, 32.0, 47.0, 45.0, 86.0, 107.0, 256.0, 425.0, 971.0, 2420.0, 7621.0, 26882.0, 176113.0, 758087.0, 54831.0, 13621.0, 4104.0, 1414.0, 592.0, 299.0, 150.0, 119.0, 66.0, 41.0, 29.0, 29.0, 22.0, 12.0, 11.0, 11.0, 3.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.1796875, -7.93359375, -7.6875, -7.44140625, -7.1953125, -6.94921875, -6.703125, -6.45703125, -6.2109375, -5.96484375, -5.71875, -5.47265625, -5.2265625, -4.98046875, -4.734375, -4.48828125, -4.2421875, -3.99609375, -3.75, -3.50390625, -3.2578125, -3.01171875, -2.765625, -2.51953125, -2.2734375, -2.02734375, -1.78125, -1.53515625, -1.2890625, -1.04296875, -0.796875, -0.55078125, -0.3046875, -0.05859375, 0.1875, 0.43359375, 0.6796875, 0.92578125, 1.171875, 1.41796875, 1.6640625, 1.91015625, 2.15625, 2.40234375, 2.6484375, 2.89453125, 3.140625, 3.38671875, 3.6328125, 3.87890625, 4.125, 4.37109375, 4.6171875, 4.86328125, 5.109375, 5.35546875, 5.6015625, 5.84765625, 6.09375, 6.33984375, 6.5859375, 6.83203125, 7.078125, 7.32421875, 7.5703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 7.0, 6.0, 6.0, 6.0, 6.0, 5.0, 14.0, 13.0, 16.0, 21.0, 34.0, 76.0, 115.0, 207.0, 164.0, 99.0, 61.0, 29.0, 27.0, 12.0, 11.0, 5.0, 13.0, 7.0, 8.0, 6.0, 5.0, 2.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.3515625, -5.2022705078125, -5.052978515625, -4.9036865234375, -4.75439453125, -4.6051025390625, -4.455810546875, -4.3065185546875, -4.1572265625, -4.0079345703125, -3.858642578125, -3.7093505859375, -3.56005859375, -3.4107666015625, -3.261474609375, -3.1121826171875, -2.962890625, -2.8135986328125, -2.664306640625, -2.5150146484375, -2.36572265625, -2.2164306640625, -2.067138671875, -1.9178466796875, -1.7685546875, -1.6192626953125, -1.469970703125, -1.3206787109375, -1.17138671875, -1.0220947265625, -0.872802734375, -0.7235107421875, -0.57421875, -0.4249267578125, -0.275634765625, -0.1263427734375, 0.02294921875, 0.1722412109375, 0.321533203125, 0.4708251953125, 0.6201171875, 0.7694091796875, 0.918701171875, 1.0679931640625, 1.21728515625, 1.3665771484375, 1.515869140625, 1.6651611328125, 1.814453125, 1.9637451171875, 2.113037109375, 2.2623291015625, 2.41162109375, 2.5609130859375, 2.710205078125, 2.8594970703125, 3.0087890625, 3.1580810546875, 3.307373046875, 3.4566650390625, 3.60595703125, 3.7552490234375, 3.904541015625, 4.0538330078125, 4.203125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 7.0, 35.0, 112.0, 310.0, 332.0, 147.0, 45.0, 11.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.8377685546875, -114.45972442626953, -110.08168029785156, -105.7036361694336, -101.32559204101562, -96.94754791259766, -92.56950378417969, -88.19145965576172, -83.81341552734375, -79.43537139892578, -75.05732727050781, -70.67928314208984, -66.30123901367188, -61.923194885253906, -57.54515075683594, -53.16710662841797, -48.7890625, -44.41101837158203, -40.03297424316406, -35.654930114746094, -31.276885986328125, -26.898841857910156, -22.520797729492188, -18.14275360107422, -13.76470947265625, -9.386665344238281, -5.0086212158203125, -0.6305770874023438, 3.747467041015625, 8.125511169433594, 12.503555297851562, 16.88159942626953, 21.2596435546875, 25.63768768310547, 30.015731811523438, 34.393775939941406, 38.771820068359375, 43.149864196777344, 47.52790832519531, 51.90595245361328, 56.28399658203125, 60.66204071044922, 65.04008483886719, 69.41812896728516, 73.79617309570312, 78.1742172241211, 82.55226135253906, 86.93030548095703, 91.308349609375, 95.68639373779297, 100.06443786621094, 104.4424819946289, 108.82052612304688, 113.19857025146484, 117.57661437988281, 121.95465850830078, 126.33270263671875, 130.71075439453125, 135.0887908935547, 139.46682739257812, 143.84487915039062, 148.22293090820312, 152.60096740722656, 156.97900390625, 161.3570556640625]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 10.0, 3.0, 9.0, 16.0, 15.0, 15.0, 23.0, 24.0, 29.0, 28.0, 32.0, 43.0, 45.0, 59.0, 46.0, 43.0, 54.0, 47.0, 49.0, 54.0, 59.0, 41.0, 41.0, 35.0, 31.0, 30.0, 25.0, 22.0, 16.0, 10.0, 12.0, 15.0, 10.0, 2.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.448490142822266, -30.297542572021484, -29.146595001220703, -27.995647430419922, -26.84469985961914, -25.69375228881836, -24.542804718017578, -23.391857147216797, -22.240909576416016, -21.089962005615234, -19.939014434814453, -18.788066864013672, -17.63711929321289, -16.48617172241211, -15.335223197937012, -14.18427562713623, -13.033327102661133, -11.882379531860352, -10.73143196105957, -9.580484390258789, -8.429536819458008, -7.278588771820068, -6.127640724182129, -4.976693153381348, -3.8257455825805664, -2.674798011779785, -1.5238502025604248, -0.37290239334106445, 0.7780451774597168, 1.928992748260498, 3.0799407958984375, 4.230888366699219, 5.3818359375, 6.532783508300781, 7.6837310791015625, 8.834678649902344, 9.985626220703125, 11.136573791503906, 12.287522315979004, 13.438469886779785, 14.589417457580566, 15.740365028381348, 16.891313552856445, 18.042261123657227, 19.193208694458008, 20.34415626525879, 21.49510383605957, 22.64605140686035, 23.796998977661133, 24.947946548461914, 26.098894119262695, 27.249841690063477, 28.400789260864258, 29.55173683166504, 30.702686309814453, 31.853633880615234, 33.004581451416016, 34.1555290222168, 35.30647659301758, 36.45742416381836, 37.60837173461914, 38.75931930541992, 39.9102668762207, 41.061214447021484, 42.212162017822266]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 9.0, 4.0, 7.0, 14.0, 9.0, 16.0, 14.0, 19.0, 31.0, 40.0, 57.0, 55.0, 95.0, 118.0, 202.0, 294.0, 465.0, 822.0, 1390.0, 2477.0, 5181.0, 12404.0, 34921.0, 169293.0, 3416588.0, 457391.0, 59135.0, 18107.0, 7283.0, 3546.0, 1667.0, 963.0, 582.0, 372.0, 213.0, 157.0, 102.0, 80.0, 42.0, 29.0, 29.0, 17.0, 8.0, 14.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-11.8515625, -11.51953125, -11.1875, -10.85546875, -10.5234375, -10.19140625, -9.859375, -9.52734375, -9.1953125, -8.86328125, -8.53125, -8.19921875, -7.8671875, -7.53515625, -7.203125, -6.87109375, -6.5390625, -6.20703125, -5.875, -5.54296875, -5.2109375, -4.87890625, -4.546875, -4.21484375, -3.8828125, -3.55078125, -3.21875, -2.88671875, -2.5546875, -2.22265625, -1.890625, -1.55859375, -1.2265625, -0.89453125, -0.5625, -0.23046875, 0.1015625, 0.43359375, 0.765625, 1.09765625, 1.4296875, 1.76171875, 2.09375, 2.42578125, 2.7578125, 3.08984375, 3.421875, 3.75390625, 4.0859375, 4.41796875, 4.75, 5.08203125, 5.4140625, 5.74609375, 6.078125, 6.41015625, 6.7421875, 7.07421875, 7.40625, 7.73828125, 8.0703125, 8.40234375, 8.734375, 9.06640625, 9.3984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 6.0, 5.0, 13.0, 15.0, 14.0, 22.0, 33.0, 31.0, 41.0, 35.0, 54.0, 62.0, 58.0, 60.0, 70.0, 62.0, 55.0, 54.0, 59.0, 43.0, 39.0, 38.0, 26.0, 26.0, 12.0, 19.0, 14.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7509765625, -1.6872100830078125, -1.623443603515625, -1.5596771240234375, -1.49591064453125, -1.4321441650390625, -1.368377685546875, -1.3046112060546875, -1.2408447265625, -1.1770782470703125, -1.113311767578125, -1.0495452880859375, -0.98577880859375, -0.9220123291015625, -0.858245849609375, -0.7944793701171875, -0.730712890625, -0.6669464111328125, -0.603179931640625, -0.5394134521484375, -0.47564697265625, -0.4118804931640625, -0.348114013671875, -0.2843475341796875, -0.2205810546875, -0.1568145751953125, -0.093048095703125, -0.0292816162109375, 0.03448486328125, 0.0982513427734375, 0.162017822265625, 0.2257843017578125, 0.28955078125, 0.3533172607421875, 0.417083740234375, 0.4808502197265625, 0.54461669921875, 0.6083831787109375, 0.672149658203125, 0.7359161376953125, 0.7996826171875, 0.8634490966796875, 0.927215576171875, 0.9909820556640625, 1.05474853515625, 1.1185150146484375, 1.182281494140625, 1.2460479736328125, 1.309814453125, 1.3735809326171875, 1.437347412109375, 1.5011138916015625, 1.56488037109375, 1.6286468505859375, 1.692413330078125, 1.7561798095703125, 1.8199462890625, 1.8837127685546875, 1.947479248046875, 2.0112457275390625, 2.07501220703125, 2.1387786865234375, 2.202545166015625, 2.2663116455078125, 2.330078125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 14.0, 19.0, 33.0, 57.0, 84.0, 150.0, 248.0, 766.0, 23793.0, 4139068.0, 28455.0, 927.0, 271.0, 156.0, 100.0, 62.0, 37.0, 22.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.421875, -21.064697265625, -19.70751953125, -18.350341796875, -16.9931640625, -15.635986328125, -14.27880859375, -12.921630859375, -11.564453125, -10.207275390625, -8.85009765625, -7.492919921875, -6.1357421875, -4.778564453125, -3.42138671875, -2.064208984375, -0.70703125, 0.650146484375, 2.00732421875, 3.364501953125, 4.7216796875, 6.078857421875, 7.43603515625, 8.793212890625, 10.150390625, 11.507568359375, 12.86474609375, 14.221923828125, 15.5791015625, 16.936279296875, 18.29345703125, 19.650634765625, 21.0078125, 22.364990234375, 23.72216796875, 25.079345703125, 26.4365234375, 27.793701171875, 29.15087890625, 30.508056640625, 31.865234375, 33.222412109375, 34.57958984375, 35.936767578125, 37.2939453125, 38.651123046875, 40.00830078125, 41.365478515625, 42.72265625, 44.079833984375, 45.43701171875, 46.794189453125, 48.1513671875, 49.508544921875, 50.86572265625, 52.222900390625, 53.580078125, 54.937255859375, 56.29443359375, 57.651611328125, 59.0087890625, 60.365966796875, 61.72314453125, 63.080322265625, 64.4375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 3.0, 6.0, 12.0, 22.0, 36.0, 47.0, 188.0, 872.0, 2313.0, 378.0, 113.0, 47.0, 23.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.900390625, -2.643280029296875, -2.38616943359375, -2.129058837890625, -1.8719482421875, -1.614837646484375, -1.35772705078125, -1.100616455078125, -0.843505859375, -0.586395263671875, -0.32928466796875, -0.072174072265625, 0.1849365234375, 0.442047119140625, 0.69915771484375, 0.956268310546875, 1.21337890625, 1.470489501953125, 1.72760009765625, 1.984710693359375, 2.2418212890625, 2.498931884765625, 2.75604248046875, 3.013153076171875, 3.270263671875, 3.527374267578125, 3.78448486328125, 4.041595458984375, 4.2987060546875, 4.555816650390625, 4.81292724609375, 5.070037841796875, 5.3271484375, 5.584259033203125, 5.84136962890625, 6.098480224609375, 6.3555908203125, 6.612701416015625, 6.86981201171875, 7.126922607421875, 7.384033203125, 7.641143798828125, 7.89825439453125, 8.155364990234375, 8.4124755859375, 8.669586181640625, 8.92669677734375, 9.183807373046875, 9.44091796875, 9.698028564453125, 9.95513916015625, 10.212249755859375, 10.4693603515625, 10.726470947265625, 10.98358154296875, 11.240692138671875, 11.497802734375, 11.754913330078125, 12.01202392578125, 12.269134521484375, 12.5262451171875, 12.783355712890625, 13.04046630859375, 13.297576904296875, 13.5546875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 20.0, 62.0, 169.0, 285.0, 252.0, 138.0, 46.0, 8.0, 3.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.08334350585938, -83.23007202148438, -81.3768081665039, -79.5235366821289, -77.6702651977539, -75.81700134277344, -73.96372985839844, -72.11045837402344, -70.25718688964844, -68.40391540527344, -66.55065155029297, -64.69738006591797, -62.84410858154297, -60.990840911865234, -59.1375732421875, -57.2843017578125, -55.43103790283203, -53.5777702331543, -51.7244987487793, -49.87123107910156, -48.01795959472656, -46.16469192504883, -44.311424255371094, -42.458152770996094, -40.60488510131836, -38.751617431640625, -36.898345947265625, -35.04507827758789, -33.191810607910156, -31.338539123535156, -29.485271453857422, -27.632001876831055, -25.778732299804688, -23.92546272277832, -22.072193145751953, -20.21892547607422, -18.36565589904785, -16.512386322021484, -14.659117698669434, -12.805849075317383, -10.952579498291016, -9.099309921264648, -7.246041297912598, -5.392772197723389, -3.5395030975341797, -1.6862335205078125, 0.16703510284423828, 2.020303726196289, 3.8735733032226562, 5.726842403411865, 7.580111503601074, 9.433380126953125, 11.286649703979492, 13.13991928100586, 14.99318790435791, 16.84645652770996, 18.699726104736328, 20.552995681762695, 22.406265258789062, 24.259532928466797, 26.112802505493164, 27.96607208251953, 29.819339752197266, 31.672609329223633, 33.52587890625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 11.0, 26.0, 33.0, 41.0, 63.0, 70.0, 88.0, 93.0, 103.0, 108.0, 87.0, 77.0, 61.0, 50.0, 21.0, 23.0, 11.0, 15.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.83271789550781, -34.9895133972168, -34.146305084228516, -33.3031005859375, -32.45989227294922, -31.61668586730957, -30.773479461669922, -29.930274963378906, -29.087066650390625, -28.243860244750977, -27.400653839111328, -26.55744743347168, -25.71424102783203, -24.871034622192383, -24.027828216552734, -23.18462371826172, -22.34141731262207, -21.498210906982422, -20.655004501342773, -19.811798095703125, -18.968591690063477, -18.125385284423828, -17.282180786132812, -16.43897247314453, -15.5957670211792, -14.75256061553955, -13.909354209899902, -13.06614875793457, -12.222942352294922, -11.379735946655273, -10.536529541015625, -9.693323135375977, -8.850116729736328, -8.00691032409668, -7.163703918457031, -6.320497989654541, -5.477291584014893, -4.634085178375244, -3.790879249572754, -2.9476728439331055, -2.104466438293457, -1.2612601518630981, -0.41805386543273926, 0.4251523017883301, 1.2683587074279785, 2.111565113067627, 2.954771041870117, 3.7979774475097656, 4.641183853149414, 5.4843902587890625, 6.327596664428711, 7.170802593231201, 8.014009475708008, 8.857215881347656, 9.700421333312988, 10.543627738952637, 11.386834144592285, 12.230040550231934, 13.073246955871582, 13.916452407836914, 14.759658813476562, 15.602865219116211, 16.44607162475586, 17.289278030395508, 18.132484436035156]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 3.0, 8.0, 7.0, 24.0, 22.0, 23.0, 39.0, 80.0, 107.0, 130.0, 227.0, 370.0, 673.0, 1187.0, 2339.0, 5372.0, 14550.0, 45220.0, 165654.0, 519360.0, 209128.0, 54804.0, 17099.0, 6226.0, 2693.0, 1350.0, 722.0, 432.0, 216.0, 164.0, 90.0, 62.0, 48.0, 40.0, 19.0, 18.0, 9.0, 6.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.359375, -8.102783203125, -7.84619140625, -7.589599609375, -7.3330078125, -7.076416015625, -6.81982421875, -6.563232421875, -6.306640625, -6.050048828125, -5.79345703125, -5.536865234375, -5.2802734375, -5.023681640625, -4.76708984375, -4.510498046875, -4.25390625, -3.997314453125, -3.74072265625, -3.484130859375, -3.2275390625, -2.970947265625, -2.71435546875, -2.457763671875, -2.201171875, -1.944580078125, -1.68798828125, -1.431396484375, -1.1748046875, -0.918212890625, -0.66162109375, -0.405029296875, -0.1484375, 0.108154296875, 0.36474609375, 0.621337890625, 0.8779296875, 1.134521484375, 1.39111328125, 1.647705078125, 1.904296875, 2.160888671875, 2.41748046875, 2.674072265625, 2.9306640625, 3.187255859375, 3.44384765625, 3.700439453125, 3.95703125, 4.213623046875, 4.47021484375, 4.726806640625, 4.9833984375, 5.239990234375, 5.49658203125, 5.753173828125, 6.009765625, 6.266357421875, 6.52294921875, 6.779541015625, 7.0361328125, 7.292724609375, 7.54931640625, 7.805908203125, 8.0625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 16.0, 15.0, 28.0, 27.0, 42.0, 44.0, 56.0, 58.0, 71.0, 93.0, 80.0, 79.0, 68.0, 66.0, 57.0, 57.0, 36.0, 34.0, 15.0, 19.0, 5.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.978515625, -2.889434814453125, -2.80035400390625, -2.711273193359375, -2.6221923828125, -2.533111572265625, -2.44403076171875, -2.354949951171875, -2.265869140625, -2.176788330078125, -2.08770751953125, -1.998626708984375, -1.9095458984375, -1.820465087890625, -1.73138427734375, -1.642303466796875, -1.55322265625, -1.464141845703125, -1.37506103515625, -1.285980224609375, -1.1968994140625, -1.107818603515625, -1.01873779296875, -0.929656982421875, -0.840576171875, -0.751495361328125, -0.66241455078125, -0.573333740234375, -0.4842529296875, -0.395172119140625, -0.30609130859375, -0.217010498046875, -0.1279296875, -0.038848876953125, 0.05023193359375, 0.139312744140625, 0.2283935546875, 0.317474365234375, 0.40655517578125, 0.495635986328125, 0.584716796875, 0.673797607421875, 0.76287841796875, 0.851959228515625, 0.9410400390625, 1.030120849609375, 1.11920166015625, 1.208282470703125, 1.29736328125, 1.386444091796875, 1.47552490234375, 1.564605712890625, 1.6536865234375, 1.742767333984375, 1.83184814453125, 1.920928955078125, 2.010009765625, 2.099090576171875, 2.18817138671875, 2.277252197265625, 2.3663330078125, 2.455413818359375, 2.54449462890625, 2.633575439453125, 2.72265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 10.0, 8.0, 21.0, 23.0, 42.0, 58.0, 82.0, 94.0, 167.0, 304.0, 636.0, 1496.0, 5001.0, 20727.0, 106861.0, 570615.0, 280542.0, 46994.0, 10039.0, 2738.0, 977.0, 416.0, 245.0, 151.0, 103.0, 52.0, 41.0, 32.0, 15.0, 18.0, 12.0, 12.0, 7.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.203125, -7.94482421875, -7.6865234375, -7.42822265625, -7.169921875, -6.91162109375, -6.6533203125, -6.39501953125, -6.13671875, -5.87841796875, -5.6201171875, -5.36181640625, -5.103515625, -4.84521484375, -4.5869140625, -4.32861328125, -4.0703125, -3.81201171875, -3.5537109375, -3.29541015625, -3.037109375, -2.77880859375, -2.5205078125, -2.26220703125, -2.00390625, -1.74560546875, -1.4873046875, -1.22900390625, -0.970703125, -0.71240234375, -0.4541015625, -0.19580078125, 0.0625, 0.32080078125, 0.5791015625, 0.83740234375, 1.095703125, 1.35400390625, 1.6123046875, 1.87060546875, 2.12890625, 2.38720703125, 2.6455078125, 2.90380859375, 3.162109375, 3.42041015625, 3.6787109375, 3.93701171875, 4.1953125, 4.45361328125, 4.7119140625, 4.97021484375, 5.228515625, 5.48681640625, 5.7451171875, 6.00341796875, 6.26171875, 6.52001953125, 6.7783203125, 7.03662109375, 7.294921875, 7.55322265625, 7.8115234375, 8.06982421875, 8.328125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 9.0, 9.0, 11.0, 13.0, 18.0, 17.0, 29.0, 22.0, 27.0, 40.0, 26.0, 27.0, 43.0, 37.0, 36.0, 51.0, 44.0, 49.0, 47.0, 39.0, 50.0, 55.0, 33.0, 39.0, 38.0, 22.0, 32.0, 19.0, 13.0, 13.0, 13.0, 16.0, 9.0, 4.0, 9.0, 10.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.06640625, -6.869873046875, -6.67333984375, -6.476806640625, -6.2802734375, -6.083740234375, -5.88720703125, -5.690673828125, -5.494140625, -5.297607421875, -5.10107421875, -4.904541015625, -4.7080078125, -4.511474609375, -4.31494140625, -4.118408203125, -3.921875, -3.725341796875, -3.52880859375, -3.332275390625, -3.1357421875, -2.939208984375, -2.74267578125, -2.546142578125, -2.349609375, -2.153076171875, -1.95654296875, -1.760009765625, -1.5634765625, -1.366943359375, -1.17041015625, -0.973876953125, -0.77734375, -0.580810546875, -0.38427734375, -0.187744140625, 0.0087890625, 0.205322265625, 0.40185546875, 0.598388671875, 0.794921875, 0.991455078125, 1.18798828125, 1.384521484375, 1.5810546875, 1.777587890625, 1.97412109375, 2.170654296875, 2.3671875, 2.563720703125, 2.76025390625, 2.956787109375, 3.1533203125, 3.349853515625, 3.54638671875, 3.742919921875, 3.939453125, 4.135986328125, 4.33251953125, 4.529052734375, 4.7255859375, 4.922119140625, 5.11865234375, 5.315185546875, 5.51171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 7.0, 12.0, 20.0, 26.0, 42.0, 55.0, 112.0, 193.0, 345.0, 727.0, 1596.0, 4520.0, 17653.0, 114223.0, 737853.0, 142392.0, 20566.0, 4903.0, 1680.0, 761.0, 344.0, 209.0, 103.0, 65.0, 42.0, 30.0, 18.0, 14.0, 14.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.71875, -4.589630126953125, -4.46051025390625, -4.331390380859375, -4.2022705078125, -4.073150634765625, -3.94403076171875, -3.814910888671875, -3.685791015625, -3.556671142578125, -3.42755126953125, -3.298431396484375, -3.1693115234375, -3.040191650390625, -2.91107177734375, -2.781951904296875, -2.65283203125, -2.523712158203125, -2.39459228515625, -2.265472412109375, -2.1363525390625, -2.007232666015625, -1.87811279296875, -1.748992919921875, -1.619873046875, -1.490753173828125, -1.36163330078125, -1.232513427734375, -1.1033935546875, -0.974273681640625, -0.84515380859375, -0.716033935546875, -0.5869140625, -0.457794189453125, -0.32867431640625, -0.199554443359375, -0.0704345703125, 0.058685302734375, 0.18780517578125, 0.316925048828125, 0.446044921875, 0.575164794921875, 0.70428466796875, 0.833404541015625, 0.9625244140625, 1.091644287109375, 1.22076416015625, 1.349884033203125, 1.47900390625, 1.608123779296875, 1.73724365234375, 1.866363525390625, 1.9954833984375, 2.124603271484375, 2.25372314453125, 2.382843017578125, 2.511962890625, 2.641082763671875, 2.77020263671875, 2.899322509765625, 3.0284423828125, 3.157562255859375, 3.28668212890625, 3.415802001953125, 3.544921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 11.0, 13.0, 22.0, 14.0, 32.0, 48.0, 98.0, 203.0, 227.0, 140.0, 55.0, 35.0, 28.0, 18.0, 15.0, 13.0, 8.0, 3.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005292892456054688, -0.0005082637071609497, -0.00048723816871643066, -0.0004662126302719116, -0.0004451870918273926, -0.00042416155338287354, -0.0004031360149383545, -0.00038211047649383545, -0.0003610849380493164, -0.00034005939960479736, -0.0003190338611602783, -0.0002980083227157593, -0.00027698278427124023, -0.0002559572458267212, -0.00023493170738220215, -0.0002139061689376831, -0.00019288063049316406, -0.00017185509204864502, -0.00015082955360412598, -0.00012980401515960693, -0.00010877847671508789, -8.775293827056885e-05, -6.67273998260498e-05, -4.570186138153076e-05, -2.467632293701172e-05, -3.6507844924926758e-06, 1.7374753952026367e-05, 3.840029239654541e-05, 5.942583084106445e-05, 8.04513692855835e-05, 0.00010147690773010254, 0.00012250244617462158, 0.00014352798461914062, 0.00016455352306365967, 0.0001855790615081787, 0.00020660459995269775, 0.0002276301383972168, 0.00024865567684173584, 0.0002696812152862549, 0.0002907067537307739, 0.00031173229217529297, 0.000332757830619812, 0.00035378336906433105, 0.0003748089075088501, 0.00039583444595336914, 0.0004168599843978882, 0.0004378855228424072, 0.00045891106128692627, 0.0004799365997314453, 0.0005009621381759644, 0.0005219876766204834, 0.0005430132150650024, 0.0005640387535095215, 0.0005850642919540405, 0.0006060898303985596, 0.0006271153688430786, 0.0006481409072875977, 0.0006691664457321167, 0.0006901919841766357, 0.0007112175226211548, 0.0007322430610656738, 0.0007532685995101929, 0.0007742941379547119, 0.000795319676399231, 0.00081634521484375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 9.0, 16.0, 33.0, 35.0, 80.0, 208.0, 578.0, 3113.0, 58659.0, 961864.0, 21371.0, 1821.0, 459.0, 145.0, 60.0, 38.0, 24.0, 11.0, 7.0, 6.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.6575927734375, -7.315185546875, -6.9727783203125, -6.63037109375, -6.2879638671875, -5.945556640625, -5.6031494140625, -5.2607421875, -4.9183349609375, -4.575927734375, -4.2335205078125, -3.89111328125, -3.5487060546875, -3.206298828125, -2.8638916015625, -2.521484375, -2.1790771484375, -1.836669921875, -1.4942626953125, -1.15185546875, -0.8094482421875, -0.467041015625, -0.1246337890625, 0.2177734375, 0.5601806640625, 0.902587890625, 1.2449951171875, 1.58740234375, 1.9298095703125, 2.272216796875, 2.6146240234375, 2.95703125, 3.2994384765625, 3.641845703125, 3.9842529296875, 4.32666015625, 4.6690673828125, 5.011474609375, 5.3538818359375, 5.6962890625, 6.0386962890625, 6.381103515625, 6.7235107421875, 7.06591796875, 7.4083251953125, 7.750732421875, 8.0931396484375, 8.435546875, 8.7779541015625, 9.120361328125, 9.4627685546875, 9.80517578125, 10.1475830078125, 10.489990234375, 10.8323974609375, 11.1748046875, 11.5172119140625, 11.859619140625, 12.2020263671875, 12.54443359375, 12.8868408203125, 13.229248046875, 13.5716552734375, 13.9140625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 11.0, 13.0, 33.0, 43.0, 117.0, 297.0, 287.0, 94.0, 44.0, 27.0, 15.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.39337158203125, -4.1734619140625, -3.95355224609375, -3.733642578125, -3.51373291015625, -3.2938232421875, -3.07391357421875, -2.85400390625, -2.63409423828125, -2.4141845703125, -2.19427490234375, -1.974365234375, -1.75445556640625, -1.5345458984375, -1.31463623046875, -1.0947265625, -0.87481689453125, -0.6549072265625, -0.43499755859375, -0.215087890625, 0.00482177734375, 0.2247314453125, 0.44464111328125, 0.66455078125, 0.88446044921875, 1.1043701171875, 1.32427978515625, 1.544189453125, 1.76409912109375, 1.9840087890625, 2.20391845703125, 2.423828125, 2.64373779296875, 2.8636474609375, 3.08355712890625, 3.303466796875, 3.52337646484375, 3.7432861328125, 3.96319580078125, 4.18310546875, 4.40301513671875, 4.6229248046875, 4.84283447265625, 5.062744140625, 5.28265380859375, 5.5025634765625, 5.72247314453125, 5.9423828125, 6.16229248046875, 6.3822021484375, 6.60211181640625, 6.822021484375, 7.04193115234375, 7.2618408203125, 7.48175048828125, 7.70166015625, 7.92156982421875, 8.1414794921875, 8.36138916015625, 8.581298828125, 8.80120849609375, 9.0211181640625, 9.24102783203125, 9.4609375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 10.0, 50.0, 143.0, 266.0, 292.0, 157.0, 56.0, 18.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-141.76898193359375, -138.48094177246094, -135.19290161132812, -131.9048614501953, -128.6168212890625, -125.32878112792969, -122.04074096679688, -118.75270080566406, -115.46466064453125, -112.17662048339844, -108.88858032226562, -105.60054016113281, -102.3125, -99.02445983886719, -95.73641967773438, -92.44837951660156, -89.16033172607422, -85.8722915649414, -82.5842514038086, -79.29621124267578, -76.00817108154297, -72.72013092041016, -69.43208312988281, -66.14404296875, -62.85600662231445, -59.56796646118164, -56.27992630004883, -52.99188232421875, -49.70384216308594, -46.415802001953125, -43.12776184082031, -39.8397216796875, -36.55168151855469, -33.263641357421875, -29.975601196289062, -26.687559127807617, -23.399518966674805, -20.111478805541992, -16.823436737060547, -13.535396575927734, -10.247356414794922, -6.959315776824951, -3.6712751388549805, -0.38323402404785156, 2.904806137084961, 6.192846298217773, 9.480888366699219, 12.768928527832031, 16.056968688964844, 19.345008850097656, 22.63304901123047, 25.921091079711914, 29.209131240844727, 32.497169494628906, 35.785213470458984, 39.0732536315918, 42.36129379272461, 45.64933395385742, 48.937374114990234, 52.22541809082031, 55.513458251953125, 58.80149841308594, 62.08953857421875, 65.37757873535156, 68.66561889648438]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 11.0, 5.0, 8.0, 9.0, 14.0, 14.0, 17.0, 21.0, 15.0, 13.0, 25.0, 26.0, 23.0, 29.0, 17.0, 30.0, 27.0, 33.0, 25.0, 30.0, 30.0, 35.0, 46.0, 36.0, 38.0, 29.0, 34.0, 38.0, 26.0, 21.0, 31.0, 25.0, 29.0, 20.0, 17.0, 18.0, 16.0, 19.0, 14.0, 7.0, 12.0, 15.0, 15.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 0.0, 3.0], "bins": [-24.373634338378906, -23.62200355529785, -22.87037467956543, -22.118743896484375, -21.367115020751953, -20.6154842376709, -19.863853454589844, -19.112224578857422, -18.360593795776367, -17.608963012695312, -16.85733413696289, -16.105703353881836, -15.354073524475098, -14.60244369506836, -13.850813865661621, -13.099184036254883, -12.347554206848145, -11.595924377441406, -10.844294548034668, -10.09266471862793, -9.341033935546875, -8.589404106140137, -7.837774276733398, -7.086143970489502, -6.334514141082764, -5.582884311676025, -4.831254005432129, -4.079624176025391, -3.3279941082000732, -2.576364040374756, -1.8247342109680176, -1.073103904724121, -0.3214740753173828, 0.4301559329032898, 1.1817859411239624, 1.9334158897399902, 2.6850459575653076, 3.436676025390625, 4.188305854797363, 4.93993616104126, 5.691565990447998, 6.443195819854736, 7.194826126098633, 7.946455955505371, 8.69808578491211, 9.449716567993164, 10.201345443725586, 10.95297622680664, 11.704606056213379, 12.456235885620117, 13.207865715026855, 13.959495544433594, 14.711126327514648, 15.462756156921387, 16.214385986328125, 16.96601676940918, 17.7176456451416, 18.469276428222656, 19.220905303955078, 19.972536087036133, 20.724164962768555, 21.47579574584961, 22.22742462158203, 22.979055404663086, 23.73068618774414]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 7.0, 3.0, 10.0, 12.0, 14.0, 16.0, 23.0, 23.0, 31.0, 29.0, 40.0, 60.0, 71.0, 78.0, 116.0, 191.0, 259.0, 352.0, 638.0, 1068.0, 1869.0, 3518.0, 7093.0, 16974.0, 50414.0, 343597.0, 3552809.0, 154999.0, 34244.0, 12653.0, 5716.0, 2975.0, 1709.0, 964.0, 599.0, 378.0, 220.0, 162.0, 96.0, 68.0, 52.0, 36.0, 22.0, 16.0, 9.0, 12.0, 10.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0], "bins": [-12.234375, -11.90673828125, -11.5791015625, -11.25146484375, -10.923828125, -10.59619140625, -10.2685546875, -9.94091796875, -9.61328125, -9.28564453125, -8.9580078125, -8.63037109375, -8.302734375, -7.97509765625, -7.6474609375, -7.31982421875, -6.9921875, -6.66455078125, -6.3369140625, -6.00927734375, -5.681640625, -5.35400390625, -5.0263671875, -4.69873046875, -4.37109375, -4.04345703125, -3.7158203125, -3.38818359375, -3.060546875, -2.73291015625, -2.4052734375, -2.07763671875, -1.75, -1.42236328125, -1.0947265625, -0.76708984375, -0.439453125, -0.11181640625, 0.2158203125, 0.54345703125, 0.87109375, 1.19873046875, 1.5263671875, 1.85400390625, 2.181640625, 2.50927734375, 2.8369140625, 3.16455078125, 3.4921875, 3.81982421875, 4.1474609375, 4.47509765625, 4.802734375, 5.13037109375, 5.4580078125, 5.78564453125, 6.11328125, 6.44091796875, 6.7685546875, 7.09619140625, 7.423828125, 7.75146484375, 8.0791015625, 8.40673828125, 8.734375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 4.0, 11.0, 11.0, 22.0, 27.0, 30.0, 36.0, 43.0, 51.0, 70.0, 66.0, 69.0, 70.0, 60.0, 72.0, 66.0, 54.0, 43.0, 48.0, 35.0, 25.0, 20.0, 22.0, 15.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.720703125, -2.637542724609375, -2.55438232421875, -2.471221923828125, -2.3880615234375, -2.304901123046875, -2.22174072265625, -2.138580322265625, -2.055419921875, -1.972259521484375, -1.88909912109375, -1.805938720703125, -1.7227783203125, -1.639617919921875, -1.55645751953125, -1.473297119140625, -1.39013671875, -1.306976318359375, -1.22381591796875, -1.140655517578125, -1.0574951171875, -0.974334716796875, -0.89117431640625, -0.808013916015625, -0.724853515625, -0.641693115234375, -0.55853271484375, -0.475372314453125, -0.3922119140625, -0.309051513671875, -0.22589111328125, -0.142730712890625, -0.0595703125, 0.023590087890625, 0.10675048828125, 0.189910888671875, 0.2730712890625, 0.356231689453125, 0.43939208984375, 0.522552490234375, 0.605712890625, 0.688873291015625, 0.77203369140625, 0.855194091796875, 0.9383544921875, 1.021514892578125, 1.10467529296875, 1.187835693359375, 1.27099609375, 1.354156494140625, 1.43731689453125, 1.520477294921875, 1.6036376953125, 1.686798095703125, 1.76995849609375, 1.853118896484375, 1.936279296875, 2.019439697265625, 2.10260009765625, 2.185760498046875, 2.2689208984375, 2.352081298828125, 2.43524169921875, 2.518402099609375, 2.6015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 11.0, 24.0, 19.0, 40.0, 45.0, 78.0, 133.0, 268.0, 683.0, 2832.0, 15401.0, 297292.0, 3828920.0, 41206.0, 5256.0, 1203.0, 402.0, 183.0, 104.0, 62.0, 46.0, 22.0, 22.0, 9.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.75, -21.030029296875, -20.31005859375, -19.590087890625, -18.8701171875, -18.150146484375, -17.43017578125, -16.710205078125, -15.990234375, -15.270263671875, -14.55029296875, -13.830322265625, -13.1103515625, -12.390380859375, -11.67041015625, -10.950439453125, -10.23046875, -9.510498046875, -8.79052734375, -8.070556640625, -7.3505859375, -6.630615234375, -5.91064453125, -5.190673828125, -4.470703125, -3.750732421875, -3.03076171875, -2.310791015625, -1.5908203125, -0.870849609375, -0.15087890625, 0.569091796875, 1.2890625, 2.009033203125, 2.72900390625, 3.448974609375, 4.1689453125, 4.888916015625, 5.60888671875, 6.328857421875, 7.048828125, 7.768798828125, 8.48876953125, 9.208740234375, 9.9287109375, 10.648681640625, 11.36865234375, 12.088623046875, 12.80859375, 13.528564453125, 14.24853515625, 14.968505859375, 15.6884765625, 16.408447265625, 17.12841796875, 17.848388671875, 18.568359375, 19.288330078125, 20.00830078125, 20.728271484375, 21.4482421875, 22.168212890625, 22.88818359375, 23.608154296875, 24.328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 6.0, 6.0, 11.0, 14.0, 16.0, 27.0, 39.0, 62.0, 128.0, 354.0, 1937.0, 934.0, 248.0, 99.0, 64.0, 31.0, 31.0, 20.0, 17.0, 11.0, 6.0, 4.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.720703125, -3.564666748046875, -3.40863037109375, -3.252593994140625, -3.0965576171875, -2.940521240234375, -2.78448486328125, -2.628448486328125, -2.472412109375, -2.316375732421875, -2.16033935546875, -2.004302978515625, -1.8482666015625, -1.692230224609375, -1.53619384765625, -1.380157470703125, -1.22412109375, -1.068084716796875, -0.91204833984375, -0.756011962890625, -0.5999755859375, -0.443939208984375, -0.28790283203125, -0.131866455078125, 0.024169921875, 0.180206298828125, 0.33624267578125, 0.492279052734375, 0.6483154296875, 0.804351806640625, 0.96038818359375, 1.116424560546875, 1.2724609375, 1.428497314453125, 1.58453369140625, 1.740570068359375, 1.8966064453125, 2.052642822265625, 2.20867919921875, 2.364715576171875, 2.520751953125, 2.676788330078125, 2.83282470703125, 2.988861083984375, 3.1448974609375, 3.300933837890625, 3.45697021484375, 3.613006591796875, 3.76904296875, 3.925079345703125, 4.08111572265625, 4.237152099609375, 4.3931884765625, 4.549224853515625, 4.70526123046875, 4.861297607421875, 5.017333984375, 5.173370361328125, 5.32940673828125, 5.485443115234375, 5.6414794921875, 5.797515869140625, 5.95355224609375, 6.109588623046875, 6.265625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 18.0, 29.0, 64.0, 185.0, 257.0, 243.0, 107.0, 51.0, 24.0, 12.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.457000732421875, -49.04761505126953, -47.63822937011719, -46.22884750366211, -44.819461822509766, -43.41007614135742, -42.000694274902344, -40.59130859375, -39.181922912597656, -37.77253723144531, -36.36315155029297, -34.95376968383789, -33.54438400268555, -32.1349983215332, -30.725614547729492, -29.31623077392578, -27.906845092773438, -26.497459411621094, -25.088075637817383, -23.678691864013672, -22.269306182861328, -20.859920501708984, -19.450536727905273, -18.041152954101562, -16.63176727294922, -15.222382545471191, -13.812997817993164, -12.403613090515137, -10.99422836303711, -9.584843635559082, -8.175458908081055, -6.766074180603027, -5.356689453125, -3.9473047256469727, -2.5379199981689453, -1.128535270690918, 0.2808494567871094, 1.6902341842651367, 3.099618911743164, 4.509003639221191, 5.918388366699219, 7.327773094177246, 8.737157821655273, 10.1465425491333, 11.555927276611328, 12.965312004089355, 14.374696731567383, 15.78408145904541, 17.193466186523438, 18.60285186767578, 20.012235641479492, 21.421619415283203, 22.831005096435547, 24.24039077758789, 25.6497745513916, 27.059158325195312, 28.468544006347656, 29.8779296875, 31.28731346130371, 32.69669723510742, 34.106082916259766, 35.51546859741211, 36.92485046386719, 38.33423614501953, 39.743621826171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 8.0, 6.0, 9.0, 14.0, 19.0, 16.0, 18.0, 33.0, 39.0, 37.0, 50.0, 40.0, 46.0, 57.0, 57.0, 60.0, 62.0, 61.0, 54.0, 48.0, 45.0, 41.0, 27.0, 28.0, 32.0, 17.0, 19.0, 20.0, 6.0, 8.0, 6.0, 5.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.785520553588867, -15.313078880310059, -14.840636253356934, -14.368194580078125, -13.895752906799316, -13.423310279846191, -12.950868606567383, -12.478425979614258, -12.00598430633545, -11.53354263305664, -11.061100006103516, -10.588658332824707, -10.116216659545898, -9.643774032592773, -9.171332359313965, -8.698890686035156, -8.226448059082031, -7.7540059089660645, -7.281564235687256, -6.809122085571289, -6.336679935455322, -5.8642377853393555, -5.391796112060547, -4.91935396194458, -4.44691276550293, -3.974470853805542, -3.502028703689575, -3.0295867919921875, -2.5571446418762207, -2.084702730178833, -1.6122608184814453, -1.1398186683654785, -0.6673765182495117, -0.19493451714515686, 0.277507483959198, 0.7499494552612305, 1.2223914861679077, 1.694833517074585, 2.1672754287719727, 2.6397175788879395, 3.112159490585327, 3.584601402282715, 4.057043552398682, 4.529485702514648, 5.001927375793457, 5.474369525909424, 5.946811676025391, 6.419253349304199, 6.891695499420166, 7.364137649536133, 7.836579322814941, 8.30902099609375, 8.781463623046875, 9.253905296325684, 9.726346969604492, 10.198789596557617, 10.671231269836426, 11.143672943115234, 11.61611557006836, 12.088557243347168, 12.560998916625977, 13.033441543579102, 13.50588321685791, 13.978324890136719, 14.450767517089844]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 6.0, 12.0, 23.0, 24.0, 29.0, 39.0, 48.0, 98.0, 119.0, 177.0, 246.0, 377.0, 645.0, 1130.0, 2132.0, 4121.0, 8720.0, 19663.0, 48892.0, 131118.0, 331634.0, 303775.0, 116975.0, 44127.0, 17924.0, 7912.0, 3831.0, 1917.0, 1081.0, 622.0, 400.0, 213.0, 157.0, 94.0, 80.0, 52.0, 29.0, 28.0, 25.0, 14.0, 10.0, 6.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.19140625, -6.95123291015625, -6.7110595703125, -6.47088623046875, -6.230712890625, -5.99053955078125, -5.7503662109375, -5.51019287109375, -5.27001953125, -5.02984619140625, -4.7896728515625, -4.54949951171875, -4.309326171875, -4.06915283203125, -3.8289794921875, -3.58880615234375, -3.3486328125, -3.10845947265625, -2.8682861328125, -2.62811279296875, -2.387939453125, -2.14776611328125, -1.9075927734375, -1.66741943359375, -1.42724609375, -1.18707275390625, -0.9468994140625, -0.70672607421875, -0.466552734375, -0.22637939453125, 0.0137939453125, 0.25396728515625, 0.494140625, 0.73431396484375, 0.9744873046875, 1.21466064453125, 1.454833984375, 1.69500732421875, 1.9351806640625, 2.17535400390625, 2.41552734375, 2.65570068359375, 2.8958740234375, 3.13604736328125, 3.376220703125, 3.61639404296875, 3.8565673828125, 4.09674072265625, 4.3369140625, 4.57708740234375, 4.8172607421875, 5.05743408203125, 5.297607421875, 5.53778076171875, 5.7779541015625, 6.01812744140625, 6.25830078125, 6.49847412109375, 6.7386474609375, 6.97882080078125, 7.218994140625, 7.45916748046875, 7.6993408203125, 7.93951416015625, 8.1796875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 10.0, 12.0, 13.0, 18.0, 30.0, 26.0, 42.0, 41.0, 46.0, 53.0, 66.0, 63.0, 63.0, 62.0, 72.0, 62.0, 56.0, 39.0, 39.0, 36.0, 33.0, 33.0, 29.0, 12.0, 12.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.564239501953125, -2.48199462890625, -2.399749755859375, -2.3175048828125, -2.235260009765625, -2.15301513671875, -2.070770263671875, -1.988525390625, -1.906280517578125, -1.82403564453125, -1.741790771484375, -1.6595458984375, -1.577301025390625, -1.49505615234375, -1.412811279296875, -1.33056640625, -1.248321533203125, -1.16607666015625, -1.083831787109375, -1.0015869140625, -0.919342041015625, -0.83709716796875, -0.754852294921875, -0.672607421875, -0.590362548828125, -0.50811767578125, -0.425872802734375, -0.3436279296875, -0.261383056640625, -0.17913818359375, -0.096893310546875, -0.0146484375, 0.067596435546875, 0.14984130859375, 0.232086181640625, 0.3143310546875, 0.396575927734375, 0.47882080078125, 0.561065673828125, 0.643310546875, 0.725555419921875, 0.80780029296875, 0.890045166015625, 0.9722900390625, 1.054534912109375, 1.13677978515625, 1.219024658203125, 1.30126953125, 1.383514404296875, 1.46575927734375, 1.548004150390625, 1.6302490234375, 1.712493896484375, 1.79473876953125, 1.876983642578125, 1.959228515625, 2.041473388671875, 2.12371826171875, 2.205963134765625, 2.2882080078125, 2.370452880859375, 2.45269775390625, 2.534942626953125, 2.6171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 7.0, 9.0, 11.0, 20.0, 34.0, 32.0, 54.0, 99.0, 121.0, 184.0, 295.0, 518.0, 1033.0, 2937.0, 13983.0, 121381.0, 702299.0, 179612.0, 19526.0, 3684.0, 1204.0, 562.0, 292.0, 224.0, 129.0, 99.0, 61.0, 36.0, 32.0, 21.0, 15.0, 14.0, 4.0, 4.0, 8.0, 0.0, 0.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2890625, -11.8736572265625, -11.458251953125, -11.0428466796875, -10.62744140625, -10.2120361328125, -9.796630859375, -9.3812255859375, -8.9658203125, -8.5504150390625, -8.135009765625, -7.7196044921875, -7.30419921875, -6.8887939453125, -6.473388671875, -6.0579833984375, -5.642578125, -5.2271728515625, -4.811767578125, -4.3963623046875, -3.98095703125, -3.5655517578125, -3.150146484375, -2.7347412109375, -2.3193359375, -1.9039306640625, -1.488525390625, -1.0731201171875, -0.65771484375, -0.2423095703125, 0.173095703125, 0.5885009765625, 1.00390625, 1.4193115234375, 1.834716796875, 2.2501220703125, 2.66552734375, 3.0809326171875, 3.496337890625, 3.9117431640625, 4.3271484375, 4.7425537109375, 5.157958984375, 5.5733642578125, 5.98876953125, 6.4041748046875, 6.819580078125, 7.2349853515625, 7.650390625, 8.0657958984375, 8.481201171875, 8.8966064453125, 9.31201171875, 9.7274169921875, 10.142822265625, 10.5582275390625, 10.9736328125, 11.3890380859375, 11.804443359375, 12.2198486328125, 12.63525390625, 13.0506591796875, 13.466064453125, 13.8814697265625, 14.296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 6.0, 11.0, 11.0, 14.0, 20.0, 16.0, 21.0, 34.0, 40.0, 43.0, 47.0, 56.0, 52.0, 44.0, 60.0, 66.0, 51.0, 52.0, 41.0, 45.0, 36.0, 32.0, 47.0, 39.0, 20.0, 15.0, 22.0, 8.0, 11.0, 7.0, 3.0, 2.0, 10.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8203125, -7.5201416015625, -7.219970703125, -6.9197998046875, -6.61962890625, -6.3194580078125, -6.019287109375, -5.7191162109375, -5.4189453125, -5.1187744140625, -4.818603515625, -4.5184326171875, -4.21826171875, -3.9180908203125, -3.617919921875, -3.3177490234375, -3.017578125, -2.7174072265625, -2.417236328125, -2.1170654296875, -1.81689453125, -1.5167236328125, -1.216552734375, -0.9163818359375, -0.6162109375, -0.3160400390625, -0.015869140625, 0.2843017578125, 0.58447265625, 0.8846435546875, 1.184814453125, 1.4849853515625, 1.78515625, 2.0853271484375, 2.385498046875, 2.6856689453125, 2.98583984375, 3.2860107421875, 3.586181640625, 3.8863525390625, 4.1865234375, 4.4866943359375, 4.786865234375, 5.0870361328125, 5.38720703125, 5.6873779296875, 5.987548828125, 6.2877197265625, 6.587890625, 6.8880615234375, 7.188232421875, 7.4884033203125, 7.78857421875, 8.0887451171875, 8.388916015625, 8.6890869140625, 8.9892578125, 9.2894287109375, 9.589599609375, 9.8897705078125, 10.18994140625, 10.4901123046875, 10.790283203125, 11.0904541015625, 11.390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 11.0, 9.0, 16.0, 12.0, 31.0, 52.0, 72.0, 117.0, 162.0, 274.0, 510.0, 843.0, 1660.0, 3487.0, 8453.0, 23443.0, 78349.0, 377409.0, 425679.0, 86118.0, 25179.0, 8891.0, 3781.0, 1733.0, 946.0, 490.0, 301.0, 175.0, 105.0, 76.0, 44.0, 34.0, 22.0, 9.0, 12.0, 10.0, 4.0, 9.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.63671875, -3.502197265625, -3.36767578125, -3.233154296875, -3.0986328125, -2.964111328125, -2.82958984375, -2.695068359375, -2.560546875, -2.426025390625, -2.29150390625, -2.156982421875, -2.0224609375, -1.887939453125, -1.75341796875, -1.618896484375, -1.484375, -1.349853515625, -1.21533203125, -1.080810546875, -0.9462890625, -0.811767578125, -0.67724609375, -0.542724609375, -0.408203125, -0.273681640625, -0.13916015625, -0.004638671875, 0.1298828125, 0.264404296875, 0.39892578125, 0.533447265625, 0.66796875, 0.802490234375, 0.93701171875, 1.071533203125, 1.2060546875, 1.340576171875, 1.47509765625, 1.609619140625, 1.744140625, 1.878662109375, 2.01318359375, 2.147705078125, 2.2822265625, 2.416748046875, 2.55126953125, 2.685791015625, 2.8203125, 2.954833984375, 3.08935546875, 3.223876953125, 3.3583984375, 3.492919921875, 3.62744140625, 3.761962890625, 3.896484375, 4.031005859375, 4.16552734375, 4.300048828125, 4.4345703125, 4.569091796875, 4.70361328125, 4.838134765625, 4.97265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 10.0, 5.0, 10.0, 14.0, 13.0, 23.0, 24.0, 30.0, 27.0, 38.0, 36.0, 75.0, 132.0, 161.0, 98.0, 64.0, 52.0, 43.0, 25.0, 26.0, 18.0, 16.0, 10.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005898475646972656, -0.0005674213171005249, -0.0005449950695037842, -0.0005225688219070435, -0.0005001425743103027, -0.000477716326713562, -0.0004552900791168213, -0.00043286383152008057, -0.00041043758392333984, -0.0003880113363265991, -0.0003655850887298584, -0.0003431588411331177, -0.00032073259353637695, -0.00029830634593963623, -0.0002758800983428955, -0.0002534538507461548, -0.00023102760314941406, -0.00020860135555267334, -0.00018617510795593262, -0.0001637488603591919, -0.00014132261276245117, -0.00011889636516571045, -9.647011756896973e-05, -7.4043869972229e-05, -5.161762237548828e-05, -2.919137477874756e-05, -6.765127182006836e-06, 1.5661120414733887e-05, 3.808736801147461e-05, 6.051361560821533e-05, 8.293986320495605e-05, 0.00010536611080169678, 0.0001277923583984375, 0.00015021860599517822, 0.00017264485359191895, 0.00019507110118865967, 0.0002174973487854004, 0.0002399235963821411, 0.00026234984397888184, 0.00028477609157562256, 0.0003072023391723633, 0.000329628586769104, 0.0003520548343658447, 0.00037448108196258545, 0.00039690732955932617, 0.0004193335771560669, 0.0004417598247528076, 0.00046418607234954834, 0.00048661231994628906, 0.0005090385675430298, 0.0005314648151397705, 0.0005538910627365112, 0.000576317310333252, 0.0005987435579299927, 0.0006211698055267334, 0.0006435960531234741, 0.0006660223007202148, 0.0006884485483169556, 0.0007108747959136963, 0.000733301043510437, 0.0007557272911071777, 0.0007781535387039185, 0.0008005797863006592, 0.0008230060338973999, 0.0008454322814941406]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 3.0, 5.0, 7.0, 3.0, 8.0, 15.0, 16.0, 23.0, 41.0, 59.0, 52.0, 119.0, 209.0, 377.0, 967.0, 2789.0, 11994.0, 99006.0, 808985.0, 106318.0, 12593.0, 3038.0, 988.0, 388.0, 186.0, 121.0, 73.0, 49.0, 21.0, 24.0, 12.0, 6.0, 11.0, 11.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.7265625, -10.406494140625, -10.08642578125, -9.766357421875, -9.4462890625, -9.126220703125, -8.80615234375, -8.486083984375, -8.166015625, -7.845947265625, -7.52587890625, -7.205810546875, -6.8857421875, -6.565673828125, -6.24560546875, -5.925537109375, -5.60546875, -5.285400390625, -4.96533203125, -4.645263671875, -4.3251953125, -4.005126953125, -3.68505859375, -3.364990234375, -3.044921875, -2.724853515625, -2.40478515625, -2.084716796875, -1.7646484375, -1.444580078125, -1.12451171875, -0.804443359375, -0.484375, -0.164306640625, 0.15576171875, 0.475830078125, 0.7958984375, 1.115966796875, 1.43603515625, 1.756103515625, 2.076171875, 2.396240234375, 2.71630859375, 3.036376953125, 3.3564453125, 3.676513671875, 3.99658203125, 4.316650390625, 4.63671875, 4.956787109375, 5.27685546875, 5.596923828125, 5.9169921875, 6.237060546875, 6.55712890625, 6.877197265625, 7.197265625, 7.517333984375, 7.83740234375, 8.157470703125, 8.4775390625, 8.797607421875, 9.11767578125, 9.437744140625, 9.7578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 13.0, 16.0, 21.0, 33.0, 30.0, 41.0, 54.0, 77.0, 98.0, 114.0, 113.0, 87.0, 70.0, 50.0, 43.0, 29.0, 26.0, 14.0, 12.0, 12.0, 10.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.3232421875, -5.150390625, -4.9775390625, -4.8046875, -4.6318359375, -4.458984375, -4.2861328125, -4.11328125, -3.9404296875, -3.767578125, -3.5947265625, -3.421875, -3.2490234375, -3.076171875, -2.9033203125, -2.73046875, -2.5576171875, -2.384765625, -2.2119140625, -2.0390625, -1.8662109375, -1.693359375, -1.5205078125, -1.34765625, -1.1748046875, -1.001953125, -0.8291015625, -0.65625, -0.4833984375, -0.310546875, -0.1376953125, 0.03515625, 0.2080078125, 0.380859375, 0.5537109375, 0.7265625, 0.8994140625, 1.072265625, 1.2451171875, 1.41796875, 1.5908203125, 1.763671875, 1.9365234375, 2.109375, 2.2822265625, 2.455078125, 2.6279296875, 2.80078125, 2.9736328125, 3.146484375, 3.3193359375, 3.4921875, 3.6650390625, 3.837890625, 4.0107421875, 4.18359375, 4.3564453125, 4.529296875, 4.7021484375, 4.875, 5.0478515625, 5.220703125, 5.3935546875, 5.56640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 10.0, 33.0, 74.0, 124.0, 209.0, 222.0, 149.0, 101.0, 42.0, 23.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.42138671875, -102.9936294555664, -99.56586456298828, -96.13810729980469, -92.71034240722656, -89.28258514404297, -85.85482788085938, -82.42706298828125, -78.99929809570312, -75.57154083251953, -72.1437759399414, -68.71601867675781, -65.28825378417969, -61.860496520996094, -58.432735443115234, -55.004974365234375, -51.57721710205078, -48.14945602416992, -44.72169494628906, -41.29393768310547, -37.866172790527344, -34.43841552734375, -31.01065444946289, -27.58289337158203, -24.155132293701172, -20.727371215820312, -17.299610137939453, -13.871850967407227, -10.444089889526367, -7.016328811645508, -3.5885696411132812, -0.16080856323242188, 3.2669525146484375, 6.694713115692139, 10.12247371673584, 13.550233840942383, 16.977994918823242, 20.4057559967041, 23.833515167236328, 27.261276245117188, 30.689037322998047, 34.116798400878906, 37.544559478759766, 40.972320556640625, 44.40007781982422, 47.827842712402344, 51.25559997558594, 54.6833610534668, 58.111122131347656, 61.538883209228516, 64.96664428710938, 68.39440155029297, 71.8221664428711, 75.24992370605469, 78.67768859863281, 82.1054458618164, 85.533203125, 88.9609603881836, 92.38872528076172, 95.81648254394531, 99.24424743652344, 102.67200469970703, 106.09976196289062, 109.52752685546875, 112.95529174804688]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 4.0, 4.0, 8.0, 13.0, 16.0, 17.0, 22.0, 16.0, 23.0, 22.0, 42.0, 30.0, 32.0, 46.0, 51.0, 52.0, 57.0, 53.0, 40.0, 47.0, 42.0, 47.0, 39.0, 35.0, 40.0, 42.0, 23.0, 32.0, 20.0, 13.0, 21.0, 13.0, 9.0, 8.0, 10.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-47.68927001953125, -46.214752197265625, -44.740230560302734, -43.26571273803711, -41.79119110107422, -40.316673278808594, -38.8421516418457, -37.36763381958008, -35.89311218261719, -34.41859436035156, -32.94407272338867, -31.469552993774414, -29.995033264160156, -28.5205135345459, -27.04599380493164, -25.571475982666016, -24.096956253051758, -22.6224365234375, -21.147916793823242, -19.673397064208984, -18.198877334594727, -16.72435760498047, -15.249838829040527, -13.77531909942627, -12.300799369812012, -10.826279640197754, -9.351759910583496, -7.8772406578063965, -6.402720928192139, -4.928201198577881, -3.4536819458007812, -1.9791622161865234, -0.5046424865722656, 0.9698771238327026, 2.444396734237671, 3.9189162254333496, 5.393435955047607, 6.867955684661865, 8.342474937438965, 9.816994667053223, 11.29151439666748, 12.766034126281738, 14.240553855895996, 15.715072631835938, 17.189592361450195, 18.664112091064453, 20.13863182067871, 21.61315155029297, 23.087671279907227, 24.562191009521484, 26.036710739135742, 27.51123046875, 28.985750198364258, 30.460269927978516, 31.93478775024414, 33.40930938720703, 34.883827209472656, 36.35834503173828, 37.83286666870117, 39.3073844909668, 40.78190612792969, 42.25642395019531, 43.7309455871582, 45.20546340942383, 46.67998504638672]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 13.0, 16.0, 17.0, 12.0, 15.0, 19.0, 23.0, 33.0, 40.0, 59.0, 83.0, 96.0, 154.0, 266.0, 429.0, 638.0, 1193.0, 2233.0, 4711.0, 11164.0, 32407.0, 152012.0, 3459544.0, 441890.0, 55969.0, 16970.0, 6907.0, 3242.0, 1683.0, 949.0, 555.0, 336.0, 200.0, 129.0, 72.0, 55.0, 40.0, 30.0, 24.0, 11.0, 8.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.28125, -11.9466552734375, -11.612060546875, -11.2774658203125, -10.94287109375, -10.6082763671875, -10.273681640625, -9.9390869140625, -9.6044921875, -9.2698974609375, -8.935302734375, -8.6007080078125, -8.26611328125, -7.9315185546875, -7.596923828125, -7.2623291015625, -6.927734375, -6.5931396484375, -6.258544921875, -5.9239501953125, -5.58935546875, -5.2547607421875, -4.920166015625, -4.5855712890625, -4.2509765625, -3.9163818359375, -3.581787109375, -3.2471923828125, -2.91259765625, -2.5780029296875, -2.243408203125, -1.9088134765625, -1.57421875, -1.2396240234375, -0.905029296875, -0.5704345703125, -0.23583984375, 0.0987548828125, 0.433349609375, 0.7679443359375, 1.1025390625, 1.4371337890625, 1.771728515625, 2.1063232421875, 2.44091796875, 2.7755126953125, 3.110107421875, 3.4447021484375, 3.779296875, 4.1138916015625, 4.448486328125, 4.7830810546875, 5.11767578125, 5.4522705078125, 5.786865234375, 6.1214599609375, 6.4560546875, 6.7906494140625, 7.125244140625, 7.4598388671875, 7.79443359375, 8.1290283203125, 8.463623046875, 8.7982177734375, 9.1328125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 13.0, 9.0, 16.0, 21.0, 25.0, 34.0, 40.0, 36.0, 52.0, 55.0, 44.0, 67.0, 54.0, 56.0, 58.0, 52.0, 47.0, 45.0, 43.0, 40.0, 28.0, 29.0, 28.0, 24.0, 17.0, 9.0, 10.0, 7.0, 11.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.240234375, -2.161712646484375, -2.08319091796875, -2.004669189453125, -1.9261474609375, -1.847625732421875, -1.76910400390625, -1.690582275390625, -1.612060546875, -1.533538818359375, -1.45501708984375, -1.376495361328125, -1.2979736328125, -1.219451904296875, -1.14093017578125, -1.062408447265625, -0.98388671875, -0.905364990234375, -0.82684326171875, -0.748321533203125, -0.6697998046875, -0.591278076171875, -0.51275634765625, -0.434234619140625, -0.355712890625, -0.277191162109375, -0.19866943359375, -0.120147705078125, -0.0416259765625, 0.036895751953125, 0.11541748046875, 0.193939208984375, 0.2724609375, 0.350982666015625, 0.42950439453125, 0.508026123046875, 0.5865478515625, 0.665069580078125, 0.74359130859375, 0.822113037109375, 0.900634765625, 0.979156494140625, 1.05767822265625, 1.136199951171875, 1.2147216796875, 1.293243408203125, 1.37176513671875, 1.450286865234375, 1.52880859375, 1.607330322265625, 1.68585205078125, 1.764373779296875, 1.8428955078125, 1.921417236328125, 1.99993896484375, 2.078460693359375, 2.156982421875, 2.235504150390625, 2.31402587890625, 2.392547607421875, 2.4710693359375, 2.549591064453125, 2.62811279296875, 2.706634521484375, 2.78515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 8.0, 19.0, 22.0, 56.0, 73.0, 146.0, 290.0, 566.0, 1208.0, 3075.0, 8936.0, 34378.0, 268876.0, 3675619.0, 162703.0, 26301.0, 7254.0, 2602.0, 1011.0, 546.0, 265.0, 119.0, 57.0, 44.0, 28.0, 26.0, 14.0, 10.0, 5.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.71875, -14.2781982421875, -13.837646484375, -13.3970947265625, -12.95654296875, -12.5159912109375, -12.075439453125, -11.6348876953125, -11.1943359375, -10.7537841796875, -10.313232421875, -9.8726806640625, -9.43212890625, -8.9915771484375, -8.551025390625, -8.1104736328125, -7.669921875, -7.2293701171875, -6.788818359375, -6.3482666015625, -5.90771484375, -5.4671630859375, -5.026611328125, -4.5860595703125, -4.1455078125, -3.7049560546875, -3.264404296875, -2.8238525390625, -2.38330078125, -1.9427490234375, -1.502197265625, -1.0616455078125, -0.62109375, -0.1805419921875, 0.260009765625, 0.7005615234375, 1.14111328125, 1.5816650390625, 2.022216796875, 2.4627685546875, 2.9033203125, 3.3438720703125, 3.784423828125, 4.2249755859375, 4.66552734375, 5.1060791015625, 5.546630859375, 5.9871826171875, 6.427734375, 6.8682861328125, 7.308837890625, 7.7493896484375, 8.18994140625, 8.6304931640625, 9.071044921875, 9.5115966796875, 9.9521484375, 10.3927001953125, 10.833251953125, 11.2738037109375, 11.71435546875, 12.1549072265625, 12.595458984375, 13.0360107421875, 13.4765625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 12.0, 4.0, 13.0, 29.0, 38.0, 57.0, 98.0, 210.0, 531.0, 1961.0, 595.0, 208.0, 107.0, 73.0, 30.0, 23.0, 17.0, 16.0, 10.0, 10.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.62109375, -6.42376708984375, -6.2264404296875, -6.02911376953125, -5.831787109375, -5.63446044921875, -5.4371337890625, -5.23980712890625, -5.04248046875, -4.84515380859375, -4.6478271484375, -4.45050048828125, -4.253173828125, -4.05584716796875, -3.8585205078125, -3.66119384765625, -3.4638671875, -3.26654052734375, -3.0692138671875, -2.87188720703125, -2.674560546875, -2.47723388671875, -2.2799072265625, -2.08258056640625, -1.88525390625, -1.68792724609375, -1.4906005859375, -1.29327392578125, -1.095947265625, -0.89862060546875, -0.7012939453125, -0.50396728515625, -0.306640625, -0.10931396484375, 0.0880126953125, 0.28533935546875, 0.482666015625, 0.67999267578125, 0.8773193359375, 1.07464599609375, 1.27197265625, 1.46929931640625, 1.6666259765625, 1.86395263671875, 2.061279296875, 2.25860595703125, 2.4559326171875, 2.65325927734375, 2.8505859375, 3.04791259765625, 3.2452392578125, 3.44256591796875, 3.639892578125, 3.83721923828125, 4.0345458984375, 4.23187255859375, 4.42919921875, 4.62652587890625, 4.8238525390625, 5.02117919921875, 5.218505859375, 5.41583251953125, 5.6131591796875, 5.81048583984375, 6.0078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 6.0, 20.0, 115.0, 372.0, 325.0, 130.0, 26.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.631507873535156, -33.263099670410156, -29.894695281982422, -26.526287078857422, -23.157880783081055, -19.789474487304688, -16.421066284179688, -13.05265998840332, -9.684253692626953, -6.315846920013428, -2.9474401473999023, 0.42096710205078125, 3.7893733978271484, 7.157779693603516, 10.526187896728516, 13.894594192504883, 17.26300048828125, 20.631406784057617, 23.999813079833984, 27.368221282958984, 30.73662757873535, 34.10503387451172, 37.47344207763672, 40.84185028076172, 44.21025466918945, 47.57866287231445, 50.94706726074219, 54.31547546386719, 57.68388366699219, 61.05228805541992, 64.42070007324219, 67.78910064697266, 71.15751647949219, 74.52592468261719, 77.89433288574219, 81.26274108886719, 84.63114166259766, 87.99954986572266, 91.36795806884766, 94.73636627197266, 98.10476684570312, 101.47317504882812, 104.84158325195312, 108.20999145507812, 111.5783920288086, 114.9468002319336, 118.3152084350586, 121.6836166381836, 125.0520248413086, 128.42042541503906, 131.78883361816406, 135.15724182128906, 138.52565002441406, 141.89405822753906, 145.26246643066406, 148.63087463378906, 151.99928283691406, 155.36769104003906, 158.73609924316406, 162.10450744628906, 165.47291564941406, 168.84130859375, 172.209716796875, 175.578125, 178.946533203125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 11.0, 6.0, 14.0, 31.0, 32.0, 33.0, 35.0, 66.0, 69.0, 92.0, 79.0, 75.0, 94.0, 85.0, 61.0, 52.0, 40.0, 46.0, 32.0, 21.0, 7.0, 10.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.76951599121094, -31.815479278564453, -30.86144256591797, -29.907405853271484, -28.953371047973633, -27.99933433532715, -27.045297622680664, -26.09126091003418, -25.137224197387695, -24.18318748474121, -23.229150772094727, -22.275115966796875, -21.32107925415039, -20.367042541503906, -19.413005828857422, -18.458969116210938, -17.504932403564453, -16.55089569091797, -15.5968599319458, -14.642823219299316, -13.688786506652832, -12.734750747680664, -11.78071403503418, -10.826677322387695, -9.872642517089844, -8.91860580444336, -7.964569568634033, -7.010533332824707, -6.056496620178223, -5.1024603843688965, -4.14842414855957, -3.194387435913086, -2.2403507232666016, -1.2863142490386963, -0.33227789402008057, 0.6217584609985352, 1.5757949352264404, 2.5298314094543457, 3.483867645263672, 4.437904357910156, 5.391940593719482, 6.345976829528809, 7.300013542175293, 8.254049301147461, 9.208086013793945, 10.16212272644043, 11.116159439086914, 12.070196151733398, 13.024231910705566, 13.97826862335205, 14.932304382324219, 15.886341094970703, 16.840377807617188, 17.794414520263672, 18.748451232910156, 19.70248794555664, 20.656522750854492, 21.610559463500977, 22.56459617614746, 23.518630981445312, 24.472667694091797, 25.42670440673828, 26.380741119384766, 27.33477783203125, 28.288814544677734]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 11.0, 12.0, 22.0, 24.0, 43.0, 77.0, 103.0, 137.0, 224.0, 346.0, 578.0, 1037.0, 1755.0, 3352.0, 6979.0, 15394.0, 35632.0, 89018.0, 207653.0, 315256.0, 212197.0, 91190.0, 36956.0, 15451.0, 7008.0, 3459.0, 1898.0, 1033.0, 623.0, 394.0, 232.0, 160.0, 104.0, 54.0, 52.0, 36.0, 22.0, 10.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.32855224609375, -6.1141357421875, -5.89971923828125, -5.685302734375, -5.47088623046875, -5.2564697265625, -5.04205322265625, -4.82763671875, -4.61322021484375, -4.3988037109375, -4.18438720703125, -3.969970703125, -3.75555419921875, -3.5411376953125, -3.32672119140625, -3.1123046875, -2.89788818359375, -2.6834716796875, -2.46905517578125, -2.254638671875, -2.04022216796875, -1.8258056640625, -1.61138916015625, -1.39697265625, -1.18255615234375, -0.9681396484375, -0.75372314453125, -0.539306640625, -0.32489013671875, -0.1104736328125, 0.10394287109375, 0.318359375, 0.53277587890625, 0.7471923828125, 0.96160888671875, 1.176025390625, 1.39044189453125, 1.6048583984375, 1.81927490234375, 2.03369140625, 2.24810791015625, 2.4625244140625, 2.67694091796875, 2.891357421875, 3.10577392578125, 3.3201904296875, 3.53460693359375, 3.7490234375, 3.96343994140625, 4.1778564453125, 4.39227294921875, 4.606689453125, 4.82110595703125, 5.0355224609375, 5.24993896484375, 5.46435546875, 5.67877197265625, 5.8931884765625, 6.10760498046875, 6.322021484375, 6.53643798828125, 6.7508544921875, 6.96527099609375, 7.1796875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 12.0, 8.0, 8.0, 12.0, 20.0, 30.0, 36.0, 47.0, 37.0, 48.0, 43.0, 50.0, 52.0, 60.0, 44.0, 56.0, 67.0, 55.0, 41.0, 33.0, 36.0, 39.0, 31.0, 35.0, 20.0, 18.0, 13.0, 7.0, 10.0, 5.0, 9.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.521484375, -2.439300537109375, -2.35711669921875, -2.274932861328125, -2.1927490234375, -2.110565185546875, -2.02838134765625, -1.946197509765625, -1.864013671875, -1.781829833984375, -1.69964599609375, -1.617462158203125, -1.5352783203125, -1.453094482421875, -1.37091064453125, -1.288726806640625, -1.20654296875, -1.124359130859375, -1.04217529296875, -0.959991455078125, -0.8778076171875, -0.795623779296875, -0.71343994140625, -0.631256103515625, -0.549072265625, -0.466888427734375, -0.38470458984375, -0.302520751953125, -0.2203369140625, -0.138153076171875, -0.05596923828125, 0.026214599609375, 0.1083984375, 0.190582275390625, 0.27276611328125, 0.354949951171875, 0.4371337890625, 0.519317626953125, 0.60150146484375, 0.683685302734375, 0.765869140625, 0.848052978515625, 0.93023681640625, 1.012420654296875, 1.0946044921875, 1.176788330078125, 1.25897216796875, 1.341156005859375, 1.42333984375, 1.505523681640625, 1.58770751953125, 1.669891357421875, 1.7520751953125, 1.834259033203125, 1.91644287109375, 1.998626708984375, 2.080810546875, 2.162994384765625, 2.24517822265625, 2.327362060546875, 2.4095458984375, 2.491729736328125, 2.57391357421875, 2.656097412109375, 2.73828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 4.0, 9.0, 7.0, 5.0, 9.0, 13.0, 18.0, 41.0, 36.0, 76.0, 101.0, 203.0, 295.0, 490.0, 984.0, 2942.0, 18005.0, 213647.0, 707645.0, 90896.0, 9276.0, 1974.0, 760.0, 401.0, 247.0, 145.0, 111.0, 71.0, 42.0, 33.0, 26.0, 9.0, 12.0, 4.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.328125, -16.808349609375, -16.28857421875, -15.768798828125, -15.2490234375, -14.729248046875, -14.20947265625, -13.689697265625, -13.169921875, -12.650146484375, -12.13037109375, -11.610595703125, -11.0908203125, -10.571044921875, -10.05126953125, -9.531494140625, -9.01171875, -8.491943359375, -7.97216796875, -7.452392578125, -6.9326171875, -6.412841796875, -5.89306640625, -5.373291015625, -4.853515625, -4.333740234375, -3.81396484375, -3.294189453125, -2.7744140625, -2.254638671875, -1.73486328125, -1.215087890625, -0.6953125, -0.175537109375, 0.34423828125, 0.864013671875, 1.3837890625, 1.903564453125, 2.42333984375, 2.943115234375, 3.462890625, 3.982666015625, 4.50244140625, 5.022216796875, 5.5419921875, 6.061767578125, 6.58154296875, 7.101318359375, 7.62109375, 8.140869140625, 8.66064453125, 9.180419921875, 9.7001953125, 10.219970703125, 10.73974609375, 11.259521484375, 11.779296875, 12.299072265625, 12.81884765625, 13.338623046875, 13.8583984375, 14.378173828125, 14.89794921875, 15.417724609375, 15.9375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 10.0, 13.0, 10.0, 17.0, 15.0, 14.0, 16.0, 30.0, 38.0, 25.0, 34.0, 30.0, 42.0, 41.0, 51.0, 48.0, 49.0, 44.0, 48.0, 53.0, 49.0, 41.0, 39.0, 40.0, 24.0, 22.0, 29.0, 16.0, 22.0, 14.0, 21.0, 14.0, 5.0, 3.0, 14.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.2890625, -7.9456787109375, -7.602294921875, -7.2589111328125, -6.91552734375, -6.5721435546875, -6.228759765625, -5.8853759765625, -5.5419921875, -5.1986083984375, -4.855224609375, -4.5118408203125, -4.16845703125, -3.8250732421875, -3.481689453125, -3.1383056640625, -2.794921875, -2.4515380859375, -2.108154296875, -1.7647705078125, -1.42138671875, -1.0780029296875, -0.734619140625, -0.3912353515625, -0.0478515625, 0.2955322265625, 0.638916015625, 0.9822998046875, 1.32568359375, 1.6690673828125, 2.012451171875, 2.3558349609375, 2.69921875, 3.0426025390625, 3.385986328125, 3.7293701171875, 4.07275390625, 4.4161376953125, 4.759521484375, 5.1029052734375, 5.4462890625, 5.7896728515625, 6.133056640625, 6.4764404296875, 6.81982421875, 7.1632080078125, 7.506591796875, 7.8499755859375, 8.193359375, 8.5367431640625, 8.880126953125, 9.2235107421875, 9.56689453125, 9.9102783203125, 10.253662109375, 10.5970458984375, 10.9404296875, 11.2838134765625, 11.627197265625, 11.9705810546875, 12.31396484375, 12.6573486328125, 13.000732421875, 13.3441162109375, 13.6875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 2.0, 14.0, 23.0, 37.0, 53.0, 87.0, 178.0, 427.0, 1316.0, 4506.0, 24687.0, 203171.0, 644070.0, 146204.0, 18193.0, 3744.0, 1074.0, 393.0, 162.0, 79.0, 47.0, 28.0, 21.0, 9.0, 12.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40625, -6.1956787109375, -5.985107421875, -5.7745361328125, -5.56396484375, -5.3533935546875, -5.142822265625, -4.9322509765625, -4.7216796875, -4.5111083984375, -4.300537109375, -4.0899658203125, -3.87939453125, -3.6688232421875, -3.458251953125, -3.2476806640625, -3.037109375, -2.8265380859375, -2.615966796875, -2.4053955078125, -2.19482421875, -1.9842529296875, -1.773681640625, -1.5631103515625, -1.3525390625, -1.1419677734375, -0.931396484375, -0.7208251953125, -0.51025390625, -0.2996826171875, -0.089111328125, 0.1214599609375, 0.33203125, 0.5426025390625, 0.753173828125, 0.9637451171875, 1.17431640625, 1.3848876953125, 1.595458984375, 1.8060302734375, 2.0166015625, 2.2271728515625, 2.437744140625, 2.6483154296875, 2.85888671875, 3.0694580078125, 3.280029296875, 3.4906005859375, 3.701171875, 3.9117431640625, 4.122314453125, 4.3328857421875, 4.54345703125, 4.7540283203125, 4.964599609375, 5.1751708984375, 5.3857421875, 5.5963134765625, 5.806884765625, 6.0174560546875, 6.22802734375, 6.4385986328125, 6.649169921875, 6.8597412109375, 7.0703125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 9.0, 6.0, 10.0, 6.0, 9.0, 20.0, 24.0, 41.0, 25.0, 34.0, 49.0, 74.0, 72.0, 89.0, 74.0, 86.0, 87.0, 65.0, 46.0, 50.0, 32.0, 18.0, 23.0, 7.0, 8.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006055831909179688, -0.0005872100591659546, -0.0005688369274139404, -0.0005504637956619263, -0.0005320906639099121, -0.000513717532157898, -0.0004953444004058838, -0.00047697126865386963, -0.00045859813690185547, -0.0004402250051498413, -0.00042185187339782715, -0.000403478741645813, -0.00038510560989379883, -0.00036673247814178467, -0.0003483593463897705, -0.00032998621463775635, -0.0003116130828857422, -0.00029323995113372803, -0.00027486681938171387, -0.0002564936876296997, -0.00023812055587768555, -0.0002197474241256714, -0.00020137429237365723, -0.00018300116062164307, -0.0001646280288696289, -0.00014625489711761475, -0.00012788176536560059, -0.00010950863361358643, -9.113550186157227e-05, -7.27623701095581e-05, -5.4389238357543945e-05, -3.6016106605529785e-05, -1.7642974853515625e-05, 7.301568984985352e-07, 1.9103288650512695e-05, 3.7476420402526855e-05, 5.5849552154541016e-05, 7.422268390655518e-05, 9.259581565856934e-05, 0.0001109689474105835, 0.00012934207916259766, 0.00014771521091461182, 0.00016608834266662598, 0.00018446147441864014, 0.0002028346061706543, 0.00022120773792266846, 0.00023958086967468262, 0.0002579540014266968, 0.00027632713317871094, 0.0002947002649307251, 0.00031307339668273926, 0.0003314465284347534, 0.0003498196601867676, 0.00036819279193878174, 0.0003865659236907959, 0.00040493905544281006, 0.0004233121871948242, 0.0004416853189468384, 0.00046005845069885254, 0.0004784315824508667, 0.0004968047142028809, 0.000515177845954895, 0.0005335509777069092, 0.0005519241094589233, 0.0005702972412109375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 10.0, 8.0, 14.0, 13.0, 24.0, 28.0, 45.0, 59.0, 88.0, 115.0, 201.0, 301.0, 589.0, 1089.0, 2569.0, 6921.0, 24351.0, 114867.0, 459856.0, 339553.0, 72001.0, 16337.0, 5141.0, 2055.0, 968.0, 518.0, 302.0, 159.0, 103.0, 63.0, 43.0, 41.0, 29.0, 27.0, 14.0, 18.0, 9.0, 10.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.9375, -5.77191162109375, -5.6063232421875, -5.44073486328125, -5.275146484375, -5.10955810546875, -4.9439697265625, -4.77838134765625, -4.61279296875, -4.44720458984375, -4.2816162109375, -4.11602783203125, -3.950439453125, -3.78485107421875, -3.6192626953125, -3.45367431640625, -3.2880859375, -3.12249755859375, -2.9569091796875, -2.79132080078125, -2.625732421875, -2.46014404296875, -2.2945556640625, -2.12896728515625, -1.96337890625, -1.79779052734375, -1.6322021484375, -1.46661376953125, -1.301025390625, -1.13543701171875, -0.9698486328125, -0.80426025390625, -0.638671875, -0.47308349609375, -0.3074951171875, -0.14190673828125, 0.023681640625, 0.18927001953125, 0.3548583984375, 0.52044677734375, 0.68603515625, 0.85162353515625, 1.0172119140625, 1.18280029296875, 1.348388671875, 1.51397705078125, 1.6795654296875, 1.84515380859375, 2.0107421875, 2.17633056640625, 2.3419189453125, 2.50750732421875, 2.673095703125, 2.83868408203125, 3.0042724609375, 3.16986083984375, 3.33544921875, 3.50103759765625, 3.6666259765625, 3.83221435546875, 3.997802734375, 4.16339111328125, 4.3289794921875, 4.49456787109375, 4.66015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 10.0, 7.0, 17.0, 12.0, 14.0, 25.0, 32.0, 35.0, 48.0, 54.0, 54.0, 61.0, 73.0, 71.0, 75.0, 66.0, 68.0, 40.0, 32.0, 28.0, 36.0, 27.0, 18.0, 16.0, 19.0, 16.0, 6.0, 7.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.74609375, -3.630462646484375, -3.51483154296875, -3.399200439453125, -3.2835693359375, -3.167938232421875, -3.05230712890625, -2.936676025390625, -2.821044921875, -2.705413818359375, -2.58978271484375, -2.474151611328125, -2.3585205078125, -2.242889404296875, -2.12725830078125, -2.011627197265625, -1.89599609375, -1.780364990234375, -1.66473388671875, -1.549102783203125, -1.4334716796875, -1.317840576171875, -1.20220947265625, -1.086578369140625, -0.970947265625, -0.855316162109375, -0.73968505859375, -0.624053955078125, -0.5084228515625, -0.392791748046875, -0.27716064453125, -0.161529541015625, -0.0458984375, 0.069732666015625, 0.18536376953125, 0.300994873046875, 0.4166259765625, 0.532257080078125, 0.64788818359375, 0.763519287109375, 0.879150390625, 0.994781494140625, 1.11041259765625, 1.226043701171875, 1.3416748046875, 1.457305908203125, 1.57293701171875, 1.688568115234375, 1.80419921875, 1.919830322265625, 2.03546142578125, 2.151092529296875, 2.2667236328125, 2.382354736328125, 2.49798583984375, 2.613616943359375, 2.729248046875, 2.844879150390625, 2.96051025390625, 3.076141357421875, 3.1917724609375, 3.307403564453125, 3.42303466796875, 3.538665771484375, 3.654296875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 12.0, 13.0, 29.0, 52.0, 82.0, 123.0, 139.0, 161.0, 136.0, 100.0, 64.0, 35.0, 18.0, 12.0, 11.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.71430206298828, -40.204185485839844, -37.69406509399414, -35.1839485168457, -32.673828125, -30.163711547851562, -27.653594970703125, -25.143476486206055, -22.633358001708984, -20.123239517211914, -17.613121032714844, -15.103004455566406, -12.592885971069336, -10.082767486572266, -7.572649955749512, -5.062532424926758, -2.5524139404296875, -0.04229593276977539, 2.4678220748901367, 4.977940082550049, 7.488058090209961, 9.998176574707031, 12.508294105529785, 15.018411636352539, 17.52853012084961, 20.03864860534668, 22.54876708984375, 25.058883666992188, 27.569002151489258, 30.079120635986328, 32.589237213134766, 35.09935760498047, 37.60948181152344, 40.119598388671875, 42.62971878051758, 45.139835357666016, 47.64995574951172, 50.160072326660156, 52.670188903808594, 55.18030548095703, 57.690425872802734, 60.20054244995117, 62.710662841796875, 65.22077941894531, 67.73089599609375, 70.24101257324219, 72.75113677978516, 75.2612533569336, 77.77136993408203, 80.28148651123047, 82.7916030883789, 85.30172729492188, 87.81184387207031, 90.32196044921875, 92.83207702636719, 95.34219360351562, 97.85231018066406, 100.3624267578125, 102.87254333496094, 105.3826675415039, 107.89278411865234, 110.40290069580078, 112.91301727294922, 115.42313385009766, 117.93325805664062]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 7.0, 5.0, 5.0, 9.0, 8.0, 15.0, 10.0, 12.0, 16.0, 17.0, 22.0, 22.0, 18.0, 15.0, 28.0, 26.0, 39.0, 35.0, 30.0, 35.0, 35.0, 30.0, 37.0, 34.0, 48.0, 37.0, 48.0, 31.0, 35.0, 39.0, 34.0, 27.0, 17.0, 28.0, 25.0, 21.0, 13.0, 15.0, 16.0, 7.0, 7.0, 8.0, 8.0, 7.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-39.200836181640625, -37.87001037597656, -36.5391845703125, -35.20835876464844, -33.877532958984375, -32.54670333862305, -31.215877532958984, -29.885051727294922, -28.55422592163086, -27.223400115966797, -25.892574310302734, -24.56174659729004, -23.230920791625977, -21.900094985961914, -20.56926727294922, -19.238441467285156, -17.907615661621094, -16.57678985595703, -15.245963096618652, -13.915136337280273, -12.584310531616211, -11.253484725952148, -9.92265796661377, -8.59183120727539, -7.261005401611328, -5.930179119110107, -4.599352836608887, -3.268526554107666, -1.9377002716064453, -0.6068739891052246, 0.7239522933959961, 2.054779052734375, 3.385608673095703, 4.716434955596924, 6.0472612380981445, 7.378087520599365, 8.708913803100586, 10.039739608764648, 11.370566368103027, 12.701393127441406, 14.032218933105469, 15.363044738769531, 16.693870544433594, 18.02469825744629, 19.35552406311035, 20.686349868774414, 22.01717758178711, 23.348003387451172, 24.678829193115234, 26.009654998779297, 27.34048080444336, 28.671308517456055, 30.002134323120117, 31.33296012878418, 32.663787841796875, 33.99461364746094, 35.325439453125, 36.65626525878906, 37.987091064453125, 39.31791687011719, 40.64874267578125, 41.97957229614258, 43.31039810180664, 44.6412239074707, 45.972049713134766]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 7.0, 3.0, 3.0, 4.0, 5.0, 5.0, 4.0, 10.0, 6.0, 8.0, 5.0, 20.0, 24.0, 23.0, 39.0, 68.0, 126.0, 193.0, 288.0, 476.0, 903.0, 1767.0, 4183.0, 17892.0, 3871957.0, 277662.0, 11633.0, 3429.0, 1522.0, 838.0, 462.0, 261.0, 159.0, 104.0, 59.0, 43.0, 26.0, 24.0, 11.0, 10.0, 8.0, 5.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.078125, -23.42529296875, -22.7724609375, -22.11962890625, -21.466796875, -20.81396484375, -20.1611328125, -19.50830078125, -18.85546875, -18.20263671875, -17.5498046875, -16.89697265625, -16.244140625, -15.59130859375, -14.9384765625, -14.28564453125, -13.6328125, -12.97998046875, -12.3271484375, -11.67431640625, -11.021484375, -10.36865234375, -9.7158203125, -9.06298828125, -8.41015625, -7.75732421875, -7.1044921875, -6.45166015625, -5.798828125, -5.14599609375, -4.4931640625, -3.84033203125, -3.1875, -2.53466796875, -1.8818359375, -1.22900390625, -0.576171875, 0.07666015625, 0.7294921875, 1.38232421875, 2.03515625, 2.68798828125, 3.3408203125, 3.99365234375, 4.646484375, 5.29931640625, 5.9521484375, 6.60498046875, 7.2578125, 7.91064453125, 8.5634765625, 9.21630859375, 9.869140625, 10.52197265625, 11.1748046875, 11.82763671875, 12.48046875, 13.13330078125, 13.7861328125, 14.43896484375, 15.091796875, 15.74462890625, 16.3974609375, 17.05029296875, 17.703125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 10.0, 3.0, 2.0, 8.0, 9.0, 10.0, 11.0, 14.0, 29.0, 24.0, 31.0, 40.0, 45.0, 40.0, 60.0, 59.0, 42.0, 36.0, 53.0, 55.0, 37.0, 38.0, 50.0, 47.0, 32.0, 35.0, 41.0, 23.0, 26.0, 16.0, 14.0, 21.0, 10.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5, -2.412567138671875, -2.32513427734375, -2.237701416015625, -2.1502685546875, -2.062835693359375, -1.97540283203125, -1.887969970703125, -1.800537109375, -1.713104248046875, -1.62567138671875, -1.538238525390625, -1.4508056640625, -1.363372802734375, -1.27593994140625, -1.188507080078125, -1.10107421875, -1.013641357421875, -0.92620849609375, -0.838775634765625, -0.7513427734375, -0.663909912109375, -0.57647705078125, -0.489044189453125, -0.401611328125, -0.314178466796875, -0.22674560546875, -0.139312744140625, -0.0518798828125, 0.035552978515625, 0.12298583984375, 0.210418701171875, 0.2978515625, 0.385284423828125, 0.47271728515625, 0.560150146484375, 0.6475830078125, 0.735015869140625, 0.82244873046875, 0.909881591796875, 0.997314453125, 1.084747314453125, 1.17218017578125, 1.259613037109375, 1.3470458984375, 1.434478759765625, 1.52191162109375, 1.609344482421875, 1.69677734375, 1.784210205078125, 1.87164306640625, 1.959075927734375, 2.0465087890625, 2.133941650390625, 2.22137451171875, 2.308807373046875, 2.396240234375, 2.483673095703125, 2.57110595703125, 2.658538818359375, 2.7459716796875, 2.833404541015625, 2.92083740234375, 3.008270263671875, 3.095703125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 5.0, 18.0, 12.0, 19.0, 18.0, 38.0, 27.0, 46.0, 54.0, 76.0, 102.0, 122.0, 213.0, 283.0, 410.0, 591.0, 874.0, 1285.0, 2166.0, 3966.0, 9362.0, 42180.0, 3922743.0, 179137.0, 16640.0, 5908.0, 2864.0, 1658.0, 1042.0, 739.0, 456.0, 339.0, 230.0, 156.0, 129.0, 87.0, 72.0, 64.0, 44.0, 25.0, 24.0, 19.0, 10.0, 8.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.5078125, -13.068359375, -12.62890625, -12.189453125, -11.75, -11.310546875, -10.87109375, -10.431640625, -9.9921875, -9.552734375, -9.11328125, -8.673828125, -8.234375, -7.794921875, -7.35546875, -6.916015625, -6.4765625, -6.037109375, -5.59765625, -5.158203125, -4.71875, -4.279296875, -3.83984375, -3.400390625, -2.9609375, -2.521484375, -2.08203125, -1.642578125, -1.203125, -0.763671875, -0.32421875, 0.115234375, 0.5546875, 0.994140625, 1.43359375, 1.873046875, 2.3125, 2.751953125, 3.19140625, 3.630859375, 4.0703125, 4.509765625, 4.94921875, 5.388671875, 5.828125, 6.267578125, 6.70703125, 7.146484375, 7.5859375, 8.025390625, 8.46484375, 8.904296875, 9.34375, 9.783203125, 10.22265625, 10.662109375, 11.1015625, 11.541015625, 11.98046875, 12.419921875, 12.859375, 13.298828125, 13.73828125, 14.177734375, 14.6171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 12.0, 8.0, 20.0, 40.0, 133.0, 895.0, 2746.0, 122.0, 37.0, 16.0, 18.0, 9.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7578125, -3.6441650390625, -3.530517578125, -3.4168701171875, -3.30322265625, -3.1895751953125, -3.075927734375, -2.9622802734375, -2.8486328125, -2.7349853515625, -2.621337890625, -2.5076904296875, -2.39404296875, -2.2803955078125, -2.166748046875, -2.0531005859375, -1.939453125, -1.8258056640625, -1.712158203125, -1.5985107421875, -1.48486328125, -1.3712158203125, -1.257568359375, -1.1439208984375, -1.0302734375, -0.9166259765625, -0.802978515625, -0.6893310546875, -0.57568359375, -0.4620361328125, -0.348388671875, -0.2347412109375, -0.12109375, -0.0074462890625, 0.106201171875, 0.2198486328125, 0.33349609375, 0.4471435546875, 0.560791015625, 0.6744384765625, 0.7880859375, 0.9017333984375, 1.015380859375, 1.1290283203125, 1.24267578125, 1.3563232421875, 1.469970703125, 1.5836181640625, 1.697265625, 1.8109130859375, 1.924560546875, 2.0382080078125, 2.15185546875, 2.2655029296875, 2.379150390625, 2.4927978515625, 2.6064453125, 2.7200927734375, 2.833740234375, 2.9473876953125, 3.06103515625, 3.1746826171875, 3.288330078125, 3.4019775390625, 3.515625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 9.0, 11.0, 21.0, 32.0, 34.0, 45.0, 91.0, 104.0, 119.0, 124.0, 123.0, 80.0, 70.0, 44.0, 31.0, 17.0, 12.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.334512710571289, -14.933136940002441, -14.53176212310791, -14.130386352539062, -13.729011535644531, -13.327635765075684, -12.926259994506836, -12.524885177612305, -12.123509407043457, -11.72213363647461, -11.320758819580078, -10.91938304901123, -10.518007278442383, -10.116632461547852, -9.715256690979004, -9.313880920410156, -8.912506103515625, -8.511130332946777, -8.109755516052246, -7.708379745483398, -7.307004451751709, -6.9056291580200195, -6.504253387451172, -6.102878093719482, -5.701502799987793, -5.3001275062561035, -4.898752212524414, -4.497376441955566, -4.096001148223877, -3.6946258544921875, -3.293250322341919, -2.8918747901916504, -2.490499496459961, -2.0891242027282715, -1.687748670578003, -1.286373257637024, -0.8849978446960449, -0.48362255096435547, -0.08224701881408691, 0.31912851333618164, 0.7205038070678711, 1.12187922000885, 1.523254632949829, 1.924630045890808, 2.326005458831787, 2.7273807525634766, 3.128756284713745, 3.5301318168640137, 3.931507110595703, 4.332882404327393, 4.734257698059082, 5.13563346862793, 5.537008762359619, 5.938384056091309, 6.339759826660156, 6.741135120391846, 7.142510414123535, 7.543885707855225, 7.945261001586914, 8.346636772155762, 8.74801254272461, 9.14938735961914, 9.550763130187988, 9.952138900756836, 10.353513717651367]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 8.0, 4.0, 5.0, 8.0, 10.0, 5.0, 10.0, 8.0, 13.0, 14.0, 19.0, 24.0, 24.0, 27.0, 36.0, 23.0, 30.0, 26.0, 37.0, 46.0, 42.0, 33.0, 38.0, 41.0, 51.0, 46.0, 31.0, 42.0, 38.0, 34.0, 22.0, 30.0, 27.0, 23.0, 22.0, 16.0, 18.0, 15.0, 15.0, 10.0, 7.0, 11.0, 5.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.004422187805176, -4.831449508666992, -4.658477306365967, -4.485504627227783, -4.3125319480896, -4.139559745788574, -3.9665870666503906, -3.793614387512207, -3.6206419467926025, -3.447669506072998, -3.2746968269348145, -3.10172438621521, -2.9287519454956055, -2.755779266357422, -2.5828068256378174, -2.409834384918213, -2.2368617057800293, -2.063889265060425, -1.8909165859222412, -1.7179441452026367, -1.5449715852737427, -1.3719990253448486, -1.1990265846252441, -1.02605402469635, -0.853081464767456, -0.680108904838562, -0.5071364045143127, -0.3341639041900635, -0.16119134426116943, 0.01178121566772461, 0.1847536563873291, 0.35772621631622314, 0.5306987762451172, 0.7036713361740112, 0.8766438364982605, 1.0496163368225098, 1.2225888967514038, 1.3955614566802979, 1.5685338973999023, 1.7415064573287964, 1.9144790172576904, 2.087451457977295, 2.2604241371154785, 2.433396577835083, 2.6063690185546875, 2.779341697692871, 2.9523141384124756, 3.12528657913208, 3.2982592582702637, 3.471231698989868, 3.6442043781280518, 3.8171768188476562, 3.99014949798584, 4.163122177124023, 4.336094379425049, 4.509067058563232, 4.682039260864258, 4.855011940002441, 5.027984142303467, 5.20095682144165, 5.373929500579834, 5.546901702880859, 5.719874382019043, 5.892847061157227, 6.06581974029541]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 4.0, 13.0, 22.0, 25.0, 31.0, 47.0, 69.0, 94.0, 117.0, 229.0, 321.0, 550.0, 998.0, 1819.0, 3225.0, 6429.0, 13057.0, 28116.0, 62646.0, 135655.0, 241826.0, 257791.0, 156939.0, 74168.0, 33106.0, 15276.0, 7365.0, 3773.0, 1946.0, 1074.0, 649.0, 398.0, 267.0, 161.0, 105.0, 75.0, 45.0, 30.0, 23.0, 15.0, 19.0, 9.0, 10.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.51171875, -6.29541015625, -6.0791015625, -5.86279296875, -5.646484375, -5.43017578125, -5.2138671875, -4.99755859375, -4.78125, -4.56494140625, -4.3486328125, -4.13232421875, -3.916015625, -3.69970703125, -3.4833984375, -3.26708984375, -3.05078125, -2.83447265625, -2.6181640625, -2.40185546875, -2.185546875, -1.96923828125, -1.7529296875, -1.53662109375, -1.3203125, -1.10400390625, -0.8876953125, -0.67138671875, -0.455078125, -0.23876953125, -0.0224609375, 0.19384765625, 0.41015625, 0.62646484375, 0.8427734375, 1.05908203125, 1.275390625, 1.49169921875, 1.7080078125, 1.92431640625, 2.140625, 2.35693359375, 2.5732421875, 2.78955078125, 3.005859375, 3.22216796875, 3.4384765625, 3.65478515625, 3.87109375, 4.08740234375, 4.3037109375, 4.52001953125, 4.736328125, 4.95263671875, 5.1689453125, 5.38525390625, 5.6015625, 5.81787109375, 6.0341796875, 6.25048828125, 6.466796875, 6.68310546875, 6.8994140625, 7.11572265625, 7.33203125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 6.0, 4.0, 7.0, 6.0, 12.0, 12.0, 14.0, 17.0, 25.0, 26.0, 38.0, 24.0, 47.0, 41.0, 44.0, 48.0, 47.0, 59.0, 65.0, 41.0, 37.0, 39.0, 37.0, 41.0, 45.0, 32.0, 17.0, 30.0, 28.0, 25.0, 20.0, 17.0, 6.0, 9.0, 6.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.59375, -2.50299072265625, -2.4122314453125, -2.32147216796875, -2.230712890625, -2.13995361328125, -2.0491943359375, -1.95843505859375, -1.86767578125, -1.77691650390625, -1.6861572265625, -1.59539794921875, -1.504638671875, -1.41387939453125, -1.3231201171875, -1.23236083984375, -1.1416015625, -1.05084228515625, -0.9600830078125, -0.86932373046875, -0.778564453125, -0.68780517578125, -0.5970458984375, -0.50628662109375, -0.41552734375, -0.32476806640625, -0.2340087890625, -0.14324951171875, -0.052490234375, 0.03826904296875, 0.1290283203125, 0.21978759765625, 0.310546875, 0.40130615234375, 0.4920654296875, 0.58282470703125, 0.673583984375, 0.76434326171875, 0.8551025390625, 0.94586181640625, 1.03662109375, 1.12738037109375, 1.2181396484375, 1.30889892578125, 1.399658203125, 1.49041748046875, 1.5811767578125, 1.67193603515625, 1.7626953125, 1.85345458984375, 1.9442138671875, 2.03497314453125, 2.125732421875, 2.21649169921875, 2.3072509765625, 2.39801025390625, 2.48876953125, 2.57952880859375, 2.6702880859375, 2.76104736328125, 2.851806640625, 2.94256591796875, 3.0333251953125, 3.12408447265625, 3.21484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 7.0, 5.0, 8.0, 12.0, 10.0, 26.0, 38.0, 60.0, 81.0, 104.0, 153.0, 294.0, 444.0, 888.0, 2663.0, 20285.0, 439386.0, 553597.0, 25263.0, 2969.0, 969.0, 443.0, 261.0, 185.0, 120.0, 82.0, 57.0, 43.0, 31.0, 24.0, 16.0, 14.0, 4.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.015625, -24.28076171875, -23.5458984375, -22.81103515625, -22.076171875, -21.34130859375, -20.6064453125, -19.87158203125, -19.13671875, -18.40185546875, -17.6669921875, -16.93212890625, -16.197265625, -15.46240234375, -14.7275390625, -13.99267578125, -13.2578125, -12.52294921875, -11.7880859375, -11.05322265625, -10.318359375, -9.58349609375, -8.8486328125, -8.11376953125, -7.37890625, -6.64404296875, -5.9091796875, -5.17431640625, -4.439453125, -3.70458984375, -2.9697265625, -2.23486328125, -1.5, -0.76513671875, -0.0302734375, 0.70458984375, 1.439453125, 2.17431640625, 2.9091796875, 3.64404296875, 4.37890625, 5.11376953125, 5.8486328125, 6.58349609375, 7.318359375, 8.05322265625, 8.7880859375, 9.52294921875, 10.2578125, 10.99267578125, 11.7275390625, 12.46240234375, 13.197265625, 13.93212890625, 14.6669921875, 15.40185546875, 16.13671875, 16.87158203125, 17.6064453125, 18.34130859375, 19.076171875, 19.81103515625, 20.5458984375, 21.28076171875, 22.015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 7.0, 5.0, 4.0, 8.0, 8.0, 8.0, 14.0, 14.0, 22.0, 28.0, 33.0, 29.0, 29.0, 31.0, 37.0, 48.0, 53.0, 60.0, 34.0, 48.0, 52.0, 45.0, 43.0, 50.0, 39.0, 46.0, 39.0, 41.0, 20.0, 13.0, 11.0, 19.0, 12.0, 16.0, 10.0, 7.0, 2.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.21875, -14.77490234375, -14.3310546875, -13.88720703125, -13.443359375, -12.99951171875, -12.5556640625, -12.11181640625, -11.66796875, -11.22412109375, -10.7802734375, -10.33642578125, -9.892578125, -9.44873046875, -9.0048828125, -8.56103515625, -8.1171875, -7.67333984375, -7.2294921875, -6.78564453125, -6.341796875, -5.89794921875, -5.4541015625, -5.01025390625, -4.56640625, -4.12255859375, -3.6787109375, -3.23486328125, -2.791015625, -2.34716796875, -1.9033203125, -1.45947265625, -1.015625, -0.57177734375, -0.1279296875, 0.31591796875, 0.759765625, 1.20361328125, 1.6474609375, 2.09130859375, 2.53515625, 2.97900390625, 3.4228515625, 3.86669921875, 4.310546875, 4.75439453125, 5.1982421875, 5.64208984375, 6.0859375, 6.52978515625, 6.9736328125, 7.41748046875, 7.861328125, 8.30517578125, 8.7490234375, 9.19287109375, 9.63671875, 10.08056640625, 10.5244140625, 10.96826171875, 11.412109375, 11.85595703125, 12.2998046875, 12.74365234375, 13.1875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 8.0, 10.0, 19.0, 17.0, 40.0, 61.0, 123.0, 224.0, 480.0, 1136.0, 3619.0, 16625.0, 164169.0, 770415.0, 76960.0, 10354.0, 2585.0, 887.0, 410.0, 173.0, 91.0, 49.0, 41.0, 20.0, 10.0, 13.0, 3.0, 8.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.765625, -10.461181640625, -10.15673828125, -9.852294921875, -9.5478515625, -9.243408203125, -8.93896484375, -8.634521484375, -8.330078125, -8.025634765625, -7.72119140625, -7.416748046875, -7.1123046875, -6.807861328125, -6.50341796875, -6.198974609375, -5.89453125, -5.590087890625, -5.28564453125, -4.981201171875, -4.6767578125, -4.372314453125, -4.06787109375, -3.763427734375, -3.458984375, -3.154541015625, -2.85009765625, -2.545654296875, -2.2412109375, -1.936767578125, -1.63232421875, -1.327880859375, -1.0234375, -0.718994140625, -0.41455078125, -0.110107421875, 0.1943359375, 0.498779296875, 0.80322265625, 1.107666015625, 1.412109375, 1.716552734375, 2.02099609375, 2.325439453125, 2.6298828125, 2.934326171875, 3.23876953125, 3.543212890625, 3.84765625, 4.152099609375, 4.45654296875, 4.760986328125, 5.0654296875, 5.369873046875, 5.67431640625, 5.978759765625, 6.283203125, 6.587646484375, 6.89208984375, 7.196533203125, 7.5009765625, 7.805419921875, 8.10986328125, 8.414306640625, 8.71875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 5.0, 18.0, 32.0, 30.0, 52.0, 74.0, 119.0, 145.0, 134.0, 124.0, 87.0, 55.0, 36.0, 29.0, 22.0, 10.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001255035400390625, -0.0012160241603851318, -0.0011770129203796387, -0.0011380016803741455, -0.0010989904403686523, -0.0010599792003631592, -0.001020967960357666, -0.0009819567203521729, -0.0009429454803466797, -0.0009039342403411865, -0.0008649230003356934, -0.0008259117603302002, -0.000786900520324707, -0.0007478892803192139, -0.0007088780403137207, -0.0006698668003082275, -0.0006308555603027344, -0.0005918443202972412, -0.000552833080291748, -0.0005138218402862549, -0.0004748106002807617, -0.00043579936027526855, -0.0003967881202697754, -0.0003577768802642822, -0.00031876564025878906, -0.0002797544002532959, -0.00024074316024780273, -0.00020173192024230957, -0.0001627206802368164, -0.00012370944023132324, -8.469820022583008e-05, -4.5686960220336914e-05, -6.67572021484375e-06, 3.2335519790649414e-05, 7.134675979614258e-05, 0.00011035799980163574, 0.0001493692398071289, 0.00018838047981262207, 0.00022739171981811523, 0.0002664029598236084, 0.00030541419982910156, 0.0003444254398345947, 0.0003834366798400879, 0.00042244791984558105, 0.0004614591598510742, 0.0005004703998565674, 0.0005394816398620605, 0.0005784928798675537, 0.0006175041198730469, 0.00065651535987854, 0.0006955265998840332, 0.0007345378398895264, 0.0007735490798950195, 0.0008125603199005127, 0.0008515715599060059, 0.000890582799911499, 0.0009295940399169922, 0.0009686052799224854, 0.0010076165199279785, 0.0010466277599334717, 0.0010856389999389648, 0.001124650239944458, 0.0011636614799499512, 0.0012026727199554443, 0.0012416839599609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 12.0, 19.0, 19.0, 21.0, 45.0, 58.0, 83.0, 142.0, 210.0, 434.0, 846.0, 2120.0, 7760.0, 47338.0, 587269.0, 362220.0, 30729.0, 5906.0, 1715.0, 659.0, 367.0, 187.0, 137.0, 66.0, 39.0, 40.0, 23.0, 20.0, 16.0, 11.0, 11.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.7734375, -7.4732666015625, -7.173095703125, -6.8729248046875, -6.57275390625, -6.2725830078125, -5.972412109375, -5.6722412109375, -5.3720703125, -5.0718994140625, -4.771728515625, -4.4715576171875, -4.17138671875, -3.8712158203125, -3.571044921875, -3.2708740234375, -2.970703125, -2.6705322265625, -2.370361328125, -2.0701904296875, -1.77001953125, -1.4698486328125, -1.169677734375, -0.8695068359375, -0.5693359375, -0.2691650390625, 0.031005859375, 0.3311767578125, 0.63134765625, 0.9315185546875, 1.231689453125, 1.5318603515625, 1.83203125, 2.1322021484375, 2.432373046875, 2.7325439453125, 3.03271484375, 3.3328857421875, 3.633056640625, 3.9332275390625, 4.2333984375, 4.5335693359375, 4.833740234375, 5.1339111328125, 5.43408203125, 5.7342529296875, 6.034423828125, 6.3345947265625, 6.634765625, 6.9349365234375, 7.235107421875, 7.5352783203125, 7.83544921875, 8.1356201171875, 8.435791015625, 8.7359619140625, 9.0361328125, 9.3363037109375, 9.636474609375, 9.9366455078125, 10.23681640625, 10.5369873046875, 10.837158203125, 11.1373291015625, 11.4375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 7.0, 9.0, 13.0, 19.0, 20.0, 27.0, 37.0, 51.0, 60.0, 83.0, 82.0, 128.0, 103.0, 85.0, 72.0, 50.0, 38.0, 42.0, 17.0, 19.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.34857177734375, -5.1229248046875, -4.89727783203125, -4.671630859375, -4.44598388671875, -4.2203369140625, -3.99468994140625, -3.76904296875, -3.54339599609375, -3.3177490234375, -3.09210205078125, -2.866455078125, -2.64080810546875, -2.4151611328125, -2.18951416015625, -1.9638671875, -1.73822021484375, -1.5125732421875, -1.28692626953125, -1.061279296875, -0.83563232421875, -0.6099853515625, -0.38433837890625, -0.15869140625, 0.06695556640625, 0.2926025390625, 0.51824951171875, 0.743896484375, 0.96954345703125, 1.1951904296875, 1.42083740234375, 1.646484375, 1.87213134765625, 2.0977783203125, 2.32342529296875, 2.549072265625, 2.77471923828125, 3.0003662109375, 3.22601318359375, 3.45166015625, 3.67730712890625, 3.9029541015625, 4.12860107421875, 4.354248046875, 4.57989501953125, 4.8055419921875, 5.03118896484375, 5.2568359375, 5.48248291015625, 5.7081298828125, 5.93377685546875, 6.159423828125, 6.38507080078125, 6.6107177734375, 6.83636474609375, 7.06201171875, 7.28765869140625, 7.5133056640625, 7.73895263671875, 7.964599609375, 8.19024658203125, 8.4158935546875, 8.64154052734375, 8.8671875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 17.0, 59.0, 146.0, 288.0, 274.0, 140.0, 52.0, 12.0, 10.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-284.8193664550781, -278.4716491699219, -272.12396240234375, -265.7762451171875, -259.42852783203125, -253.08082580566406, -246.73312377929688, -240.38540649414062, -234.03770446777344, -227.69000244140625, -221.34228515625, -214.9945831298828, -208.64688110351562, -202.29916381835938, -195.9514617919922, -189.603759765625, -183.25604248046875, -176.90834045410156, -170.5606231689453, -164.21292114257812, -157.86520385742188, -151.5175018310547, -145.1697998046875, -138.82208251953125, -132.47438049316406, -126.12667083740234, -119.77896118164062, -113.43125915527344, -107.08354949951172, -100.73583984375, -94.38813781738281, -88.0404281616211, -81.69271850585938, -75.34500885009766, -68.99729919433594, -62.64959716796875, -56.30188751220703, -49.95417785644531, -43.60647201538086, -37.258766174316406, -30.911056518554688, -24.5633487701416, -18.215641021728516, -11.86793327331543, -5.520225524902344, 0.8274822235107422, 7.175189971923828, 13.522895812988281, 19.87060546875, 26.218313217163086, 32.56602096557617, 38.913726806640625, 45.261436462402344, 51.60914611816406, 57.956851959228516, 64.30455780029297, 70.65226745605469, 76.9999771118164, 83.34768676757812, 89.69538879394531, 96.04309844970703, 102.39080810546875, 108.73851013183594, 115.08621978759766, 121.43392944335938]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 14.0, 9.0, 8.0, 11.0, 9.0, 12.0, 26.0, 17.0, 26.0, 22.0, 35.0, 35.0, 42.0, 32.0, 40.0, 54.0, 56.0, 41.0, 55.0, 39.0, 50.0, 45.0, 30.0, 33.0, 36.0, 29.0, 25.0, 17.0, 19.0, 27.0, 19.0, 16.0, 7.0, 13.0, 14.0, 7.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.323707580566406, -50.560359954833984, -48.79701232910156, -47.033668518066406, -45.270320892333984, -43.50697326660156, -41.743629455566406, -39.980281829833984, -38.21693420410156, -36.45358657836914, -34.69023895263672, -32.92689514160156, -31.16354751586914, -29.40019989013672, -27.63685417175293, -25.87350845336914, -24.11016082763672, -22.346813201904297, -20.583467483520508, -18.82012176513672, -17.056774139404297, -15.293427467346191, -13.530080795288086, -11.76673412322998, -10.003387451171875, -8.24004077911377, -6.476694107055664, -4.713347434997559, -2.950000762939453, -1.1866540908813477, 0.5766925811767578, 2.3400392532348633, 4.103385925292969, 5.866732597351074, 7.63007926940918, 9.393425941467285, 11.15677261352539, 12.920119285583496, 14.683465957641602, 16.44681167602539, 18.210159301757812, 19.973506927490234, 21.736852645874023, 23.500198364257812, 25.263545989990234, 27.026893615722656, 28.790239334106445, 30.553585052490234, 32.316932678222656, 34.08028030395508, 35.8436279296875, 37.606971740722656, 39.37031936645508, 41.1336669921875, 42.897010803222656, 44.66035842895508, 46.4237060546875, 48.18705368041992, 49.950401306152344, 51.7137451171875, 53.47709274291992, 55.240440368652344, 57.0037841796875, 58.76713180541992, 60.530479431152344]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 9.0, 16.0, 7.0, 3.0, 9.0, 16.0, 30.0, 21.0, 25.0, 49.0, 56.0, 99.0, 167.0, 244.0, 382.0, 613.0, 1040.0, 1925.0, 4327.0, 11614.0, 53580.0, 3868585.0, 216311.0, 21931.0, 6768.0, 2859.0, 1435.0, 748.0, 453.0, 296.0, 198.0, 142.0, 86.0, 66.0, 36.0, 36.0, 25.0, 10.0, 12.0, 10.0, 10.0, 7.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-11.0703125, -10.76904296875, -10.4677734375, -10.16650390625, -9.865234375, -9.56396484375, -9.2626953125, -8.96142578125, -8.66015625, -8.35888671875, -8.0576171875, -7.75634765625, -7.455078125, -7.15380859375, -6.8525390625, -6.55126953125, -6.25, -5.94873046875, -5.6474609375, -5.34619140625, -5.044921875, -4.74365234375, -4.4423828125, -4.14111328125, -3.83984375, -3.53857421875, -3.2373046875, -2.93603515625, -2.634765625, -2.33349609375, -2.0322265625, -1.73095703125, -1.4296875, -1.12841796875, -0.8271484375, -0.52587890625, -0.224609375, 0.07666015625, 0.3779296875, 0.67919921875, 0.98046875, 1.28173828125, 1.5830078125, 1.88427734375, 2.185546875, 2.48681640625, 2.7880859375, 3.08935546875, 3.390625, 3.69189453125, 3.9931640625, 4.29443359375, 4.595703125, 4.89697265625, 5.1982421875, 5.49951171875, 5.80078125, 6.10205078125, 6.4033203125, 6.70458984375, 7.005859375, 7.30712890625, 7.6083984375, 7.90966796875, 8.2109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 11.0, 2.0, 5.0, 5.0, 9.0, 22.0, 20.0, 20.0, 26.0, 27.0, 28.0, 36.0, 35.0, 40.0, 55.0, 50.0, 53.0, 46.0, 44.0, 44.0, 45.0, 51.0, 44.0, 44.0, 43.0, 40.0, 26.0, 21.0, 23.0, 14.0, 17.0, 16.0, 4.0, 8.0, 8.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.5440673828125, -2.453369140625, -2.3626708984375, -2.27197265625, -2.1812744140625, -2.090576171875, -1.9998779296875, -1.9091796875, -1.8184814453125, -1.727783203125, -1.6370849609375, -1.54638671875, -1.4556884765625, -1.364990234375, -1.2742919921875, -1.18359375, -1.0928955078125, -1.002197265625, -0.9114990234375, -0.82080078125, -0.7301025390625, -0.639404296875, -0.5487060546875, -0.4580078125, -0.3673095703125, -0.276611328125, -0.1859130859375, -0.09521484375, -0.0045166015625, 0.086181640625, 0.1768798828125, 0.267578125, 0.3582763671875, 0.448974609375, 0.5396728515625, 0.63037109375, 0.7210693359375, 0.811767578125, 0.9024658203125, 0.9931640625, 1.0838623046875, 1.174560546875, 1.2652587890625, 1.35595703125, 1.4466552734375, 1.537353515625, 1.6280517578125, 1.71875, 1.8094482421875, 1.900146484375, 1.9908447265625, 2.08154296875, 2.1722412109375, 2.262939453125, 2.3536376953125, 2.4443359375, 2.5350341796875, 2.625732421875, 2.7164306640625, 2.80712890625, 2.8978271484375, 2.988525390625, 3.0792236328125, 3.169921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 6.0, 5.0, 14.0, 17.0, 24.0, 33.0, 33.0, 60.0, 75.0, 106.0, 159.0, 220.0, 323.0, 461.0, 664.0, 1031.0, 1701.0, 3277.0, 6900.0, 22571.0, 277419.0, 3813732.0, 44873.0, 10513.0, 4214.0, 2209.0, 1207.0, 756.0, 492.0, 338.0, 240.0, 183.0, 129.0, 82.0, 53.0, 48.0, 25.0, 27.0, 24.0, 18.0, 7.0, 7.0, 2.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.859375, -11.5125732421875, -11.165771484375, -10.8189697265625, -10.47216796875, -10.1253662109375, -9.778564453125, -9.4317626953125, -9.0849609375, -8.7381591796875, -8.391357421875, -8.0445556640625, -7.69775390625, -7.3509521484375, -7.004150390625, -6.6573486328125, -6.310546875, -5.9637451171875, -5.616943359375, -5.2701416015625, -4.92333984375, -4.5765380859375, -4.229736328125, -3.8829345703125, -3.5361328125, -3.1893310546875, -2.842529296875, -2.4957275390625, -2.14892578125, -1.8021240234375, -1.455322265625, -1.1085205078125, -0.76171875, -0.4149169921875, -0.068115234375, 0.2786865234375, 0.62548828125, 0.9722900390625, 1.319091796875, 1.6658935546875, 2.0126953125, 2.3594970703125, 2.706298828125, 3.0531005859375, 3.39990234375, 3.7467041015625, 4.093505859375, 4.4403076171875, 4.787109375, 5.1339111328125, 5.480712890625, 5.8275146484375, 6.17431640625, 6.5211181640625, 6.867919921875, 7.2147216796875, 7.5615234375, 7.9083251953125, 8.255126953125, 8.6019287109375, 8.94873046875, 9.2955322265625, 9.642333984375, 9.9891357421875, 10.3359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 5.0, 14.0, 21.0, 31.0, 61.0, 180.0, 2990.0, 559.0, 109.0, 40.0, 21.0, 15.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55859375, -2.455322265625, -2.35205078125, -2.248779296875, -2.1455078125, -2.042236328125, -1.93896484375, -1.835693359375, -1.732421875, -1.629150390625, -1.52587890625, -1.422607421875, -1.3193359375, -1.216064453125, -1.11279296875, -1.009521484375, -0.90625, -0.802978515625, -0.69970703125, -0.596435546875, -0.4931640625, -0.389892578125, -0.28662109375, -0.183349609375, -0.080078125, 0.023193359375, 0.12646484375, 0.229736328125, 0.3330078125, 0.436279296875, 0.53955078125, 0.642822265625, 0.74609375, 0.849365234375, 0.95263671875, 1.055908203125, 1.1591796875, 1.262451171875, 1.36572265625, 1.468994140625, 1.572265625, 1.675537109375, 1.77880859375, 1.882080078125, 1.9853515625, 2.088623046875, 2.19189453125, 2.295166015625, 2.3984375, 2.501708984375, 2.60498046875, 2.708251953125, 2.8115234375, 2.914794921875, 3.01806640625, 3.121337890625, 3.224609375, 3.327880859375, 3.43115234375, 3.534423828125, 3.6376953125, 3.740966796875, 3.84423828125, 3.947509765625, 4.05078125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 4.0, 9.0, 8.0, 14.0, 19.0, 33.0, 49.0, 70.0, 94.0, 109.0, 108.0, 94.0, 98.0, 80.0, 56.0, 49.0, 26.0, 20.0, 18.0, 11.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.802661895751953, -11.472405433654785, -11.142148971557617, -10.81189250946045, -10.481636047363281, -10.151379585266113, -9.821123123168945, -9.490867614746094, -9.16061019897461, -8.830353736877441, -8.500097274780273, -8.169840812683105, -7.8395843505859375, -7.5093278884887695, -7.17907190322876, -6.848815441131592, -6.518559455871582, -6.188302993774414, -5.858046531677246, -5.527790069580078, -5.19753360748291, -4.867277145385742, -4.537021160125732, -4.2067646980285645, -3.8765082359313965, -3.5462517738342285, -3.2159953117370605, -2.8857390880584717, -2.5554826259613037, -2.2252261638641357, -1.8949698209762573, -1.564713478088379, -1.234457015991211, -0.9042006134986877, -0.5739442110061646, -0.24368780851364136, 0.08656859397888184, 0.4168250560760498, 0.7470813989639282, 1.0773377418518066, 1.4075942039489746, 1.7378506660461426, 2.0681071281433105, 2.3983633518218994, 2.7286198139190674, 3.0588762760162354, 3.389132499694824, 3.719388961791992, 4.04964542388916, 4.379901885986328, 4.710158348083496, 5.040414810180664, 5.370671272277832, 5.700927734375, 6.03118371963501, 6.361440181732178, 6.691696643829346, 7.021953105926514, 7.352209568023682, 7.68246603012085, 8.01272201538086, 8.342978477478027, 8.673234939575195, 9.003491401672363, 9.333747863769531]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 1.0, 6.0, 2.0, 2.0, 4.0, 5.0, 9.0, 5.0, 8.0, 8.0, 8.0, 6.0, 12.0, 10.0, 16.0, 18.0, 16.0, 28.0, 23.0, 24.0, 32.0, 31.0, 29.0, 29.0, 36.0, 35.0, 36.0, 40.0, 30.0, 32.0, 37.0, 43.0, 43.0, 24.0, 31.0, 23.0, 24.0, 28.0, 29.0, 24.0, 21.0, 21.0, 10.0, 19.0, 20.0, 10.0, 6.0, 13.0, 10.0, 4.0, 6.0, 11.0, 7.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0], "bins": [-5.173661708831787, -5.017061710357666, -4.860462188720703, -4.703862190246582, -4.547262191772461, -4.39066219329834, -4.234062671661377, -4.077462673187256, -3.920862913131714, -3.764263153076172, -3.607663154602051, -3.451063394546509, -3.294463634490967, -3.1378636360168457, -2.9812638759613037, -2.8246641159057617, -2.6680641174316406, -2.5114643573760986, -2.3548643589019775, -2.1982645988464355, -2.0416646003723145, -1.8850648403167725, -1.7284650802612305, -1.571865200996399, -1.4152653217315674, -1.2586654424667358, -1.1020655632019043, -0.9454658031463623, -0.7888659238815308, -0.6322660446166992, -0.47566622495651245, -0.3190664052963257, -0.16246604919433594, -0.005866199731826782, 0.15073364973068237, 0.30733349919319153, 0.4639333486557007, 0.6205332279205322, 0.777133047580719, 0.9337328672409058, 1.0903327465057373, 1.2469326257705688, 1.4035325050354004, 1.5601322650909424, 1.716732144355774, 1.8733320236206055, 2.0299317836761475, 2.1865315437316895, 2.3431315422058105, 2.4997313022613525, 2.6563313007354736, 2.8129310607910156, 2.9695310592651367, 3.1261308193206787, 3.2827305793762207, 3.439330577850342, 3.595930337905884, 3.752530097961426, 3.909130096435547, 4.065730094909668, 4.222329616546631, 4.378929615020752, 4.535529613494873, 4.692129135131836, 4.848729133605957]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 9.0, 6.0, 16.0, 26.0, 34.0, 49.0, 66.0, 113.0, 162.0, 267.0, 425.0, 688.0, 1160.0, 2077.0, 3820.0, 7392.0, 14762.0, 32543.0, 76389.0, 168459.0, 276696.0, 238786.0, 123881.0, 53314.0, 23495.0, 11274.0, 5583.0, 2913.0, 1671.0, 920.0, 557.0, 324.0, 247.0, 152.0, 99.0, 54.0, 44.0, 29.0, 21.0, 6.0, 6.0, 3.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-6.74609375, -6.562744140625, -6.37939453125, -6.196044921875, -6.0126953125, -5.829345703125, -5.64599609375, -5.462646484375, -5.279296875, -5.095947265625, -4.91259765625, -4.729248046875, -4.5458984375, -4.362548828125, -4.17919921875, -3.995849609375, -3.8125, -3.629150390625, -3.44580078125, -3.262451171875, -3.0791015625, -2.895751953125, -2.71240234375, -2.529052734375, -2.345703125, -2.162353515625, -1.97900390625, -1.795654296875, -1.6123046875, -1.428955078125, -1.24560546875, -1.062255859375, -0.87890625, -0.695556640625, -0.51220703125, -0.328857421875, -0.1455078125, 0.037841796875, 0.22119140625, 0.404541015625, 0.587890625, 0.771240234375, 0.95458984375, 1.137939453125, 1.3212890625, 1.504638671875, 1.68798828125, 1.871337890625, 2.0546875, 2.238037109375, 2.42138671875, 2.604736328125, 2.7880859375, 2.971435546875, 3.15478515625, 3.338134765625, 3.521484375, 3.704833984375, 3.88818359375, 4.071533203125, 4.2548828125, 4.438232421875, 4.62158203125, 4.804931640625, 4.98828125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 3.0, 4.0, 6.0, 6.0, 8.0, 11.0, 8.0, 13.0, 23.0, 28.0, 26.0, 32.0, 36.0, 31.0, 47.0, 48.0, 54.0, 34.0, 72.0, 52.0, 50.0, 45.0, 36.0, 39.0, 36.0, 49.0, 29.0, 28.0, 26.0, 23.0, 24.0, 14.0, 12.0, 13.0, 9.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.720703125, -2.62445068359375, -2.5281982421875, -2.43194580078125, -2.335693359375, -2.23944091796875, -2.1431884765625, -2.04693603515625, -1.95068359375, -1.85443115234375, -1.7581787109375, -1.66192626953125, -1.565673828125, -1.46942138671875, -1.3731689453125, -1.27691650390625, -1.1806640625, -1.08441162109375, -0.9881591796875, -0.89190673828125, -0.795654296875, -0.69940185546875, -0.6031494140625, -0.50689697265625, -0.41064453125, -0.31439208984375, -0.2181396484375, -0.12188720703125, -0.025634765625, 0.07061767578125, 0.1668701171875, 0.26312255859375, 0.359375, 0.45562744140625, 0.5518798828125, 0.64813232421875, 0.744384765625, 0.84063720703125, 0.9368896484375, 1.03314208984375, 1.12939453125, 1.22564697265625, 1.3218994140625, 1.41815185546875, 1.514404296875, 1.61065673828125, 1.7069091796875, 1.80316162109375, 1.8994140625, 1.99566650390625, 2.0919189453125, 2.18817138671875, 2.284423828125, 2.38067626953125, 2.4769287109375, 2.57318115234375, 2.66943359375, 2.76568603515625, 2.8619384765625, 2.95819091796875, 3.054443359375, 3.15069580078125, 3.2469482421875, 3.34320068359375, 3.439453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 10.0, 10.0, 13.0, 21.0, 29.0, 31.0, 63.0, 55.0, 117.0, 155.0, 190.0, 294.0, 400.0, 656.0, 1176.0, 2540.0, 8692.0, 57624.0, 544732.0, 382567.0, 37693.0, 6437.0, 2114.0, 1067.0, 610.0, 376.0, 229.0, 202.0, 118.0, 88.0, 63.0, 47.0, 34.0, 26.0, 19.0, 18.0, 10.0, 10.0, 4.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.640625, -14.1956787109375, -13.750732421875, -13.3057861328125, -12.86083984375, -12.4158935546875, -11.970947265625, -11.5260009765625, -11.0810546875, -10.6361083984375, -10.191162109375, -9.7462158203125, -9.30126953125, -8.8563232421875, -8.411376953125, -7.9664306640625, -7.521484375, -7.0765380859375, -6.631591796875, -6.1866455078125, -5.74169921875, -5.2967529296875, -4.851806640625, -4.4068603515625, -3.9619140625, -3.5169677734375, -3.072021484375, -2.6270751953125, -2.18212890625, -1.7371826171875, -1.292236328125, -0.8472900390625, -0.40234375, 0.0426025390625, 0.487548828125, 0.9324951171875, 1.37744140625, 1.8223876953125, 2.267333984375, 2.7122802734375, 3.1572265625, 3.6021728515625, 4.047119140625, 4.4920654296875, 4.93701171875, 5.3819580078125, 5.826904296875, 6.2718505859375, 6.716796875, 7.1617431640625, 7.606689453125, 8.0516357421875, 8.49658203125, 8.9415283203125, 9.386474609375, 9.8314208984375, 10.2763671875, 10.7213134765625, 11.166259765625, 11.6112060546875, 12.05615234375, 12.5010986328125, 12.946044921875, 13.3909912109375, 13.8359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 4.0, 10.0, 10.0, 8.0, 18.0, 13.0, 22.0, 16.0, 28.0, 29.0, 30.0, 32.0, 49.0, 35.0, 35.0, 45.0, 34.0, 51.0, 38.0, 47.0, 46.0, 43.0, 54.0, 37.0, 38.0, 38.0, 20.0, 22.0, 23.0, 26.0, 16.0, 18.0, 13.0, 11.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9609375, -12.5440673828125, -12.127197265625, -11.7103271484375, -11.29345703125, -10.8765869140625, -10.459716796875, -10.0428466796875, -9.6259765625, -9.2091064453125, -8.792236328125, -8.3753662109375, -7.95849609375, -7.5416259765625, -7.124755859375, -6.7078857421875, -6.291015625, -5.8741455078125, -5.457275390625, -5.0404052734375, -4.62353515625, -4.2066650390625, -3.789794921875, -3.3729248046875, -2.9560546875, -2.5391845703125, -2.122314453125, -1.7054443359375, -1.28857421875, -0.8717041015625, -0.454833984375, -0.0379638671875, 0.37890625, 0.7957763671875, 1.212646484375, 1.6295166015625, 2.04638671875, 2.4632568359375, 2.880126953125, 3.2969970703125, 3.7138671875, 4.1307373046875, 4.547607421875, 4.9644775390625, 5.38134765625, 5.7982177734375, 6.215087890625, 6.6319580078125, 7.048828125, 7.4656982421875, 7.882568359375, 8.2994384765625, 8.71630859375, 9.1331787109375, 9.550048828125, 9.9669189453125, 10.3837890625, 10.8006591796875, 11.217529296875, 11.6343994140625, 12.05126953125, 12.4681396484375, 12.885009765625, 13.3018798828125, 13.71875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 2.0, 5.0, 12.0, 10.0, 12.0, 13.0, 20.0, 27.0, 31.0, 34.0, 63.0, 86.0, 113.0, 154.0, 208.0, 399.0, 712.0, 1537.0, 3398.0, 10387.0, 39623.0, 204585.0, 582987.0, 157797.0, 31402.0, 8653.0, 3134.0, 1314.0, 656.0, 383.0, 232.0, 143.0, 116.0, 87.0, 47.0, 34.0, 33.0, 29.0, 15.0, 8.0, 13.0, 12.0, 3.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.8046875, -4.65179443359375, -4.4989013671875, -4.34600830078125, -4.193115234375, -4.04022216796875, -3.8873291015625, -3.73443603515625, -3.58154296875, -3.42864990234375, -3.2757568359375, -3.12286376953125, -2.969970703125, -2.81707763671875, -2.6641845703125, -2.51129150390625, -2.3583984375, -2.20550537109375, -2.0526123046875, -1.89971923828125, -1.746826171875, -1.59393310546875, -1.4410400390625, -1.28814697265625, -1.13525390625, -0.98236083984375, -0.8294677734375, -0.67657470703125, -0.523681640625, -0.37078857421875, -0.2178955078125, -0.06500244140625, 0.087890625, 0.24078369140625, 0.3936767578125, 0.54656982421875, 0.699462890625, 0.85235595703125, 1.0052490234375, 1.15814208984375, 1.31103515625, 1.46392822265625, 1.6168212890625, 1.76971435546875, 1.922607421875, 2.07550048828125, 2.2283935546875, 2.38128662109375, 2.5341796875, 2.68707275390625, 2.8399658203125, 2.99285888671875, 3.145751953125, 3.29864501953125, 3.4515380859375, 3.60443115234375, 3.75732421875, 3.91021728515625, 4.0631103515625, 4.21600341796875, 4.368896484375, 4.52178955078125, 4.6746826171875, 4.82757568359375, 4.98046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 10.0, 9.0, 5.0, 13.0, 14.0, 26.0, 29.0, 27.0, 37.0, 45.0, 70.0, 59.0, 94.0, 102.0, 80.0, 68.0, 73.0, 56.0, 28.0, 39.0, 30.0, 23.0, 16.0, 8.0, 7.0, 4.0, 2.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005254745483398438, -0.0005038157105445862, -0.0004821568727493286, -0.00046049803495407104, -0.0004388391971588135, -0.0004171803593635559, -0.00039552152156829834, -0.00037386268377304077, -0.0003522038459777832, -0.00033054500818252563, -0.00030888617038726807, -0.0002872273325920105, -0.00026556849479675293, -0.00024390965700149536, -0.0002222508192062378, -0.00020059198141098022, -0.00017893314361572266, -0.0001572743058204651, -0.00013561546802520752, -0.00011395663022994995, -9.229779243469238e-05, -7.063895463943481e-05, -4.8980116844177246e-05, -2.7321279048919678e-05, -5.662441253662109e-06, 1.599639654159546e-05, 3.765523433685303e-05, 5.9314072132110596e-05, 8.097290992736816e-05, 0.00010263174772262573, 0.0001242905855178833, 0.00014594942331314087, 0.00016760826110839844, 0.000189267098903656, 0.00021092593669891357, 0.00023258477449417114, 0.0002542436122894287, 0.0002759024500846863, 0.00029756128787994385, 0.0003192201256752014, 0.000340878963470459, 0.00036253780126571655, 0.0003841966390609741, 0.0004058554768562317, 0.00042751431465148926, 0.0004491731524467468, 0.0004708319902420044, 0.000492490828037262, 0.0005141496658325195, 0.0005358085036277771, 0.0005574673414230347, 0.0005791261792182922, 0.0006007850170135498, 0.0006224438548088074, 0.0006441026926040649, 0.0006657615303993225, 0.0006874203681945801, 0.0007090792059898376, 0.0007307380437850952, 0.0007523968815803528, 0.0007740557193756104, 0.0007957145571708679, 0.0008173733949661255, 0.0008390322327613831, 0.0008606910705566406]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 3.0, 8.0, 7.0, 14.0, 28.0, 33.0, 48.0, 69.0, 130.0, 256.0, 479.0, 966.0, 2234.0, 6810.0, 35999.0, 459310.0, 492808.0, 37807.0, 7263.0, 2298.0, 962.0, 457.0, 243.0, 116.0, 71.0, 33.0, 23.0, 16.0, 18.0, 9.0, 12.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.32421875, -6.06085205078125, -5.7974853515625, -5.53411865234375, -5.270751953125, -5.00738525390625, -4.7440185546875, -4.48065185546875, -4.21728515625, -3.95391845703125, -3.6905517578125, -3.42718505859375, -3.163818359375, -2.90045166015625, -2.6370849609375, -2.37371826171875, -2.1103515625, -1.84698486328125, -1.5836181640625, -1.32025146484375, -1.056884765625, -0.79351806640625, -0.5301513671875, -0.26678466796875, -0.00341796875, 0.25994873046875, 0.5233154296875, 0.78668212890625, 1.050048828125, 1.31341552734375, 1.5767822265625, 1.84014892578125, 2.103515625, 2.36688232421875, 2.6302490234375, 2.89361572265625, 3.156982421875, 3.42034912109375, 3.6837158203125, 3.94708251953125, 4.21044921875, 4.47381591796875, 4.7371826171875, 5.00054931640625, 5.263916015625, 5.52728271484375, 5.7906494140625, 6.05401611328125, 6.3173828125, 6.58074951171875, 6.8441162109375, 7.10748291015625, 7.370849609375, 7.63421630859375, 7.8975830078125, 8.16094970703125, 8.42431640625, 8.68768310546875, 8.9510498046875, 9.21441650390625, 9.477783203125, 9.74114990234375, 10.0045166015625, 10.26788330078125, 10.53125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 3.0, 11.0, 2.0, 5.0, 5.0, 6.0, 11.0, 14.0, 22.0, 21.0, 24.0, 32.0, 34.0, 54.0, 54.0, 55.0, 74.0, 78.0, 68.0, 75.0, 70.0, 58.0, 40.0, 40.0, 34.0, 22.0, 19.0, 17.0, 8.0, 6.0, 7.0, 5.0, 2.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.59375, -4.44561767578125, -4.2974853515625, -4.14935302734375, -4.001220703125, -3.85308837890625, -3.7049560546875, -3.55682373046875, -3.40869140625, -3.26055908203125, -3.1124267578125, -2.96429443359375, -2.816162109375, -2.66802978515625, -2.5198974609375, -2.37176513671875, -2.2236328125, -2.07550048828125, -1.9273681640625, -1.77923583984375, -1.631103515625, -1.48297119140625, -1.3348388671875, -1.18670654296875, -1.03857421875, -0.89044189453125, -0.7423095703125, -0.59417724609375, -0.446044921875, -0.29791259765625, -0.1497802734375, -0.00164794921875, 0.146484375, 0.29461669921875, 0.4427490234375, 0.59088134765625, 0.739013671875, 0.88714599609375, 1.0352783203125, 1.18341064453125, 1.33154296875, 1.47967529296875, 1.6278076171875, 1.77593994140625, 1.924072265625, 2.07220458984375, 2.2203369140625, 2.36846923828125, 2.5166015625, 2.66473388671875, 2.8128662109375, 2.96099853515625, 3.109130859375, 3.25726318359375, 3.4053955078125, 3.55352783203125, 3.70166015625, 3.84979248046875, 3.9979248046875, 4.14605712890625, 4.294189453125, 4.44232177734375, 4.5904541015625, 4.73858642578125, 4.88671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 14.0, 47.0, 119.0, 314.0, 323.0, 136.0, 39.0, 12.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-322.84442138671875, -315.5223388671875, -308.2002258300781, -300.8781433105469, -293.5560302734375, -286.23394775390625, -278.9118347167969, -271.5897521972656, -264.26763916015625, -256.945556640625, -249.62344360351562, -242.3013458251953, -234.979248046875, -227.6571502685547, -220.33505249023438, -213.01296997070312, -205.6908721923828, -198.3687744140625, -191.0466766357422, -183.72457885742188, -176.40248107910156, -169.08038330078125, -161.75830078125, -154.43618774414062, -147.11410522460938, -139.79200744628906, -132.46990966796875, -125.14781188964844, -117.82571411132812, -110.50361633300781, -103.18152618408203, -95.85942840576172, -88.53732299804688, -81.21522521972656, -73.89312744140625, -66.57102966308594, -59.24893569946289, -51.92683792114258, -44.60474395751953, -37.28264617919922, -29.960548400878906, -22.638450622558594, -15.316354751586914, -7.994258880615234, -0.6721611022949219, 6.649936676025391, 13.972030639648438, 21.29412841796875, 28.616226196289062, 35.938323974609375, 43.26042175292969, 50.582515716552734, 57.90461349487305, 65.22671508789062, 72.5488052368164, 79.87090301513672, 87.19300079345703, 94.51509857177734, 101.83719635009766, 109.15928649902344, 116.48138427734375, 123.80348205566406, 131.12557983398438, 138.4476776123047, 145.769775390625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 10.0, 12.0, 18.0, 24.0, 24.0, 25.0, 23.0, 35.0, 27.0, 36.0, 41.0, 43.0, 55.0, 58.0, 50.0, 54.0, 54.0, 34.0, 48.0, 37.0, 36.0, 27.0, 28.0, 33.0, 33.0, 26.0, 25.0, 18.0, 16.0, 7.0, 5.0, 10.0, 3.0, 4.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.84443664550781, -62.68782424926758, -60.53121566772461, -58.374603271484375, -56.21799087524414, -54.061378479003906, -51.90476989746094, -49.7481575012207, -47.59154510498047, -45.434932708740234, -43.278324127197266, -41.12171173095703, -38.9650993347168, -36.80848693847656, -34.651878356933594, -32.49526596069336, -30.33865737915039, -28.18204689025879, -26.025434494018555, -23.868824005126953, -21.71221160888672, -19.555601119995117, -17.398990631103516, -15.242379188537598, -13.08576774597168, -10.929156303405762, -8.772544860839844, -6.615934371948242, -4.459322929382324, -2.3027114868164062, -0.1461009979248047, 2.0105104446411133, 4.167121887207031, 6.323733329772949, 8.480344772338867, 10.636955261230469, 12.793566703796387, 14.950178146362305, 17.106788635253906, 19.26340103149414, 21.420011520385742, 23.576622009277344, 25.733234405517578, 27.88984489440918, 30.04645538330078, 32.203067779541016, 34.35968017578125, 36.51628875732422, 38.67290115356445, 40.82951354980469, 42.986122131347656, 45.14273452758789, 47.299346923828125, 49.455955505371094, 51.61256790161133, 53.76918029785156, 55.92578887939453, 58.082401275634766, 60.239009857177734, 62.39562225341797, 64.55223083496094, 66.70884704589844, 68.8654556274414, 71.02206420898438, 73.17868041992188]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 11.0, 14.0, 12.0, 22.0, 31.0, 45.0, 86.0, 108.0, 200.0, 356.0, 559.0, 1148.0, 2529.0, 7344.0, 40734.0, 4060003.0, 66091.0, 9074.0, 2996.0, 1313.0, 626.0, 375.0, 209.0, 123.0, 90.0, 49.0, 28.0, 29.0, 14.0, 14.0, 14.0, 6.0, 6.0, 1.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.0078125, -14.5738525390625, -14.139892578125, -13.7059326171875, -13.27197265625, -12.8380126953125, -12.404052734375, -11.9700927734375, -11.5361328125, -11.1021728515625, -10.668212890625, -10.2342529296875, -9.80029296875, -9.3663330078125, -8.932373046875, -8.4984130859375, -8.064453125, -7.6304931640625, -7.196533203125, -6.7625732421875, -6.32861328125, -5.8946533203125, -5.460693359375, -5.0267333984375, -4.5927734375, -4.1588134765625, -3.724853515625, -3.2908935546875, -2.85693359375, -2.4229736328125, -1.989013671875, -1.5550537109375, -1.12109375, -0.6871337890625, -0.253173828125, 0.1807861328125, 0.61474609375, 1.0487060546875, 1.482666015625, 1.9166259765625, 2.3505859375, 2.7845458984375, 3.218505859375, 3.6524658203125, 4.08642578125, 4.5203857421875, 4.954345703125, 5.3883056640625, 5.822265625, 6.2562255859375, 6.690185546875, 7.1241455078125, 7.55810546875, 7.9920654296875, 8.426025390625, 8.8599853515625, 9.2939453125, 9.7279052734375, 10.161865234375, 10.5958251953125, 11.02978515625, 11.4637451171875, 11.897705078125, 12.3316650390625, 12.765625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 12.0, 12.0, 11.0, 12.0, 26.0, 30.0, 37.0, 42.0, 53.0, 63.0, 69.0, 70.0, 86.0, 66.0, 75.0, 67.0, 54.0, 48.0, 48.0, 27.0, 19.0, 26.0, 8.0, 13.0, 6.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.63494873046875, -5.4808349609375, -5.32672119140625, -5.172607421875, -5.01849365234375, -4.8643798828125, -4.71026611328125, -4.55615234375, -4.40203857421875, -4.2479248046875, -4.09381103515625, -3.939697265625, -3.78558349609375, -3.6314697265625, -3.47735595703125, -3.3232421875, -3.16912841796875, -3.0150146484375, -2.86090087890625, -2.706787109375, -2.55267333984375, -2.3985595703125, -2.24444580078125, -2.09033203125, -1.93621826171875, -1.7821044921875, -1.62799072265625, -1.473876953125, -1.31976318359375, -1.1656494140625, -1.01153564453125, -0.857421875, -0.70330810546875, -0.5491943359375, -0.39508056640625, -0.240966796875, -0.08685302734375, 0.0672607421875, 0.22137451171875, 0.37548828125, 0.52960205078125, 0.6837158203125, 0.83782958984375, 0.991943359375, 1.14605712890625, 1.3001708984375, 1.45428466796875, 1.6083984375, 1.76251220703125, 1.9166259765625, 2.07073974609375, 2.224853515625, 2.37896728515625, 2.5330810546875, 2.68719482421875, 2.84130859375, 2.99542236328125, 3.1495361328125, 3.30364990234375, 3.457763671875, 3.61187744140625, 3.7659912109375, 3.92010498046875, 4.07421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 14.0, 10.0, 15.0, 16.0, 29.0, 44.0, 39.0, 90.0, 96.0, 137.0, 201.0, 265.0, 403.0, 552.0, 732.0, 1075.0, 1709.0, 3017.0, 6014.0, 14097.0, 53386.0, 3838780.0, 225836.0, 27066.0, 9227.0, 4299.0, 2397.0, 1479.0, 949.0, 677.0, 440.0, 318.0, 248.0, 169.0, 131.0, 96.0, 58.0, 54.0, 38.0, 14.0, 27.0, 17.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.42578125, -6.21002197265625, -5.9942626953125, -5.77850341796875, -5.562744140625, -5.34698486328125, -5.1312255859375, -4.91546630859375, -4.69970703125, -4.48394775390625, -4.2681884765625, -4.05242919921875, -3.836669921875, -3.62091064453125, -3.4051513671875, -3.18939208984375, -2.9736328125, -2.75787353515625, -2.5421142578125, -2.32635498046875, -2.110595703125, -1.89483642578125, -1.6790771484375, -1.46331787109375, -1.24755859375, -1.03179931640625, -0.8160400390625, -0.60028076171875, -0.384521484375, -0.16876220703125, 0.0469970703125, 0.26275634765625, 0.478515625, 0.69427490234375, 0.9100341796875, 1.12579345703125, 1.341552734375, 1.55731201171875, 1.7730712890625, 1.98883056640625, 2.20458984375, 2.42034912109375, 2.6361083984375, 2.85186767578125, 3.067626953125, 3.28338623046875, 3.4991455078125, 3.71490478515625, 3.9306640625, 4.14642333984375, 4.3621826171875, 4.57794189453125, 4.793701171875, 5.00946044921875, 5.2252197265625, 5.44097900390625, 5.65673828125, 5.87249755859375, 6.0882568359375, 6.30401611328125, 6.519775390625, 6.73553466796875, 6.9512939453125, 7.16705322265625, 7.3828125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 10.0, 7.0, 13.0, 14.0, 55.0, 117.0, 3138.0, 540.0, 80.0, 33.0, 19.0, 12.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.683990478515625, -2.60235595703125, -2.520721435546875, -2.4390869140625, -2.357452392578125, -2.27581787109375, -2.194183349609375, -2.112548828125, -2.030914306640625, -1.94927978515625, -1.867645263671875, -1.7860107421875, -1.704376220703125, -1.62274169921875, -1.541107177734375, -1.45947265625, -1.377838134765625, -1.29620361328125, -1.214569091796875, -1.1329345703125, -1.051300048828125, -0.96966552734375, -0.888031005859375, -0.806396484375, -0.724761962890625, -0.64312744140625, -0.561492919921875, -0.4798583984375, -0.398223876953125, -0.31658935546875, -0.234954833984375, -0.1533203125, -0.071685791015625, 0.00994873046875, 0.091583251953125, 0.1732177734375, 0.254852294921875, 0.33648681640625, 0.418121337890625, 0.499755859375, 0.581390380859375, 0.66302490234375, 0.744659423828125, 0.8262939453125, 0.907928466796875, 0.98956298828125, 1.071197509765625, 1.15283203125, 1.234466552734375, 1.31610107421875, 1.397735595703125, 1.4793701171875, 1.561004638671875, 1.64263916015625, 1.724273681640625, 1.805908203125, 1.887542724609375, 1.96917724609375, 2.050811767578125, 2.1324462890625, 2.214080810546875, 2.29571533203125, 2.377349853515625, 2.458984375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 12.0, 8.0, 16.0, 38.0, 59.0, 83.0, 126.0, 160.0, 135.0, 143.0, 94.0, 50.0, 41.0, 13.0, 7.0, 6.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.480964660644531, -10.162897109985352, -9.844829559326172, -9.526762008666992, -9.208694458007812, -8.890626907348633, -8.572559356689453, -8.254490852355957, -7.936423301696777, -7.618355751037598, -7.300288200378418, -6.982220649719238, -6.6641526222229, -6.346085071563721, -6.028017520904541, -5.709949493408203, -5.391882419586182, -5.073814868927002, -4.755747318267822, -4.437679290771484, -4.119611740112305, -3.801544189453125, -3.4834766387939453, -3.1654088497161865, -2.847341299057007, -2.529273748397827, -2.2112059593200684, -1.8931384086608887, -1.5750707387924194, -1.2570030689239502, -0.9389355182647705, -0.6208677291870117, -0.30280017852783203, 0.01526746153831482, 0.33333510160446167, 0.6514027118682861, 0.9694703817367554, 1.2875380516052246, 1.6056056022644043, 1.923673391342163, 2.2417409420013428, 2.5598084926605225, 2.8778762817382812, 3.195943832397461, 3.5140113830566406, 3.8320791721343994, 4.150146484375, 4.468214511871338, 4.786282062530518, 5.104349613189697, 5.422417163848877, 5.740485191345215, 6.0585527420043945, 6.376620292663574, 6.694687843322754, 7.012755393981934, 7.330822944641113, 7.648890495300293, 7.966958045959473, 8.285025596618652, 8.603093147277832, 8.921161651611328, 9.239229202270508, 9.557296752929688, 9.875364303588867]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 5.0, 10.0, 8.0, 10.0, 10.0, 15.0, 18.0, 25.0, 17.0, 35.0, 32.0, 43.0, 49.0, 45.0, 46.0, 48.0, 52.0, 43.0, 52.0, 54.0, 44.0, 58.0, 39.0, 32.0, 39.0, 28.0, 32.0, 18.0, 20.0, 15.0, 15.0, 4.0, 6.0, 9.0, 6.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.567087650299072, -5.418603420257568, -5.2701191902160645, -5.1216349601745605, -4.973150730133057, -4.8246660232543945, -4.676181793212891, -4.527697563171387, -4.379213333129883, -4.230729103088379, -4.082244873046875, -3.933760643005371, -3.785276174545288, -3.636791944503784, -3.4883077144622803, -3.3398232460021973, -3.1913392543792725, -3.0428550243377686, -2.8943707942962646, -2.7458863258361816, -2.5974020957946777, -2.448917865753174, -2.30043363571167, -2.151949405670166, -2.003465175628662, -1.8549809455871582, -1.7064965963363647, -1.5580123662948608, -1.4095280170440674, -1.2610437870025635, -1.1125595569610596, -0.9640752077102661, -0.8155908584594727, -0.667106568813324, -0.5186222791671753, -0.3701380491256714, -0.2216537594795227, -0.07316946983337402, 0.07531476020812988, 0.22379910945892334, 0.37228333950042725, 0.5207676291465759, 0.6692519187927246, 0.8177361488342285, 0.9662204384803772, 1.1147047281265259, 1.2631889581680298, 1.4116733074188232, 1.5601575374603271, 1.708641767501831, 1.8571261167526245, 2.005610466003418, 2.154094696044922, 2.302578926086426, 2.4510631561279297, 2.5995473861694336, 2.7480316162109375, 2.8965158462524414, 3.0450000762939453, 3.193484306335449, 3.3419687747955322, 3.490453004837036, 3.63893723487854, 3.787421703338623, 3.935905933380127]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 12.0, 16.0, 26.0, 42.0, 52.0, 121.0, 251.0, 411.0, 994.0, 2317.0, 6560.0, 22059.0, 87836.0, 332349.0, 420229.0, 129320.0, 31715.0, 8878.0, 3058.0, 1138.0, 538.0, 296.0, 138.0, 64.0, 44.0, 40.0, 17.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5390625, -11.2197265625, -10.900390625, -10.5810546875, -10.26171875, -9.9423828125, -9.623046875, -9.3037109375, -8.984375, -8.6650390625, -8.345703125, -8.0263671875, -7.70703125, -7.3876953125, -7.068359375, -6.7490234375, -6.4296875, -6.1103515625, -5.791015625, -5.4716796875, -5.15234375, -4.8330078125, -4.513671875, -4.1943359375, -3.875, -3.5556640625, -3.236328125, -2.9169921875, -2.59765625, -2.2783203125, -1.958984375, -1.6396484375, -1.3203125, -1.0009765625, -0.681640625, -0.3623046875, -0.04296875, 0.2763671875, 0.595703125, 0.9150390625, 1.234375, 1.5537109375, 1.873046875, 2.1923828125, 2.51171875, 2.8310546875, 3.150390625, 3.4697265625, 3.7890625, 4.1083984375, 4.427734375, 4.7470703125, 5.06640625, 5.3857421875, 5.705078125, 6.0244140625, 6.34375, 6.6630859375, 6.982421875, 7.3017578125, 7.62109375, 7.9404296875, 8.259765625, 8.5791015625, 8.8984375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 9.0, 4.0, 8.0, 10.0, 13.0, 17.0, 29.0, 19.0, 37.0, 33.0, 59.0, 58.0, 59.0, 74.0, 61.0, 87.0, 69.0, 60.0, 52.0, 59.0, 42.0, 42.0, 30.0, 24.0, 17.0, 10.0, 9.0, 8.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.73828125, -5.587066650390625, -5.43585205078125, -5.284637451171875, -5.1334228515625, -4.982208251953125, -4.83099365234375, -4.679779052734375, -4.528564453125, -4.377349853515625, -4.22613525390625, -4.074920654296875, -3.9237060546875, -3.772491455078125, -3.62127685546875, -3.470062255859375, -3.31884765625, -3.167633056640625, -3.01641845703125, -2.865203857421875, -2.7139892578125, -2.562774658203125, -2.41156005859375, -2.260345458984375, -2.109130859375, -1.957916259765625, -1.80670166015625, -1.655487060546875, -1.5042724609375, -1.353057861328125, -1.20184326171875, -1.050628662109375, -0.8994140625, -0.748199462890625, -0.59698486328125, -0.445770263671875, -0.2945556640625, -0.143341064453125, 0.00787353515625, 0.159088134765625, 0.310302734375, 0.461517333984375, 0.61273193359375, 0.763946533203125, 0.9151611328125, 1.066375732421875, 1.21759033203125, 1.368804931640625, 1.52001953125, 1.671234130859375, 1.82244873046875, 1.973663330078125, 2.1248779296875, 2.276092529296875, 2.42730712890625, 2.578521728515625, 2.729736328125, 2.880950927734375, 3.03216552734375, 3.183380126953125, 3.3345947265625, 3.485809326171875, 3.63702392578125, 3.788238525390625, 3.939453125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 3.0, 5.0, 4.0, 9.0, 19.0, 30.0, 33.0, 55.0, 125.0, 172.0, 334.0, 559.0, 1197.0, 3649.0, 22758.0, 415654.0, 567541.0, 29346.0, 4196.0, 1389.0, 625.0, 350.0, 208.0, 109.0, 68.0, 43.0, 23.0, 15.0, 8.0, 7.0, 8.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.57373046875, -17.9755859375, -17.37744140625, -16.779296875, -16.18115234375, -15.5830078125, -14.98486328125, -14.38671875, -13.78857421875, -13.1904296875, -12.59228515625, -11.994140625, -11.39599609375, -10.7978515625, -10.19970703125, -9.6015625, -9.00341796875, -8.4052734375, -7.80712890625, -7.208984375, -6.61083984375, -6.0126953125, -5.41455078125, -4.81640625, -4.21826171875, -3.6201171875, -3.02197265625, -2.423828125, -1.82568359375, -1.2275390625, -0.62939453125, -0.03125, 0.56689453125, 1.1650390625, 1.76318359375, 2.361328125, 2.95947265625, 3.5576171875, 4.15576171875, 4.75390625, 5.35205078125, 5.9501953125, 6.54833984375, 7.146484375, 7.74462890625, 8.3427734375, 8.94091796875, 9.5390625, 10.13720703125, 10.7353515625, 11.33349609375, 11.931640625, 12.52978515625, 13.1279296875, 13.72607421875, 14.32421875, 14.92236328125, 15.5205078125, 16.11865234375, 16.716796875, 17.31494140625, 17.9130859375, 18.51123046875, 19.109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 9.0, 6.0, 15.0, 24.0, 29.0, 41.0, 50.0, 65.0, 77.0, 96.0, 64.0, 84.0, 84.0, 67.0, 66.0, 47.0, 56.0, 45.0, 33.0, 16.0, 10.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.65625, -20.8017578125, -19.947265625, -19.0927734375, -18.23828125, -17.3837890625, -16.529296875, -15.6748046875, -14.8203125, -13.9658203125, -13.111328125, -12.2568359375, -11.40234375, -10.5478515625, -9.693359375, -8.8388671875, -7.984375, -7.1298828125, -6.275390625, -5.4208984375, -4.56640625, -3.7119140625, -2.857421875, -2.0029296875, -1.1484375, -0.2939453125, 0.560546875, 1.4150390625, 2.26953125, 3.1240234375, 3.978515625, 4.8330078125, 5.6875, 6.5419921875, 7.396484375, 8.2509765625, 9.10546875, 9.9599609375, 10.814453125, 11.6689453125, 12.5234375, 13.3779296875, 14.232421875, 15.0869140625, 15.94140625, 16.7958984375, 17.650390625, 18.5048828125, 19.359375, 20.2138671875, 21.068359375, 21.9228515625, 22.77734375, 23.6318359375, 24.486328125, 25.3408203125, 26.1953125, 27.0498046875, 27.904296875, 28.7587890625, 29.61328125, 30.4677734375, 31.322265625, 32.1767578125, 33.03125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 4.0, 6.0, 7.0, 9.0, 9.0, 15.0, 16.0, 29.0, 32.0, 47.0, 77.0, 86.0, 145.0, 272.0, 491.0, 1264.0, 6880.0, 160156.0, 847709.0, 26952.0, 2692.0, 721.0, 370.0, 196.0, 104.0, 78.0, 41.0, 38.0, 28.0, 19.0, 16.0, 12.0, 7.0, 9.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.2890625, -11.9080810546875, -11.527099609375, -11.1461181640625, -10.76513671875, -10.3841552734375, -10.003173828125, -9.6221923828125, -9.2412109375, -8.8602294921875, -8.479248046875, -8.0982666015625, -7.71728515625, -7.3363037109375, -6.955322265625, -6.5743408203125, -6.193359375, -5.8123779296875, -5.431396484375, -5.0504150390625, -4.66943359375, -4.2884521484375, -3.907470703125, -3.5264892578125, -3.1455078125, -2.7645263671875, -2.383544921875, -2.0025634765625, -1.62158203125, -1.2406005859375, -0.859619140625, -0.4786376953125, -0.09765625, 0.2833251953125, 0.664306640625, 1.0452880859375, 1.42626953125, 1.8072509765625, 2.188232421875, 2.5692138671875, 2.9501953125, 3.3311767578125, 3.712158203125, 4.0931396484375, 4.47412109375, 4.8551025390625, 5.236083984375, 5.6170654296875, 5.998046875, 6.3790283203125, 6.760009765625, 7.1409912109375, 7.52197265625, 7.9029541015625, 8.283935546875, 8.6649169921875, 9.0458984375, 9.4268798828125, 9.807861328125, 10.1888427734375, 10.56982421875, 10.9508056640625, 11.331787109375, 11.7127685546875, 12.09375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 5.0, 7.0, 10.0, 10.0, 10.0, 26.0, 25.0, 48.0, 44.0, 57.0, 73.0, 99.0, 104.0, 107.0, 85.0, 68.0, 55.0, 36.0, 32.0, 23.0, 19.0, 13.0, 9.0, 10.0, 6.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007877349853515625, -0.0007621273398399353, -0.0007365196943283081, -0.0007109120488166809, -0.0006853044033050537, -0.0006596967577934265, -0.0006340891122817993, -0.0006084814667701721, -0.0005828738212585449, -0.0005572661757469177, -0.0005316585302352905, -0.0005060508847236633, -0.00048044323921203613, -0.00045483559370040894, -0.00042922794818878174, -0.00040362030267715454, -0.00037801265716552734, -0.00035240501165390015, -0.00032679736614227295, -0.00030118972063064575, -0.00027558207511901855, -0.00024997442960739136, -0.00022436678409576416, -0.00019875913858413696, -0.00017315149307250977, -0.00014754384756088257, -0.00012193620204925537, -9.632855653762817e-05, -7.072091102600098e-05, -4.511326551437378e-05, -1.9505620002746582e-05, 6.102025508880615e-06, 3.170967102050781e-05, 5.731731653213501e-05, 8.292496204376221e-05, 0.0001085326075553894, 0.0001341402530670166, 0.0001597478985786438, 0.000185355544090271, 0.0002109631896018982, 0.0002365708351135254, 0.0002621784806251526, 0.0002877861261367798, 0.000313393771648407, 0.0003390014171600342, 0.0003646090626716614, 0.0003902167081832886, 0.00041582435369491577, 0.00044143199920654297, 0.00046703964471817017, 0.0004926472902297974, 0.0005182549357414246, 0.0005438625812530518, 0.000569470226764679, 0.0005950778722763062, 0.0006206855177879333, 0.0006462931632995605, 0.0006719008088111877, 0.0006975084543228149, 0.0007231160998344421, 0.0007487237453460693, 0.0007743313908576965, 0.0007999390363693237, 0.0008255466818809509, 0.0008511543273925781]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 6.0, 7.0, 14.0, 21.0, 23.0, 17.0, 42.0, 47.0, 78.0, 144.0, 199.0, 396.0, 731.0, 1665.0, 4403.0, 14936.0, 93022.0, 748845.0, 154308.0, 20321.0, 5327.0, 1945.0, 854.0, 457.0, 281.0, 145.0, 90.0, 63.0, 49.0, 33.0, 24.0, 9.0, 14.0, 10.0, 9.0, 6.0, 1.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.640625, -8.3756103515625, -8.110595703125, -7.8455810546875, -7.58056640625, -7.3155517578125, -7.050537109375, -6.7855224609375, -6.5205078125, -6.2554931640625, -5.990478515625, -5.7254638671875, -5.46044921875, -5.1954345703125, -4.930419921875, -4.6654052734375, -4.400390625, -4.1353759765625, -3.870361328125, -3.6053466796875, -3.34033203125, -3.0753173828125, -2.810302734375, -2.5452880859375, -2.2802734375, -2.0152587890625, -1.750244140625, -1.4852294921875, -1.22021484375, -0.9552001953125, -0.690185546875, -0.4251708984375, -0.16015625, 0.1048583984375, 0.369873046875, 0.6348876953125, 0.89990234375, 1.1649169921875, 1.429931640625, 1.6949462890625, 1.9599609375, 2.2249755859375, 2.489990234375, 2.7550048828125, 3.02001953125, 3.2850341796875, 3.550048828125, 3.8150634765625, 4.080078125, 4.3450927734375, 4.610107421875, 4.8751220703125, 5.14013671875, 5.4051513671875, 5.670166015625, 5.9351806640625, 6.2001953125, 6.4652099609375, 6.730224609375, 6.9952392578125, 7.26025390625, 7.5252685546875, 7.790283203125, 8.0552978515625, 8.3203125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 6.0, 7.0, 13.0, 14.0, 24.0, 31.0, 36.0, 61.0, 76.0, 99.0, 130.0, 124.0, 93.0, 72.0, 58.0, 44.0, 20.0, 20.0, 7.0, 15.0, 10.0, 8.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8984375, -8.6112060546875, -8.323974609375, -8.0367431640625, -7.74951171875, -7.4622802734375, -7.175048828125, -6.8878173828125, -6.6005859375, -6.3133544921875, -6.026123046875, -5.7388916015625, -5.45166015625, -5.1644287109375, -4.877197265625, -4.5899658203125, -4.302734375, -4.0155029296875, -3.728271484375, -3.4410400390625, -3.15380859375, -2.8665771484375, -2.579345703125, -2.2921142578125, -2.0048828125, -1.7176513671875, -1.430419921875, -1.1431884765625, -0.85595703125, -0.5687255859375, -0.281494140625, 0.0057373046875, 0.29296875, 0.5802001953125, 0.867431640625, 1.1546630859375, 1.44189453125, 1.7291259765625, 2.016357421875, 2.3035888671875, 2.5908203125, 2.8780517578125, 3.165283203125, 3.4525146484375, 3.73974609375, 4.0269775390625, 4.314208984375, 4.6014404296875, 4.888671875, 5.1759033203125, 5.463134765625, 5.7503662109375, 6.03759765625, 6.3248291015625, 6.612060546875, 6.8992919921875, 7.1865234375, 7.4737548828125, 7.760986328125, 8.0482177734375, 8.33544921875, 8.6226806640625, 8.909912109375, 9.1971435546875, 9.484375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 9.0, 29.0, 72.0, 151.0, 269.0, 232.0, 137.0, 71.0, 19.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.8524932861328, -149.9701385498047, -145.08778381347656, -140.20542907714844, -135.3230743408203, -130.44070434570312, -125.55835723876953, -120.67599487304688, -115.79364013671875, -110.91128540039062, -106.0289306640625, -101.14657592773438, -96.26421356201172, -91.3818588256836, -86.49950408935547, -81.61714172363281, -76.73479461669922, -71.8524398803711, -66.97008514404297, -62.08772659301758, -57.20536804199219, -52.32301330566406, -47.44065856933594, -42.55830001831055, -37.67594528198242, -32.7935905456543, -27.911231994628906, -23.02887725830078, -18.146520614624023, -13.264163970947266, -8.38180923461914, -3.49945068359375, 1.382904052734375, 6.265260219573975, 11.147616386413574, 16.029972076416016, 20.912328720092773, 25.79468536376953, 30.677040100097656, 35.55939865112305, 40.44175338745117, 45.3241081237793, 50.20646667480469, 55.08882141113281, 59.97117614746094, 64.85353088378906, 69.73588562011719, 74.61824798583984, 79.50060272216797, 84.3829574584961, 89.26531219482422, 94.14767456054688, 99.030029296875, 103.91238403320312, 108.79473876953125, 113.67709350585938, 118.5594482421875, 123.44180297851562, 128.32415771484375, 133.20651245117188, 138.0888671875, 142.97122192382812, 147.85357666015625, 152.73594665527344, 157.61830139160156]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 9.0, 17.0, 25.0, 32.0, 42.0, 49.0, 74.0, 77.0, 80.0, 101.0, 94.0, 67.0, 86.0, 64.0, 40.0, 47.0, 29.0, 23.0, 12.0, 9.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.09200286865234, -103.51426696777344, -99.93653869628906, -96.35880279541016, -92.78106689453125, -89.20333099365234, -85.62559509277344, -82.04786682128906, -78.47013092041016, -74.89239501953125, -71.31466674804688, -67.73693084716797, -64.15919494628906, -60.581459045410156, -57.003726959228516, -53.425994873046875, -49.84825897216797, -46.27052307128906, -42.69279098510742, -39.11505889892578, -35.537322998046875, -31.9595890045166, -28.381855010986328, -24.804121017456055, -21.22638702392578, -17.648653030395508, -14.070919036865234, -10.493185043334961, -6.9154510498046875, -3.337717056274414, 0.24001693725585938, 3.817750930786133, 7.3954925537109375, 10.973226547241211, 14.550960540771484, 18.128694534301758, 21.70642852783203, 25.284162521362305, 28.861896514892578, 32.43962860107422, 36.017364501953125, 39.59510040283203, 43.17283248901367, 46.75056457519531, 50.32830047607422, 53.906036376953125, 57.483768463134766, 61.061500549316406, 64.63923645019531, 68.21697235107422, 71.79470825195312, 75.3724365234375, 78.9501724243164, 82.52790832519531, 86.10563659667969, 89.6833724975586, 93.2611083984375, 96.8388442993164, 100.41658020019531, 103.99430847167969, 107.5720443725586, 111.1497802734375, 114.72750854492188, 118.30524444580078, 121.88298034667969]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 9.0, 11.0, 11.0, 15.0, 9.0, 23.0, 24.0, 49.0, 58.0, 102.0, 160.0, 244.0, 407.0, 658.0, 1186.0, 2625.0, 7107.0, 49649.0, 4089454.0, 31182.0, 6233.0, 2422.0, 1150.0, 570.0, 315.0, 218.0, 128.0, 87.0, 63.0, 36.0, 21.0, 14.0, 10.0, 6.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-28.8125, -28.08154296875, -27.3505859375, -26.61962890625, -25.888671875, -25.15771484375, -24.4267578125, -23.69580078125, -22.96484375, -22.23388671875, -21.5029296875, -20.77197265625, -20.041015625, -19.31005859375, -18.5791015625, -17.84814453125, -17.1171875, -16.38623046875, -15.6552734375, -14.92431640625, -14.193359375, -13.46240234375, -12.7314453125, -12.00048828125, -11.26953125, -10.53857421875, -9.8076171875, -9.07666015625, -8.345703125, -7.61474609375, -6.8837890625, -6.15283203125, -5.421875, -4.69091796875, -3.9599609375, -3.22900390625, -2.498046875, -1.76708984375, -1.0361328125, -0.30517578125, 0.42578125, 1.15673828125, 1.8876953125, 2.61865234375, 3.349609375, 4.08056640625, 4.8115234375, 5.54248046875, 6.2734375, 7.00439453125, 7.7353515625, 8.46630859375, 9.197265625, 9.92822265625, 10.6591796875, 11.39013671875, 12.12109375, 12.85205078125, 13.5830078125, 14.31396484375, 15.044921875, 15.77587890625, 16.5068359375, 17.23779296875, 17.96875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 8.0, 11.0, 12.0, 15.0, 25.0, 28.0, 41.0, 55.0, 55.0, 69.0, 75.0, 73.0, 77.0, 77.0, 86.0, 66.0, 47.0, 41.0, 35.0, 33.0, 24.0, 9.0, 4.0, 11.0, 6.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -6.055419921875, -5.88818359375, -5.720947265625, -5.5537109375, -5.386474609375, -5.21923828125, -5.052001953125, -4.884765625, -4.717529296875, -4.55029296875, -4.383056640625, -4.2158203125, -4.048583984375, -3.88134765625, -3.714111328125, -3.546875, -3.379638671875, -3.21240234375, -3.045166015625, -2.8779296875, -2.710693359375, -2.54345703125, -2.376220703125, -2.208984375, -2.041748046875, -1.87451171875, -1.707275390625, -1.5400390625, -1.372802734375, -1.20556640625, -1.038330078125, -0.87109375, -0.703857421875, -0.53662109375, -0.369384765625, -0.2021484375, -0.034912109375, 0.13232421875, 0.299560546875, 0.466796875, 0.634033203125, 0.80126953125, 0.968505859375, 1.1357421875, 1.302978515625, 1.47021484375, 1.637451171875, 1.8046875, 1.971923828125, 2.13916015625, 2.306396484375, 2.4736328125, 2.640869140625, 2.80810546875, 2.975341796875, 3.142578125, 3.309814453125, 3.47705078125, 3.644287109375, 3.8115234375, 3.978759765625, 4.14599609375, 4.313232421875, 4.48046875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 12.0, 19.0, 25.0, 36.0, 49.0, 56.0, 77.0, 103.0, 167.0, 273.0, 376.0, 599.0, 1050.0, 1663.0, 2809.0, 4839.0, 9017.0, 23717.0, 157234.0, 3889726.0, 68233.0, 16651.0, 7330.0, 3948.0, 2324.0, 1445.0, 851.0, 542.0, 359.0, 240.0, 136.0, 102.0, 73.0, 51.0, 46.0, 27.0, 16.0, 11.0, 9.0, 6.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.5467529296875, -8.234130859375, -7.9215087890625, -7.60888671875, -7.2962646484375, -6.983642578125, -6.6710205078125, -6.3583984375, -6.0457763671875, -5.733154296875, -5.4205322265625, -5.10791015625, -4.7952880859375, -4.482666015625, -4.1700439453125, -3.857421875, -3.5447998046875, -3.232177734375, -2.9195556640625, -2.60693359375, -2.2943115234375, -1.981689453125, -1.6690673828125, -1.3564453125, -1.0438232421875, -0.731201171875, -0.4185791015625, -0.10595703125, 0.2066650390625, 0.519287109375, 0.8319091796875, 1.14453125, 1.4571533203125, 1.769775390625, 2.0823974609375, 2.39501953125, 2.7076416015625, 3.020263671875, 3.3328857421875, 3.6455078125, 3.9581298828125, 4.270751953125, 4.5833740234375, 4.89599609375, 5.2086181640625, 5.521240234375, 5.8338623046875, 6.146484375, 6.4591064453125, 6.771728515625, 7.0843505859375, 7.39697265625, 7.7095947265625, 8.022216796875, 8.3348388671875, 8.6474609375, 8.9600830078125, 9.272705078125, 9.5853271484375, 9.89794921875, 10.2105712890625, 10.523193359375, 10.8358154296875, 11.1484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 6.0, 4.0, 15.0, 12.0, 17.0, 42.0, 97.0, 504.0, 3014.0, 199.0, 60.0, 40.0, 13.0, 10.0, 9.0, 1.0, 8.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.853515625, -3.672393798828125, -3.49127197265625, -3.310150146484375, -3.1290283203125, -2.947906494140625, -2.76678466796875, -2.585662841796875, -2.404541015625, -2.223419189453125, -2.04229736328125, -1.861175537109375, -1.6800537109375, -1.498931884765625, -1.31781005859375, -1.136688232421875, -0.95556640625, -0.774444580078125, -0.59332275390625, -0.412200927734375, -0.2310791015625, -0.049957275390625, 0.13116455078125, 0.312286376953125, 0.493408203125, 0.674530029296875, 0.85565185546875, 1.036773681640625, 1.2178955078125, 1.399017333984375, 1.58013916015625, 1.761260986328125, 1.9423828125, 2.123504638671875, 2.30462646484375, 2.485748291015625, 2.6668701171875, 2.847991943359375, 3.02911376953125, 3.210235595703125, 3.391357421875, 3.572479248046875, 3.75360107421875, 3.934722900390625, 4.1158447265625, 4.296966552734375, 4.47808837890625, 4.659210205078125, 4.84033203125, 5.021453857421875, 5.20257568359375, 5.383697509765625, 5.5648193359375, 5.745941162109375, 5.92706298828125, 6.108184814453125, 6.289306640625, 6.470428466796875, 6.65155029296875, 6.832672119140625, 7.0137939453125, 7.194915771484375, 7.37603759765625, 7.557159423828125, 7.73828125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 15.0, 36.0, 85.0, 150.0, 214.0, 197.0, 129.0, 68.0, 43.0, 27.0, 10.0, 8.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.47669792175293, -19.255374908447266, -18.0340518951416, -16.812728881835938, -15.591405868530273, -14.37008285522461, -13.148759841918945, -11.927436828613281, -10.706113815307617, -9.484790802001953, -8.263467788696289, -7.042144775390625, -5.820821762084961, -4.599498748779297, -3.378175735473633, -2.1568527221679688, -0.9355297088623047, 0.2857933044433594, 1.5071163177490234, 2.7284393310546875, 3.9497623443603516, 5.171085357666016, 6.39240837097168, 7.613731384277344, 8.835054397583008, 10.056377410888672, 11.277700424194336, 12.4990234375, 13.720346450805664, 14.941669464111328, 16.162992477416992, 17.384315490722656, 18.605640411376953, 19.826963424682617, 21.04828643798828, 22.269609451293945, 23.49093246459961, 24.712255477905273, 25.933578491210938, 27.1549015045166, 28.376224517822266, 29.59754753112793, 30.818870544433594, 32.040191650390625, 33.26151657104492, 34.48284149169922, 35.70416259765625, 36.92548370361328, 38.14680862426758, 39.368133544921875, 40.589454650878906, 41.81077575683594, 43.032100677490234, 44.25342559814453, 45.47474670410156, 46.696067810058594, 47.91739273071289, 49.13871765136719, 50.36003875732422, 51.58135986328125, 52.80268478393555, 54.024009704589844, 55.245330810546875, 56.466651916503906, 57.6879768371582]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 6.0, 6.0, 11.0, 13.0, 13.0, 12.0, 32.0, 20.0, 24.0, 39.0, 38.0, 46.0, 52.0, 41.0, 55.0, 59.0, 53.0, 45.0, 46.0, 48.0, 55.0, 39.0, 31.0, 38.0, 32.0, 34.0, 16.0, 18.0, 14.0, 15.0, 11.0, 11.0, 4.0, 3.0, 4.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.402545928955078, -14.99402141571045, -14.585495948791504, -14.176971435546875, -13.768446922302246, -13.3599214553833, -12.951396942138672, -12.542871475219727, -12.134346961975098, -11.725822448730469, -11.317296981811523, -10.908772468566895, -10.500247955322266, -10.09172248840332, -9.683197975158691, -9.274673461914062, -8.866147994995117, -8.457623481750488, -8.049098014831543, -7.640573501586914, -7.232048511505127, -6.82352352142334, -6.414999008178711, -6.006474018096924, -5.597949981689453, -5.189424991607666, -4.780900478363037, -4.37237548828125, -3.963850498199463, -3.555325746536255, -3.146800994873047, -2.7382760047912598, -2.3297510147094727, -1.921226143836975, -1.5127012729644775, -1.1041765213012695, -0.695651650428772, -0.2871267795562744, 0.1213979721069336, 0.5299229621887207, 0.9384477138519287, 1.3469725847244263, 1.7554974555969238, 2.164022207260132, 2.57254695892334, 2.981071949005127, 3.389596700668335, 3.798121690750122, 4.20664644241333, 4.615171432495117, 5.023695945739746, 5.432220935821533, 5.84074592590332, 6.249270439147949, 6.657795429229736, 7.066320419311523, 7.474844932556152, 7.8833699226379395, 8.291894912719727, 8.700419425964355, 9.108943939208984, 9.51746940612793, 9.925993919372559, 10.334518432617188, 10.743043899536133]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 15.0, 26.0, 32.0, 47.0, 110.0, 178.0, 361.0, 773.0, 1910.0, 5041.0, 15305.0, 55846.0, 240686.0, 499619.0, 169780.0, 40188.0, 11791.0, 3904.0, 1560.0, 672.0, 341.0, 165.0, 73.0, 58.0, 24.0, 20.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.0712890625, -9.728515625, -9.3857421875, -9.04296875, -8.7001953125, -8.357421875, -8.0146484375, -7.671875, -7.3291015625, -6.986328125, -6.6435546875, -6.30078125, -5.9580078125, -5.615234375, -5.2724609375, -4.9296875, -4.5869140625, -4.244140625, -3.9013671875, -3.55859375, -3.2158203125, -2.873046875, -2.5302734375, -2.1875, -1.8447265625, -1.501953125, -1.1591796875, -0.81640625, -0.4736328125, -0.130859375, 0.2119140625, 0.5546875, 0.8974609375, 1.240234375, 1.5830078125, 1.92578125, 2.2685546875, 2.611328125, 2.9541015625, 3.296875, 3.6396484375, 3.982421875, 4.3251953125, 4.66796875, 5.0107421875, 5.353515625, 5.6962890625, 6.0390625, 6.3818359375, 6.724609375, 7.0673828125, 7.41015625, 7.7529296875, 8.095703125, 8.4384765625, 8.78125, 9.1240234375, 9.466796875, 9.8095703125, 10.15234375, 10.4951171875, 10.837890625, 11.1806640625, 11.5234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 16.0, 16.0, 10.0, 25.0, 24.0, 35.0, 40.0, 42.0, 62.0, 59.0, 52.0, 73.0, 61.0, 66.0, 66.0, 62.0, 55.0, 43.0, 44.0, 38.0, 30.0, 22.0, 9.0, 7.0, 10.0, 6.0, 7.0, 5.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-5.9921875, -5.840423583984375, -5.68865966796875, -5.536895751953125, -5.3851318359375, -5.233367919921875, -5.08160400390625, -4.929840087890625, -4.778076171875, -4.626312255859375, -4.47454833984375, -4.322784423828125, -4.1710205078125, -4.019256591796875, -3.86749267578125, -3.715728759765625, -3.56396484375, -3.412200927734375, -3.26043701171875, -3.108673095703125, -2.9569091796875, -2.805145263671875, -2.65338134765625, -2.501617431640625, -2.349853515625, -2.198089599609375, -2.04632568359375, -1.894561767578125, -1.7427978515625, -1.591033935546875, -1.43927001953125, -1.287506103515625, -1.1357421875, -0.983978271484375, -0.83221435546875, -0.680450439453125, -0.5286865234375, -0.376922607421875, -0.22515869140625, -0.073394775390625, 0.078369140625, 0.230133056640625, 0.38189697265625, 0.533660888671875, 0.6854248046875, 0.837188720703125, 0.98895263671875, 1.140716552734375, 1.29248046875, 1.444244384765625, 1.59600830078125, 1.747772216796875, 1.8995361328125, 2.051300048828125, 2.20306396484375, 2.354827880859375, 2.506591796875, 2.658355712890625, 2.81011962890625, 2.961883544921875, 3.1136474609375, 3.265411376953125, 3.41717529296875, 3.568939208984375, 3.720703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 7.0, 3.0, 7.0, 7.0, 12.0, 13.0, 19.0, 31.0, 45.0, 65.0, 95.0, 150.0, 257.0, 489.0, 1225.0, 3448.0, 19568.0, 345681.0, 638254.0, 31559.0, 4766.0, 1416.0, 612.0, 339.0, 176.0, 89.0, 67.0, 45.0, 33.0, 28.0, 15.0, 7.0, 6.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.921875, -23.220458984375, -22.51904296875, -21.817626953125, -21.1162109375, -20.414794921875, -19.71337890625, -19.011962890625, -18.310546875, -17.609130859375, -16.90771484375, -16.206298828125, -15.5048828125, -14.803466796875, -14.10205078125, -13.400634765625, -12.69921875, -11.997802734375, -11.29638671875, -10.594970703125, -9.8935546875, -9.192138671875, -8.49072265625, -7.789306640625, -7.087890625, -6.386474609375, -5.68505859375, -4.983642578125, -4.2822265625, -3.580810546875, -2.87939453125, -2.177978515625, -1.4765625, -0.775146484375, -0.07373046875, 0.627685546875, 1.3291015625, 2.030517578125, 2.73193359375, 3.433349609375, 4.134765625, 4.836181640625, 5.53759765625, 6.239013671875, 6.9404296875, 7.641845703125, 8.34326171875, 9.044677734375, 9.74609375, 10.447509765625, 11.14892578125, 11.850341796875, 12.5517578125, 13.253173828125, 13.95458984375, 14.656005859375, 15.357421875, 16.058837890625, 16.76025390625, 17.461669921875, 18.1630859375, 18.864501953125, 19.56591796875, 20.267333984375, 20.96875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 9.0, 11.0, 7.0, 14.0, 20.0, 28.0, 38.0, 39.0, 56.0, 59.0, 70.0, 100.0, 78.0, 78.0, 78.0, 64.0, 54.0, 43.0, 45.0, 30.0, 24.0, 22.0, 10.0, 7.0, 7.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-34.59375, -33.784423828125, -32.97509765625, -32.165771484375, -31.3564453125, -30.547119140625, -29.73779296875, -28.928466796875, -28.119140625, -27.309814453125, -26.50048828125, -25.691162109375, -24.8818359375, -24.072509765625, -23.26318359375, -22.453857421875, -21.64453125, -20.835205078125, -20.02587890625, -19.216552734375, -18.4072265625, -17.597900390625, -16.78857421875, -15.979248046875, -15.169921875, -14.360595703125, -13.55126953125, -12.741943359375, -11.9326171875, -11.123291015625, -10.31396484375, -9.504638671875, -8.6953125, -7.885986328125, -7.07666015625, -6.267333984375, -5.4580078125, -4.648681640625, -3.83935546875, -3.030029296875, -2.220703125, -1.411376953125, -0.60205078125, 0.207275390625, 1.0166015625, 1.825927734375, 2.63525390625, 3.444580078125, 4.25390625, 5.063232421875, 5.87255859375, 6.681884765625, 7.4912109375, 8.300537109375, 9.10986328125, 9.919189453125, 10.728515625, 11.537841796875, 12.34716796875, 13.156494140625, 13.9658203125, 14.775146484375, 15.58447265625, 16.393798828125, 17.203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 4.0, 8.0, 7.0, 6.0, 19.0, 24.0, 21.0, 34.0, 37.0, 60.0, 93.0, 116.0, 183.0, 288.0, 589.0, 1284.0, 3243.0, 11429.0, 57599.0, 616081.0, 310632.0, 34389.0, 7647.0, 2491.0, 973.0, 463.0, 266.0, 157.0, 116.0, 81.0, 49.0, 49.0, 31.0, 20.0, 18.0, 12.0, 13.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0625, -5.87799072265625, -5.6934814453125, -5.50897216796875, -5.324462890625, -5.13995361328125, -4.9554443359375, -4.77093505859375, -4.58642578125, -4.40191650390625, -4.2174072265625, -4.03289794921875, -3.848388671875, -3.66387939453125, -3.4793701171875, -3.29486083984375, -3.1103515625, -2.92584228515625, -2.7413330078125, -2.55682373046875, -2.372314453125, -2.18780517578125, -2.0032958984375, -1.81878662109375, -1.63427734375, -1.44976806640625, -1.2652587890625, -1.08074951171875, -0.896240234375, -0.71173095703125, -0.5272216796875, -0.34271240234375, -0.158203125, 0.02630615234375, 0.2108154296875, 0.39532470703125, 0.579833984375, 0.76434326171875, 0.9488525390625, 1.13336181640625, 1.31787109375, 1.50238037109375, 1.6868896484375, 1.87139892578125, 2.055908203125, 2.24041748046875, 2.4249267578125, 2.60943603515625, 2.7939453125, 2.97845458984375, 3.1629638671875, 3.34747314453125, 3.531982421875, 3.71649169921875, 3.9010009765625, 4.08551025390625, 4.27001953125, 4.45452880859375, 4.6390380859375, 4.82354736328125, 5.008056640625, 5.19256591796875, 5.3770751953125, 5.56158447265625, 5.74609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 6.0, 21.0, 18.0, 34.0, 67.0, 155.0, 238.0, 207.0, 97.0, 47.0, 36.0, 22.0, 13.0, 12.0, 5.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015048980712890625, -0.0014542937278747559, -0.0014036893844604492, -0.0013530850410461426, -0.001302480697631836, -0.0012518763542175293, -0.0012012720108032227, -0.001150667667388916, -0.0011000633239746094, -0.0010494589805603027, -0.000998854637145996, -0.0009482502937316895, -0.0008976459503173828, -0.0008470416069030762, -0.0007964372634887695, -0.0007458329200744629, -0.0006952285766601562, -0.0006446242332458496, -0.000594019889831543, -0.0005434155464172363, -0.0004928112030029297, -0.00044220685958862305, -0.0003916025161743164, -0.00034099817276000977, -0.0002903938293457031, -0.00023978948593139648, -0.00018918514251708984, -0.0001385807991027832, -8.797645568847656e-05, -3.737211227416992e-05, 1.3232231140136719e-05, 6.383657455444336e-05, 0.00011444091796875, 0.00016504526138305664, 0.00021564960479736328, 0.0002662539482116699, 0.00031685829162597656, 0.0003674626350402832, 0.00041806697845458984, 0.0004686713218688965, 0.0005192756652832031, 0.0005698800086975098, 0.0006204843521118164, 0.000671088695526123, 0.0007216930389404297, 0.0007722973823547363, 0.000822901725769043, 0.0008735060691833496, 0.0009241104125976562, 0.0009747147560119629, 0.0010253190994262695, 0.0010759234428405762, 0.0011265277862548828, 0.0011771321296691895, 0.001227736473083496, 0.0012783408164978027, 0.0013289451599121094, 0.001379549503326416, 0.0014301538467407227, 0.0014807581901550293, 0.001531362533569336, 0.0015819668769836426, 0.0016325712203979492, 0.0016831755638122559, 0.0017337799072265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 5.0, 4.0, 7.0, 12.0, 20.0, 17.0, 24.0, 44.0, 61.0, 101.0, 130.0, 242.0, 454.0, 942.0, 2183.0, 6875.0, 32676.0, 386358.0, 563329.0, 42136.0, 8311.0, 2421.0, 1017.0, 425.0, 256.0, 141.0, 117.0, 69.0, 41.0, 24.0, 28.0, 17.0, 12.0, 17.0, 6.0, 6.0, 4.0, 5.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.4921875, -7.258544921875, -7.02490234375, -6.791259765625, -6.5576171875, -6.323974609375, -6.09033203125, -5.856689453125, -5.623046875, -5.389404296875, -5.15576171875, -4.922119140625, -4.6884765625, -4.454833984375, -4.22119140625, -3.987548828125, -3.75390625, -3.520263671875, -3.28662109375, -3.052978515625, -2.8193359375, -2.585693359375, -2.35205078125, -2.118408203125, -1.884765625, -1.651123046875, -1.41748046875, -1.183837890625, -0.9501953125, -0.716552734375, -0.48291015625, -0.249267578125, -0.015625, 0.218017578125, 0.45166015625, 0.685302734375, 0.9189453125, 1.152587890625, 1.38623046875, 1.619873046875, 1.853515625, 2.087158203125, 2.32080078125, 2.554443359375, 2.7880859375, 3.021728515625, 3.25537109375, 3.489013671875, 3.72265625, 3.956298828125, 4.18994140625, 4.423583984375, 4.6572265625, 4.890869140625, 5.12451171875, 5.358154296875, 5.591796875, 5.825439453125, 6.05908203125, 6.292724609375, 6.5263671875, 6.760009765625, 6.99365234375, 7.227294921875, 7.4609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 8.0, 11.0, 28.0, 28.0, 47.0, 58.0, 101.0, 139.0, 162.0, 115.0, 95.0, 70.0, 35.0, 28.0, 10.0, 11.0, 11.0, 6.0, 6.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.5269775390625, -8.272705078125, -8.0184326171875, -7.76416015625, -7.5098876953125, -7.255615234375, -7.0013427734375, -6.7470703125, -6.4927978515625, -6.238525390625, -5.9842529296875, -5.72998046875, -5.4757080078125, -5.221435546875, -4.9671630859375, -4.712890625, -4.4586181640625, -4.204345703125, -3.9500732421875, -3.69580078125, -3.4415283203125, -3.187255859375, -2.9329833984375, -2.6787109375, -2.4244384765625, -2.170166015625, -1.9158935546875, -1.66162109375, -1.4073486328125, -1.153076171875, -0.8988037109375, -0.64453125, -0.3902587890625, -0.135986328125, 0.1182861328125, 0.37255859375, 0.6268310546875, 0.881103515625, 1.1353759765625, 1.3896484375, 1.6439208984375, 1.898193359375, 2.1524658203125, 2.40673828125, 2.6610107421875, 2.915283203125, 3.1695556640625, 3.423828125, 3.6781005859375, 3.932373046875, 4.1866455078125, 4.44091796875, 4.6951904296875, 4.949462890625, 5.2037353515625, 5.4580078125, 5.7122802734375, 5.966552734375, 6.2208251953125, 6.47509765625, 6.7293701171875, 6.983642578125, 7.2379150390625, 7.4921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 10.0, 15.0, 46.0, 121.0, 165.0, 216.0, 201.0, 113.0, 62.0, 25.0, 15.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.0117950439453, -130.28614807128906, -125.56049346923828, -120.8348388671875, -116.10919189453125, -111.383544921875, -106.65789031982422, -101.93223571777344, -97.20658874511719, -92.48094177246094, -87.75528717041016, -83.02963256835938, -78.30398559570312, -73.57833862304688, -68.8526840209961, -64.12702941894531, -59.40138244628906, -54.67573165893555, -49.95008087158203, -45.224430084228516, -40.498779296875, -35.773128509521484, -31.04747772216797, -26.321826934814453, -21.596176147460938, -16.870525360107422, -12.144874572753906, -7.419223785400391, -2.693572998046875, 2.0320777893066406, 6.757728576660156, 11.483379364013672, 16.209014892578125, 20.93466567993164, 25.660316467285156, 30.385967254638672, 35.11161804199219, 39.8372688293457, 44.56291961669922, 49.288570404052734, 54.01422119140625, 58.739871978759766, 63.46552276611328, 68.19117736816406, 72.91682434082031, 77.64247131347656, 82.36812591552734, 87.09378051757812, 91.81942749023438, 96.54507446289062, 101.2707290649414, 105.99638366699219, 110.72203063964844, 115.44767761230469, 120.17333221435547, 124.89898681640625, 129.6246337890625, 134.35028076171875, 139.075927734375, 143.8015899658203, 148.52723693847656, 153.2528839111328, 157.97854614257812, 162.70419311523438, 167.42984008789062]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 4.0, 8.0, 9.0, 10.0, 11.0, 16.0, 23.0, 16.0, 27.0, 27.0, 22.0, 46.0, 39.0, 44.0, 50.0, 46.0, 54.0, 50.0, 50.0, 51.0, 46.0, 63.0, 38.0, 33.0, 30.0, 30.0, 39.0, 17.0, 22.0, 19.0, 13.0, 9.0, 11.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-76.74419403076172, -74.5295181274414, -72.3148422241211, -70.10016632080078, -67.88549041748047, -65.67081451416016, -63.456138610839844, -61.24146270751953, -59.02678680419922, -56.812110900878906, -54.597434997558594, -52.38275909423828, -50.16808319091797, -47.953407287597656, -45.738731384277344, -43.52405548095703, -41.30937957763672, -39.094703674316406, -36.880027770996094, -34.66535186767578, -32.45067596435547, -30.236000061035156, -28.021324157714844, -25.80664825439453, -23.59197235107422, -21.377296447753906, -19.162620544433594, -16.94794464111328, -14.733268737792969, -12.518592834472656, -10.303916931152344, -8.089241027832031, -5.874565124511719, -3.6598892211914062, -1.4452133178710938, 0.7694625854492188, 2.9841384887695312, 5.198814392089844, 7.413490295410156, 9.628166198730469, 11.842842102050781, 14.057518005371094, 16.272193908691406, 18.48686981201172, 20.70154571533203, 22.916221618652344, 25.130897521972656, 27.34557342529297, 29.56024932861328, 31.774925231933594, 33.989601135253906, 36.20427703857422, 38.41895294189453, 40.633628845214844, 42.848304748535156, 45.06298065185547, 47.27765655517578, 49.492332458496094, 51.707008361816406, 53.92168426513672, 56.13636016845703, 58.351036071777344, 60.565711975097656, 62.78038787841797, 64.99506378173828]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 8.0, 8.0, 15.0, 25.0, 32.0, 42.0, 50.0, 118.0, 197.0, 353.0, 591.0, 1214.0, 2225.0, 5026.0, 13252.0, 46860.0, 801553.0, 3198030.0, 92229.0, 19580.0, 6934.0, 2972.0, 1378.0, 733.0, 375.0, 185.0, 111.0, 60.0, 43.0, 38.0, 20.0, 8.0, 12.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.4803466796875, -9.202880859375, -8.9254150390625, -8.64794921875, -8.3704833984375, -8.093017578125, -7.8155517578125, -7.5380859375, -7.2606201171875, -6.983154296875, -6.7056884765625, -6.42822265625, -6.1507568359375, -5.873291015625, -5.5958251953125, -5.318359375, -5.0408935546875, -4.763427734375, -4.4859619140625, -4.20849609375, -3.9310302734375, -3.653564453125, -3.3760986328125, -3.0986328125, -2.8211669921875, -2.543701171875, -2.2662353515625, -1.98876953125, -1.7113037109375, -1.433837890625, -1.1563720703125, -0.87890625, -0.6014404296875, -0.323974609375, -0.0465087890625, 0.23095703125, 0.5084228515625, 0.785888671875, 1.0633544921875, 1.3408203125, 1.6182861328125, 1.895751953125, 2.1732177734375, 2.45068359375, 2.7281494140625, 3.005615234375, 3.2830810546875, 3.560546875, 3.8380126953125, 4.115478515625, 4.3929443359375, 4.67041015625, 4.9478759765625, 5.225341796875, 5.5028076171875, 5.7802734375, 6.0577392578125, 6.335205078125, 6.6126708984375, 6.89013671875, 7.1676025390625, 7.445068359375, 7.7225341796875, 8.0]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 1.0, 11.0, 7.0, 8.0, 12.0, 21.0, 18.0, 22.0, 28.0, 45.0, 42.0, 38.0, 51.0, 68.0, 49.0, 62.0, 63.0, 57.0, 57.0, 64.0, 42.0, 47.0, 33.0, 28.0, 33.0, 17.0, 10.0, 8.0, 9.0, 10.0, 5.0, 4.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.6796875, -4.55230712890625, -4.4249267578125, -4.29754638671875, -4.170166015625, -4.04278564453125, -3.9154052734375, -3.78802490234375, -3.66064453125, -3.53326416015625, -3.4058837890625, -3.27850341796875, -3.151123046875, -3.02374267578125, -2.8963623046875, -2.76898193359375, -2.6416015625, -2.51422119140625, -2.3868408203125, -2.25946044921875, -2.132080078125, -2.00469970703125, -1.8773193359375, -1.74993896484375, -1.62255859375, -1.49517822265625, -1.3677978515625, -1.24041748046875, -1.113037109375, -0.98565673828125, -0.8582763671875, -0.73089599609375, -0.603515625, -0.47613525390625, -0.3487548828125, -0.22137451171875, -0.093994140625, 0.03338623046875, 0.1607666015625, 0.28814697265625, 0.41552734375, 0.54290771484375, 0.6702880859375, 0.79766845703125, 0.925048828125, 1.05242919921875, 1.1798095703125, 1.30718994140625, 1.4345703125, 1.56195068359375, 1.6893310546875, 1.81671142578125, 1.944091796875, 2.07147216796875, 2.1988525390625, 2.32623291015625, 2.45361328125, 2.58099365234375, 2.7083740234375, 2.83575439453125, 2.963134765625, 3.09051513671875, 3.2178955078125, 3.34527587890625, 3.47265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 3.0, 6.0, 5.0, 4.0, 7.0, 18.0, 26.0, 20.0, 56.0, 86.0, 203.0, 613.0, 2418.0, 12374.0, 128946.0, 3971316.0, 67179.0, 8393.0, 1778.0, 463.0, 166.0, 85.0, 26.0, 21.0, 13.0, 14.0, 7.0, 8.0, 8.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.640625, -17.04052734375, -16.4404296875, -15.84033203125, -15.240234375, -14.64013671875, -14.0400390625, -13.43994140625, -12.83984375, -12.23974609375, -11.6396484375, -11.03955078125, -10.439453125, -9.83935546875, -9.2392578125, -8.63916015625, -8.0390625, -7.43896484375, -6.8388671875, -6.23876953125, -5.638671875, -5.03857421875, -4.4384765625, -3.83837890625, -3.23828125, -2.63818359375, -2.0380859375, -1.43798828125, -0.837890625, -0.23779296875, 0.3623046875, 0.96240234375, 1.5625, 2.16259765625, 2.7626953125, 3.36279296875, 3.962890625, 4.56298828125, 5.1630859375, 5.76318359375, 6.36328125, 6.96337890625, 7.5634765625, 8.16357421875, 8.763671875, 9.36376953125, 9.9638671875, 10.56396484375, 11.1640625, 11.76416015625, 12.3642578125, 12.96435546875, 13.564453125, 14.16455078125, 14.7646484375, 15.36474609375, 15.96484375, 16.56494140625, 17.1650390625, 17.76513671875, 18.365234375, 18.96533203125, 19.5654296875, 20.16552734375, 20.765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 8.0, 6.0, 9.0, 14.0, 6.0, 13.0, 24.0, 27.0, 55.0, 85.0, 191.0, 518.0, 1544.0, 950.0, 336.0, 90.0, 62.0, 40.0, 21.0, 16.0, 10.0, 10.0, 11.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.53125, -12.180908203125, -11.83056640625, -11.480224609375, -11.1298828125, -10.779541015625, -10.42919921875, -10.078857421875, -9.728515625, -9.378173828125, -9.02783203125, -8.677490234375, -8.3271484375, -7.976806640625, -7.62646484375, -7.276123046875, -6.92578125, -6.575439453125, -6.22509765625, -5.874755859375, -5.5244140625, -5.174072265625, -4.82373046875, -4.473388671875, -4.123046875, -3.772705078125, -3.42236328125, -3.072021484375, -2.7216796875, -2.371337890625, -2.02099609375, -1.670654296875, -1.3203125, -0.969970703125, -0.61962890625, -0.269287109375, 0.0810546875, 0.431396484375, 0.78173828125, 1.132080078125, 1.482421875, 1.832763671875, 2.18310546875, 2.533447265625, 2.8837890625, 3.234130859375, 3.58447265625, 3.934814453125, 4.28515625, 4.635498046875, 4.98583984375, 5.336181640625, 5.6865234375, 6.036865234375, 6.38720703125, 6.737548828125, 7.087890625, 7.438232421875, 7.78857421875, 8.138916015625, 8.4892578125, 8.839599609375, 9.18994140625, 9.540283203125, 9.890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 8.0, 6.0, 11.0, 21.0, 46.0, 144.0, 247.0, 277.0, 160.0, 59.0, 18.0, 11.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.9678192138672, -153.36355590820312, -148.75929260253906, -144.155029296875, -139.55076599121094, -134.94650268554688, -130.3422393798828, -125.73797607421875, -121.13371276855469, -116.52944946289062, -111.92518615722656, -107.3209228515625, -102.71665954589844, -98.11239624023438, -93.50813293457031, -88.90386962890625, -84.29960632324219, -79.69534301757812, -75.09107971191406, -70.48681640625, -65.88255310058594, -61.278289794921875, -56.67402648925781, -52.06976318359375, -47.46549987792969, -42.861236572265625, -38.25697326660156, -33.6527099609375, -29.048446655273438, -24.444183349609375, -19.839920043945312, -15.23565673828125, -10.63140869140625, -6.0271453857421875, -1.422882080078125, 3.1813812255859375, 7.78564453125, 12.389907836914062, 16.994171142578125, 21.598434448242188, 26.20269775390625, 30.806961059570312, 35.411224365234375, 40.01548767089844, 44.6197509765625, 49.22401428222656, 53.828277587890625, 58.43254089355469, 63.03680419921875, 67.64106750488281, 72.24533081054688, 76.84959411621094, 81.453857421875, 86.05812072753906, 90.66238403320312, 95.26664733886719, 99.87091064453125, 104.47517395019531, 109.07943725585938, 113.68370056152344, 118.2879638671875, 122.89222717285156, 127.49649047851562, 132.1007537841797, 136.70501708984375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 9.0, 12.0, 15.0, 14.0, 12.0, 23.0, 28.0, 30.0, 40.0, 56.0, 55.0, 59.0, 59.0, 64.0, 65.0, 68.0, 55.0, 67.0, 69.0, 40.0, 30.0, 39.0, 20.0, 17.0, 16.0, 13.0, 12.0, 4.0, 6.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.3640251159668, -56.64616012573242, -54.92829895019531, -53.21043395996094, -51.49256896972656, -49.77470397949219, -48.05684280395508, -46.3389778137207, -44.62111282348633, -42.90324783325195, -41.185386657714844, -39.46752166748047, -37.749656677246094, -36.03179168701172, -34.31393051147461, -32.596065521240234, -30.878202438354492, -29.16033935546875, -27.442474365234375, -25.724611282348633, -24.006746292114258, -22.288883209228516, -20.57101821899414, -18.8531551361084, -17.135292053222656, -15.417428016662598, -13.699563980102539, -11.981700897216797, -10.263835906982422, -8.54597282409668, -6.828108787536621, -5.1102447509765625, -3.3923797607421875, -1.6745158433914185, 0.043348073959350586, 1.76121187210083, 3.4790759086608887, 5.196939468383789, 6.914803504943848, 8.632667541503906, 10.350531578063965, 12.068395614624023, 13.786259651184082, 15.50412368774414, 17.221986770629883, 18.939849853515625, 20.65771484375, 22.375579833984375, 24.093442916870117, 25.81130599975586, 27.529170989990234, 29.247034072875977, 30.96489906311035, 32.682762145996094, 34.40062713623047, 36.118492126464844, 37.83635330200195, 39.55421829223633, 41.27207946777344, 42.98994445800781, 44.70780944824219, 46.42567443847656, 48.14353561401367, 49.86140060424805, 51.57926559448242]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 5.0, 8.0, 11.0, 13.0, 24.0, 50.0, 70.0, 112.0, 202.0, 328.0, 616.0, 1177.0, 2465.0, 5562.0, 14136.0, 38565.0, 117832.0, 350825.0, 341712.0, 113516.0, 37345.0, 13385.0, 5493.0, 2452.0, 1151.0, 598.0, 371.0, 213.0, 109.0, 71.0, 38.0, 30.0, 20.0, 13.0, 14.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1875, -7.9315185546875, -7.675537109375, -7.4195556640625, -7.16357421875, -6.9075927734375, -6.651611328125, -6.3956298828125, -6.1396484375, -5.8836669921875, -5.627685546875, -5.3717041015625, -5.11572265625, -4.8597412109375, -4.603759765625, -4.3477783203125, -4.091796875, -3.8358154296875, -3.579833984375, -3.3238525390625, -3.06787109375, -2.8118896484375, -2.555908203125, -2.2999267578125, -2.0439453125, -1.7879638671875, -1.531982421875, -1.2760009765625, -1.02001953125, -0.7640380859375, -0.508056640625, -0.2520751953125, 0.00390625, 0.2598876953125, 0.515869140625, 0.7718505859375, 1.02783203125, 1.2838134765625, 1.539794921875, 1.7957763671875, 2.0517578125, 2.3077392578125, 2.563720703125, 2.8197021484375, 3.07568359375, 3.3316650390625, 3.587646484375, 3.8436279296875, 4.099609375, 4.3555908203125, 4.611572265625, 4.8675537109375, 5.12353515625, 5.3795166015625, 5.635498046875, 5.8914794921875, 6.1474609375, 6.4034423828125, 6.659423828125, 6.9154052734375, 7.17138671875, 7.4273681640625, 7.683349609375, 7.9393310546875, 8.1953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 9.0, 5.0, 11.0, 10.0, 7.0, 12.0, 25.0, 19.0, 26.0, 33.0, 37.0, 39.0, 44.0, 44.0, 39.0, 50.0, 56.0, 59.0, 61.0, 58.0, 55.0, 40.0, 33.0, 48.0, 34.0, 20.0, 27.0, 27.0, 13.0, 9.0, 12.0, 5.0, 8.0, 3.0, 5.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.109375, -3.991912841796875, -3.87445068359375, -3.756988525390625, -3.6395263671875, -3.522064208984375, -3.40460205078125, -3.287139892578125, -3.169677734375, -3.052215576171875, -2.93475341796875, -2.817291259765625, -2.6998291015625, -2.582366943359375, -2.46490478515625, -2.347442626953125, -2.22998046875, -2.112518310546875, -1.99505615234375, -1.877593994140625, -1.7601318359375, -1.642669677734375, -1.52520751953125, -1.407745361328125, -1.290283203125, -1.172821044921875, -1.05535888671875, -0.937896728515625, -0.8204345703125, -0.702972412109375, -0.58551025390625, -0.468048095703125, -0.3505859375, -0.233123779296875, -0.11566162109375, 0.001800537109375, 0.1192626953125, 0.236724853515625, 0.35418701171875, 0.471649169921875, 0.589111328125, 0.706573486328125, 0.82403564453125, 0.941497802734375, 1.0589599609375, 1.176422119140625, 1.29388427734375, 1.411346435546875, 1.52880859375, 1.646270751953125, 1.76373291015625, 1.881195068359375, 1.9986572265625, 2.116119384765625, 2.23358154296875, 2.351043701171875, 2.468505859375, 2.585968017578125, 2.70343017578125, 2.820892333984375, 2.9383544921875, 3.055816650390625, 3.17327880859375, 3.290740966796875, 3.408203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 7.0, 16.0, 15.0, 34.0, 37.0, 72.0, 86.0, 129.0, 215.0, 399.0, 694.0, 1628.0, 4567.0, 21179.0, 305578.0, 667698.0, 35884.0, 6244.0, 2039.0, 855.0, 418.0, 246.0, 147.0, 117.0, 68.0, 49.0, 34.0, 22.0, 16.0, 10.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.578125, -18.92822265625, -18.2783203125, -17.62841796875, -16.978515625, -16.32861328125, -15.6787109375, -15.02880859375, -14.37890625, -13.72900390625, -13.0791015625, -12.42919921875, -11.779296875, -11.12939453125, -10.4794921875, -9.82958984375, -9.1796875, -8.52978515625, -7.8798828125, -7.22998046875, -6.580078125, -5.93017578125, -5.2802734375, -4.63037109375, -3.98046875, -3.33056640625, -2.6806640625, -2.03076171875, -1.380859375, -0.73095703125, -0.0810546875, 0.56884765625, 1.21875, 1.86865234375, 2.5185546875, 3.16845703125, 3.818359375, 4.46826171875, 5.1181640625, 5.76806640625, 6.41796875, 7.06787109375, 7.7177734375, 8.36767578125, 9.017578125, 9.66748046875, 10.3173828125, 10.96728515625, 11.6171875, 12.26708984375, 12.9169921875, 13.56689453125, 14.216796875, 14.86669921875, 15.5166015625, 16.16650390625, 16.81640625, 17.46630859375, 18.1162109375, 18.76611328125, 19.416015625, 20.06591796875, 20.7158203125, 21.36572265625, 22.015625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 6.0, 6.0, 11.0, 10.0, 16.0, 21.0, 33.0, 31.0, 40.0, 62.0, 51.0, 63.0, 78.0, 73.0, 64.0, 73.0, 57.0, 42.0, 47.0, 46.0, 36.0, 40.0, 22.0, 24.0, 12.0, 7.0, 4.0, 8.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.109375, -23.387939453125, -22.66650390625, -21.945068359375, -21.2236328125, -20.502197265625, -19.78076171875, -19.059326171875, -18.337890625, -17.616455078125, -16.89501953125, -16.173583984375, -15.4521484375, -14.730712890625, -14.00927734375, -13.287841796875, -12.56640625, -11.844970703125, -11.12353515625, -10.402099609375, -9.6806640625, -8.959228515625, -8.23779296875, -7.516357421875, -6.794921875, -6.073486328125, -5.35205078125, -4.630615234375, -3.9091796875, -3.187744140625, -2.46630859375, -1.744873046875, -1.0234375, -0.302001953125, 0.41943359375, 1.140869140625, 1.8623046875, 2.583740234375, 3.30517578125, 4.026611328125, 4.748046875, 5.469482421875, 6.19091796875, 6.912353515625, 7.6337890625, 8.355224609375, 9.07666015625, 9.798095703125, 10.51953125, 11.240966796875, 11.96240234375, 12.683837890625, 13.4052734375, 14.126708984375, 14.84814453125, 15.569580078125, 16.291015625, 17.012451171875, 17.73388671875, 18.455322265625, 19.1767578125, 19.898193359375, 20.61962890625, 21.341064453125, 22.0625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 13.0, 8.0, 15.0, 13.0, 40.0, 26.0, 55.0, 64.0, 94.0, 133.0, 255.0, 408.0, 891.0, 2283.0, 8594.0, 68943.0, 849320.0, 101541.0, 10953.0, 2600.0, 1012.0, 506.0, 242.0, 149.0, 124.0, 60.0, 46.0, 34.0, 33.0, 23.0, 15.0, 12.0, 7.0, 6.0, 1.0, 10.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.4609375, -7.2086181640625, -6.956298828125, -6.7039794921875, -6.45166015625, -6.1993408203125, -5.947021484375, -5.6947021484375, -5.4423828125, -5.1900634765625, -4.937744140625, -4.6854248046875, -4.43310546875, -4.1807861328125, -3.928466796875, -3.6761474609375, -3.423828125, -3.1715087890625, -2.919189453125, -2.6668701171875, -2.41455078125, -2.1622314453125, -1.909912109375, -1.6575927734375, -1.4052734375, -1.1529541015625, -0.900634765625, -0.6483154296875, -0.39599609375, -0.1436767578125, 0.108642578125, 0.3609619140625, 0.61328125, 0.8656005859375, 1.117919921875, 1.3702392578125, 1.62255859375, 1.8748779296875, 2.127197265625, 2.3795166015625, 2.6318359375, 2.8841552734375, 3.136474609375, 3.3887939453125, 3.64111328125, 3.8934326171875, 4.145751953125, 4.3980712890625, 4.650390625, 4.9027099609375, 5.155029296875, 5.4073486328125, 5.65966796875, 5.9119873046875, 6.164306640625, 6.4166259765625, 6.6689453125, 6.9212646484375, 7.173583984375, 7.4259033203125, 7.67822265625, 7.9305419921875, 8.182861328125, 8.4351806640625, 8.6875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 7.0, 1.0, 2.0, 1.0, 10.0, 4.0, 8.0, 9.0, 10.0, 17.0, 14.0, 16.0, 18.0, 27.0, 23.0, 43.0, 51.0, 92.0, 132.0, 142.0, 100.0, 75.0, 44.0, 33.0, 27.0, 19.0, 12.0, 16.0, 9.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 7.0, 0.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008878707885742188, -0.0008572638034820557, -0.0008266568183898926, -0.0007960498332977295, -0.0007654428482055664, -0.0007348358631134033, -0.0007042288780212402, -0.0006736218929290771, -0.0006430149078369141, -0.000612407922744751, -0.0005818009376525879, -0.0005511939525604248, -0.0005205869674682617, -0.0004899799823760986, -0.00045937299728393555, -0.00042876601219177246, -0.0003981590270996094, -0.0003675520420074463, -0.0003369450569152832, -0.0003063380718231201, -0.00027573108673095703, -0.00024512410163879395, -0.00021451711654663086, -0.00018391013145446777, -0.0001533031463623047, -0.0001226961612701416, -9.208917617797852e-05, -6.148219108581543e-05, -3.0875205993652344e-05, -2.682209014892578e-07, 3.0338764190673828e-05, 6.0945749282836914e-05, 9.1552734375e-05, 0.00012215971946716309, 0.00015276670455932617, 0.00018337368965148926, 0.00021398067474365234, 0.00024458765983581543, 0.0002751946449279785, 0.0003058016300201416, 0.0003364086151123047, 0.0003670156002044678, 0.00039762258529663086, 0.00042822957038879395, 0.00045883655548095703, 0.0004894435405731201, 0.0005200505256652832, 0.0005506575107574463, 0.0005812644958496094, 0.0006118714809417725, 0.0006424784660339355, 0.0006730854511260986, 0.0007036924362182617, 0.0007342994213104248, 0.0007649064064025879, 0.000795513391494751, 0.0008261203765869141, 0.0008567273616790771, 0.0008873343467712402, 0.0009179413318634033, 0.0009485483169555664, 0.0009791553020477295, 0.0010097622871398926, 0.0010403692722320557, 0.0010709762573242188]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 4.0, 4.0, 11.0, 9.0, 13.0, 12.0, 25.0, 37.0, 48.0, 56.0, 98.0, 160.0, 256.0, 385.0, 756.0, 1585.0, 4063.0, 12190.0, 51249.0, 647114.0, 283712.0, 31889.0, 8748.0, 3074.0, 1340.0, 691.0, 373.0, 201.0, 143.0, 87.0, 56.0, 40.0, 39.0, 21.0, 12.0, 9.0, 7.0, 8.0, 4.0, 7.0, 9.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6015625, -6.3646240234375, -6.127685546875, -5.8907470703125, -5.65380859375, -5.4168701171875, -5.179931640625, -4.9429931640625, -4.7060546875, -4.4691162109375, -4.232177734375, -3.9952392578125, -3.75830078125, -3.5213623046875, -3.284423828125, -3.0474853515625, -2.810546875, -2.5736083984375, -2.336669921875, -2.0997314453125, -1.86279296875, -1.6258544921875, -1.388916015625, -1.1519775390625, -0.9150390625, -0.6781005859375, -0.441162109375, -0.2042236328125, 0.03271484375, 0.2696533203125, 0.506591796875, 0.7435302734375, 0.98046875, 1.2174072265625, 1.454345703125, 1.6912841796875, 1.92822265625, 2.1651611328125, 2.402099609375, 2.6390380859375, 2.8759765625, 3.1129150390625, 3.349853515625, 3.5867919921875, 3.82373046875, 4.0606689453125, 4.297607421875, 4.5345458984375, 4.771484375, 5.0084228515625, 5.245361328125, 5.4822998046875, 5.71923828125, 5.9561767578125, 6.193115234375, 6.4300537109375, 6.6669921875, 6.9039306640625, 7.140869140625, 7.3778076171875, 7.61474609375, 7.8516845703125, 8.088623046875, 8.3255615234375, 8.5625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 13.0, 10.0, 10.0, 14.0, 19.0, 27.0, 33.0, 46.0, 48.0, 72.0, 93.0, 110.0, 116.0, 72.0, 70.0, 54.0, 29.0, 31.0, 25.0, 15.0, 11.0, 13.0, 3.0, 4.0, 7.0, 2.0, 8.0, 5.0, 2.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.5172119140625, -5.343017578125, -5.1688232421875, -4.99462890625, -4.8204345703125, -4.646240234375, -4.4720458984375, -4.2978515625, -4.1236572265625, -3.949462890625, -3.7752685546875, -3.60107421875, -3.4268798828125, -3.252685546875, -3.0784912109375, -2.904296875, -2.7301025390625, -2.555908203125, -2.3817138671875, -2.20751953125, -2.0333251953125, -1.859130859375, -1.6849365234375, -1.5107421875, -1.3365478515625, -1.162353515625, -0.9881591796875, -0.81396484375, -0.6397705078125, -0.465576171875, -0.2913818359375, -0.1171875, 0.0570068359375, 0.231201171875, 0.4053955078125, 0.57958984375, 0.7537841796875, 0.927978515625, 1.1021728515625, 1.2763671875, 1.4505615234375, 1.624755859375, 1.7989501953125, 1.97314453125, 2.1473388671875, 2.321533203125, 2.4957275390625, 2.669921875, 2.8441162109375, 3.018310546875, 3.1925048828125, 3.36669921875, 3.5408935546875, 3.715087890625, 3.8892822265625, 4.0634765625, 4.2376708984375, 4.411865234375, 4.5860595703125, 4.76025390625, 4.9344482421875, 5.108642578125, 5.2828369140625, 5.45703125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 38.0, 108.0, 271.0, 327.0, 132.0, 66.0, 25.0, 13.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.676025390625, -165.77627563476562, -159.87652587890625, -153.97679138183594, -148.07704162597656, -142.1772918701172, -136.27755737304688, -130.3778076171875, -124.47805786132812, -118.57830810546875, -112.6785659790039, -106.77882385253906, -100.87907409667969, -94.97932434082031, -89.07958221435547, -83.17984008789062, -77.28009033203125, -71.38034057617188, -65.48059844970703, -59.58085250854492, -53.68110656738281, -47.7813606262207, -41.881614685058594, -35.981868743896484, -30.082122802734375, -24.182376861572266, -18.282630920410156, -12.382884979248047, -6.4831390380859375, -0.5833930969238281, 5.316352844238281, 11.21609878540039, 17.115859985351562, 23.015605926513672, 28.91535186767578, 34.81509780883789, 40.71484375, 46.61458969116211, 52.51433563232422, 58.41408157348633, 64.31382751464844, 70.21357727050781, 76.11331939697266, 82.0130615234375, 87.91281127929688, 93.81256103515625, 99.7123031616211, 105.61204528808594, 111.51179504394531, 117.41154479980469, 123.31128692626953, 129.21102905273438, 135.11077880859375, 141.01052856445312, 146.9102783203125, 152.8100128173828, 158.7097625732422, 164.60951232910156, 170.50924682617188, 176.40899658203125, 182.30874633789062, 188.20849609375, 194.10824584960938, 200.0079803466797, 205.90773010253906]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 3.0, 5.0, 6.0, 11.0, 12.0, 14.0, 14.0, 17.0, 14.0, 24.0, 25.0, 31.0, 39.0, 46.0, 39.0, 44.0, 51.0, 61.0, 67.0, 62.0, 62.0, 55.0, 37.0, 32.0, 34.0, 34.0, 15.0, 32.0, 33.0, 19.0, 16.0, 9.0, 4.0, 6.0, 7.0, 3.0, 7.0, 5.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.4040756225586, -73.09455871582031, -70.7850341796875, -68.47551727294922, -66.16600036621094, -63.856475830078125, -61.546958923339844, -59.2374382019043, -56.92791748046875, -54.6183967590332, -52.30887985229492, -49.999359130859375, -47.68983840942383, -45.38031768798828, -43.07080078125, -40.76128005981445, -38.45176315307617, -36.142242431640625, -33.832725524902344, -31.523204803466797, -29.21368408203125, -26.904165267944336, -24.594646453857422, -22.285125732421875, -19.97560691833496, -17.666088104248047, -15.3565673828125, -13.047048568725586, -10.737528800964355, -8.428009033203125, -6.118490219116211, -3.808969497680664, -1.49945068359375, 0.8100688457489014, 3.1195883750915527, 5.429107666015625, 7.7386274337768555, 10.048147201538086, 12.357666015625, 14.667186737060547, 16.97670555114746, 19.286224365234375, 21.595745086669922, 23.905263900756836, 26.21478271484375, 28.524303436279297, 30.83382225036621, 33.143341064453125, 35.45286178588867, 37.76238250732422, 40.0718994140625, 42.38142013549805, 44.690940856933594, 47.000457763671875, 49.30997848510742, 51.61949920654297, 53.92901611328125, 56.2385368347168, 58.54805374145508, 60.857574462890625, 63.16709518432617, 65.47661590576172, 67.7861328125, 70.09565734863281, 72.4051742553711]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 17.0, 9.0, 16.0, 11.0, 18.0, 34.0, 40.0, 60.0, 107.0, 159.0, 232.0, 345.0, 614.0, 1080.0, 2156.0, 4396.0, 10696.0, 37463.0, 425112.0, 3493602.0, 175693.0, 26208.0, 8485.0, 3579.0, 1740.0, 889.0, 555.0, 315.0, 208.0, 138.0, 77.0, 60.0, 41.0, 36.0, 22.0, 10.0, 9.0, 9.0, 7.0, 5.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1640625, -7.91937255859375, -7.6746826171875, -7.42999267578125, -7.185302734375, -6.94061279296875, -6.6959228515625, -6.45123291015625, -6.20654296875, -5.96185302734375, -5.7171630859375, -5.47247314453125, -5.227783203125, -4.98309326171875, -4.7384033203125, -4.49371337890625, -4.2490234375, -4.00433349609375, -3.7596435546875, -3.51495361328125, -3.270263671875, -3.02557373046875, -2.7808837890625, -2.53619384765625, -2.29150390625, -2.04681396484375, -1.8021240234375, -1.55743408203125, -1.312744140625, -1.06805419921875, -0.8233642578125, -0.57867431640625, -0.333984375, -0.08929443359375, 0.1553955078125, 0.40008544921875, 0.644775390625, 0.88946533203125, 1.1341552734375, 1.37884521484375, 1.62353515625, 1.86822509765625, 2.1129150390625, 2.35760498046875, 2.602294921875, 2.84698486328125, 3.0916748046875, 3.33636474609375, 3.5810546875, 3.82574462890625, 4.0704345703125, 4.31512451171875, 4.559814453125, 4.80450439453125, 5.0491943359375, 5.29388427734375, 5.53857421875, 5.78326416015625, 6.0279541015625, 6.27264404296875, 6.517333984375, 6.76202392578125, 7.0067138671875, 7.25140380859375, 7.49609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 8.0, 5.0, 12.0, 6.0, 21.0, 27.0, 22.0, 30.0, 44.0, 45.0, 61.0, 73.0, 92.0, 81.0, 83.0, 67.0, 61.0, 58.0, 53.0, 35.0, 29.0, 27.0, 17.0, 14.0, 13.0, 4.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.01953125, -6.846923828125, -6.67431640625, -6.501708984375, -6.3291015625, -6.156494140625, -5.98388671875, -5.811279296875, -5.638671875, -5.466064453125, -5.29345703125, -5.120849609375, -4.9482421875, -4.775634765625, -4.60302734375, -4.430419921875, -4.2578125, -4.085205078125, -3.91259765625, -3.739990234375, -3.5673828125, -3.394775390625, -3.22216796875, -3.049560546875, -2.876953125, -2.704345703125, -2.53173828125, -2.359130859375, -2.1865234375, -2.013916015625, -1.84130859375, -1.668701171875, -1.49609375, -1.323486328125, -1.15087890625, -0.978271484375, -0.8056640625, -0.633056640625, -0.46044921875, -0.287841796875, -0.115234375, 0.057373046875, 0.22998046875, 0.402587890625, 0.5751953125, 0.747802734375, 0.92041015625, 1.093017578125, 1.265625, 1.438232421875, 1.61083984375, 1.783447265625, 1.9560546875, 2.128662109375, 2.30126953125, 2.473876953125, 2.646484375, 2.819091796875, 2.99169921875, 3.164306640625, 3.3369140625, 3.509521484375, 3.68212890625, 3.854736328125, 4.02734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 6.0, 4.0, 6.0, 21.0, 21.0, 39.0, 54.0, 112.0, 191.0, 471.0, 867.0, 2196.0, 6100.0, 23608.0, 284240.0, 3761587.0, 91521.0, 15261.0, 4632.0, 1817.0, 762.0, 373.0, 157.0, 94.0, 63.0, 25.0, 19.0, 10.0, 9.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.665283203125, -10.26025390625, -9.855224609375, -9.4501953125, -9.045166015625, -8.64013671875, -8.235107421875, -7.830078125, -7.425048828125, -7.02001953125, -6.614990234375, -6.2099609375, -5.804931640625, -5.39990234375, -4.994873046875, -4.58984375, -4.184814453125, -3.77978515625, -3.374755859375, -2.9697265625, -2.564697265625, -2.15966796875, -1.754638671875, -1.349609375, -0.944580078125, -0.53955078125, -0.134521484375, 0.2705078125, 0.675537109375, 1.08056640625, 1.485595703125, 1.890625, 2.295654296875, 2.70068359375, 3.105712890625, 3.5107421875, 3.915771484375, 4.32080078125, 4.725830078125, 5.130859375, 5.535888671875, 5.94091796875, 6.345947265625, 6.7509765625, 7.156005859375, 7.56103515625, 7.966064453125, 8.37109375, 8.776123046875, 9.18115234375, 9.586181640625, 9.9912109375, 10.396240234375, 10.80126953125, 11.206298828125, 11.611328125, 12.016357421875, 12.42138671875, 12.826416015625, 13.2314453125, 13.636474609375, 14.04150390625, 14.446533203125, 14.8515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 10.0, 17.0, 17.0, 21.0, 46.0, 74.0, 151.0, 409.0, 1058.0, 1238.0, 562.0, 225.0, 77.0, 51.0, 26.0, 20.0, 13.0, 9.0, 12.0, 4.0, 6.0, 2.0, 2.0, 9.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.75, -9.437255859375, -9.12451171875, -8.811767578125, -8.4990234375, -8.186279296875, -7.87353515625, -7.560791015625, -7.248046875, -6.935302734375, -6.62255859375, -6.309814453125, -5.9970703125, -5.684326171875, -5.37158203125, -5.058837890625, -4.74609375, -4.433349609375, -4.12060546875, -3.807861328125, -3.4951171875, -3.182373046875, -2.86962890625, -2.556884765625, -2.244140625, -1.931396484375, -1.61865234375, -1.305908203125, -0.9931640625, -0.680419921875, -0.36767578125, -0.054931640625, 0.2578125, 0.570556640625, 0.88330078125, 1.196044921875, 1.5087890625, 1.821533203125, 2.13427734375, 2.447021484375, 2.759765625, 3.072509765625, 3.38525390625, 3.697998046875, 4.0107421875, 4.323486328125, 4.63623046875, 4.948974609375, 5.26171875, 5.574462890625, 5.88720703125, 6.199951171875, 6.5126953125, 6.825439453125, 7.13818359375, 7.450927734375, 7.763671875, 8.076416015625, 8.38916015625, 8.701904296875, 9.0146484375, 9.327392578125, 9.64013671875, 9.952880859375, 10.265625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 20.0, 35.0, 54.0, 124.0, 197.0, 209.0, 170.0, 87.0, 39.0, 18.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.83888244628906, -73.16429138183594, -70.48970031738281, -67.81510925292969, -65.14051818847656, -62.46592712402344, -59.79133605957031, -57.11674499511719, -54.44215393066406, -51.76756286621094, -49.09297180175781, -46.41838073730469, -43.74378967285156, -41.06919860839844, -38.39460754394531, -35.72001647949219, -33.0454216003418, -30.370830535888672, -27.696239471435547, -25.021648406982422, -22.347057342529297, -19.672466278076172, -16.997873306274414, -14.323282241821289, -11.648691177368164, -8.974100112915039, -6.299508571624756, -3.6249170303344727, -0.9503259658813477, 1.7242650985717773, 4.398857116699219, 7.073448181152344, 9.748039245605469, 12.422630310058594, 15.097221374511719, 17.771812438964844, 20.44640350341797, 23.120994567871094, 25.79558753967285, 28.470178604125977, 31.1447696685791, 33.81936264038086, 36.493953704833984, 39.16854476928711, 41.843135833740234, 44.51772689819336, 47.192317962646484, 49.86690902709961, 52.541500091552734, 55.21609115600586, 57.890682220458984, 60.56527328491211, 63.239864349365234, 65.91445922851562, 68.58905029296875, 71.26364135742188, 73.938232421875, 76.61282348632812, 79.28741455078125, 81.96200561523438, 84.6365966796875, 87.31118774414062, 89.98577880859375, 92.66036987304688, 95.3349609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 9.0, 21.0, 18.0, 34.0, 28.0, 39.0, 33.0, 43.0, 54.0, 56.0, 57.0, 71.0, 81.0, 63.0, 67.0, 52.0, 46.0, 45.0, 36.0, 29.0, 21.0, 23.0, 18.0, 9.0, 6.0, 6.0, 11.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-54.78406524658203, -53.38241958618164, -51.98077392578125, -50.57912826538086, -49.17748260498047, -47.775840759277344, -46.37419509887695, -44.97254943847656, -43.57090377807617, -42.16925811767578, -40.76761245727539, -39.365966796875, -37.964324951171875, -36.562679290771484, -35.161033630371094, -33.7593879699707, -32.35774230957031, -30.956096649169922, -29.55445098876953, -28.152807235717773, -26.751161575317383, -25.349515914916992, -23.947872161865234, -22.546226501464844, -21.144580841064453, -19.742935180664062, -18.341289520263672, -16.939645767211914, -15.538000106811523, -14.136354446411133, -12.734709739685059, -11.333065032958984, -9.931415557861328, -8.529769897460938, -7.128125190734863, -5.726480007171631, -4.324834823608398, -2.923189640045166, -1.5215444564819336, -0.11989974975585938, 1.2817459106445312, 2.6833910942077637, 4.085036277770996, 5.4866814613342285, 6.888326644897461, 8.289972305297852, 9.691617012023926, 11.09326171875, 12.49490737915039, 13.896553039550781, 15.298197746276855, 16.69984245300293, 18.10148811340332, 19.50313377380371, 20.90477752685547, 22.30642318725586, 23.70806884765625, 25.10971450805664, 26.51136016845703, 27.91300392150879, 29.31464958190918, 30.71629524230957, 32.11793899536133, 33.51958465576172, 34.92123031616211]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 6.0, 7.0, 10.0, 10.0, 8.0, 16.0, 23.0, 28.0, 45.0, 59.0, 79.0, 114.0, 193.0, 276.0, 453.0, 729.0, 1445.0, 2727.0, 5378.0, 11626.0, 25917.0, 59326.0, 141111.0, 305147.0, 277069.0, 121938.0, 51338.0, 22561.0, 10334.0, 4958.0, 2417.0, 1299.0, 712.0, 418.0, 254.0, 166.0, 101.0, 99.0, 36.0, 33.0, 21.0, 17.0, 12.0, 14.0, 9.0, 9.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.98046875, -5.7930908203125, -5.605712890625, -5.4183349609375, -5.23095703125, -5.0435791015625, -4.856201171875, -4.6688232421875, -4.4814453125, -4.2940673828125, -4.106689453125, -3.9193115234375, -3.73193359375, -3.5445556640625, -3.357177734375, -3.1697998046875, -2.982421875, -2.7950439453125, -2.607666015625, -2.4202880859375, -2.23291015625, -2.0455322265625, -1.858154296875, -1.6707763671875, -1.4833984375, -1.2960205078125, -1.108642578125, -0.9212646484375, -0.73388671875, -0.5465087890625, -0.359130859375, -0.1717529296875, 0.015625, 0.2030029296875, 0.390380859375, 0.5777587890625, 0.76513671875, 0.9525146484375, 1.139892578125, 1.3272705078125, 1.5146484375, 1.7020263671875, 1.889404296875, 2.0767822265625, 2.26416015625, 2.4515380859375, 2.638916015625, 2.8262939453125, 3.013671875, 3.2010498046875, 3.388427734375, 3.5758056640625, 3.76318359375, 3.9505615234375, 4.137939453125, 4.3253173828125, 4.5126953125, 4.7000732421875, 4.887451171875, 5.0748291015625, 5.26220703125, 5.4495849609375, 5.636962890625, 5.8243408203125, 6.01171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 11.0, 6.0, 12.0, 19.0, 19.0, 16.0, 19.0, 36.0, 33.0, 44.0, 45.0, 65.0, 69.0, 65.0, 62.0, 64.0, 60.0, 48.0, 42.0, 50.0, 40.0, 32.0, 27.0, 22.0, 23.0, 18.0, 14.0, 12.0, 5.0, 6.0, 4.0, 2.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1015625, -4.96234130859375, -4.8231201171875, -4.68389892578125, -4.544677734375, -4.40545654296875, -4.2662353515625, -4.12701416015625, -3.98779296875, -3.84857177734375, -3.7093505859375, -3.57012939453125, -3.430908203125, -3.29168701171875, -3.1524658203125, -3.01324462890625, -2.8740234375, -2.73480224609375, -2.5955810546875, -2.45635986328125, -2.317138671875, -2.17791748046875, -2.0386962890625, -1.89947509765625, -1.76025390625, -1.62103271484375, -1.4818115234375, -1.34259033203125, -1.203369140625, -1.06414794921875, -0.9249267578125, -0.78570556640625, -0.646484375, -0.50726318359375, -0.3680419921875, -0.22882080078125, -0.089599609375, 0.04962158203125, 0.1888427734375, 0.32806396484375, 0.46728515625, 0.60650634765625, 0.7457275390625, 0.88494873046875, 1.024169921875, 1.16339111328125, 1.3026123046875, 1.44183349609375, 1.5810546875, 1.72027587890625, 1.8594970703125, 1.99871826171875, 2.137939453125, 2.27716064453125, 2.4163818359375, 2.55560302734375, 2.69482421875, 2.83404541015625, 2.9732666015625, 3.11248779296875, 3.251708984375, 3.39093017578125, 3.5301513671875, 3.66937255859375, 3.80859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 15.0, 18.0, 35.0, 40.0, 40.0, 89.0, 133.0, 223.0, 404.0, 878.0, 2334.0, 8398.0, 47505.0, 492573.0, 438237.0, 45173.0, 8228.0, 2305.0, 939.0, 382.0, 224.0, 143.0, 80.0, 43.0, 28.0, 19.0, 15.0, 14.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.54443359375, -15.0732421875, -14.60205078125, -14.130859375, -13.65966796875, -13.1884765625, -12.71728515625, -12.24609375, -11.77490234375, -11.3037109375, -10.83251953125, -10.361328125, -9.89013671875, -9.4189453125, -8.94775390625, -8.4765625, -8.00537109375, -7.5341796875, -7.06298828125, -6.591796875, -6.12060546875, -5.6494140625, -5.17822265625, -4.70703125, -4.23583984375, -3.7646484375, -3.29345703125, -2.822265625, -2.35107421875, -1.8798828125, -1.40869140625, -0.9375, -0.46630859375, 0.0048828125, 0.47607421875, 0.947265625, 1.41845703125, 1.8896484375, 2.36083984375, 2.83203125, 3.30322265625, 3.7744140625, 4.24560546875, 4.716796875, 5.18798828125, 5.6591796875, 6.13037109375, 6.6015625, 7.07275390625, 7.5439453125, 8.01513671875, 8.486328125, 8.95751953125, 9.4287109375, 9.89990234375, 10.37109375, 10.84228515625, 11.3134765625, 11.78466796875, 12.255859375, 12.72705078125, 13.1982421875, 13.66943359375, 14.140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 5.0, 4.0, 6.0, 11.0, 7.0, 16.0, 14.0, 17.0, 19.0, 27.0, 16.0, 38.0, 39.0, 33.0, 41.0, 64.0, 57.0, 53.0, 60.0, 47.0, 47.0, 40.0, 50.0, 41.0, 36.0, 38.0, 30.0, 25.0, 20.0, 17.0, 22.0, 13.0, 11.0, 8.0, 7.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.3646240234375, -12.924560546875, -12.4844970703125, -12.04443359375, -11.6043701171875, -11.164306640625, -10.7242431640625, -10.2841796875, -9.8441162109375, -9.404052734375, -8.9639892578125, -8.52392578125, -8.0838623046875, -7.643798828125, -7.2037353515625, -6.763671875, -6.3236083984375, -5.883544921875, -5.4434814453125, -5.00341796875, -4.5633544921875, -4.123291015625, -3.6832275390625, -3.2431640625, -2.8031005859375, -2.363037109375, -1.9229736328125, -1.48291015625, -1.0428466796875, -0.602783203125, -0.1627197265625, 0.27734375, 0.7174072265625, 1.157470703125, 1.5975341796875, 2.03759765625, 2.4776611328125, 2.917724609375, 3.3577880859375, 3.7978515625, 4.2379150390625, 4.677978515625, 5.1180419921875, 5.55810546875, 5.9981689453125, 6.438232421875, 6.8782958984375, 7.318359375, 7.7584228515625, 8.198486328125, 8.6385498046875, 9.07861328125, 9.5186767578125, 9.958740234375, 10.3988037109375, 10.8388671875, 11.2789306640625, 11.718994140625, 12.1590576171875, 12.59912109375, 13.0391845703125, 13.479248046875, 13.9193115234375, 14.359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 5.0, 4.0, 2.0, 5.0, 9.0, 9.0, 11.0, 19.0, 41.0, 40.0, 95.0, 192.0, 325.0, 1051.0, 3490.0, 22276.0, 746274.0, 258178.0, 12685.0, 2442.0, 747.0, 292.0, 134.0, 76.0, 36.0, 34.0, 16.0, 7.0, 9.0, 6.0, 5.0, 4.0, 4.0, 7.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.796875, -10.4581298828125, -10.119384765625, -9.7806396484375, -9.44189453125, -9.1031494140625, -8.764404296875, -8.4256591796875, -8.0869140625, -7.7481689453125, -7.409423828125, -7.0706787109375, -6.73193359375, -6.3931884765625, -6.054443359375, -5.7156982421875, -5.376953125, -5.0382080078125, -4.699462890625, -4.3607177734375, -4.02197265625, -3.6832275390625, -3.344482421875, -3.0057373046875, -2.6669921875, -2.3282470703125, -1.989501953125, -1.6507568359375, -1.31201171875, -0.9732666015625, -0.634521484375, -0.2957763671875, 0.04296875, 0.3817138671875, 0.720458984375, 1.0592041015625, 1.39794921875, 1.7366943359375, 2.075439453125, 2.4141845703125, 2.7529296875, 3.0916748046875, 3.430419921875, 3.7691650390625, 4.10791015625, 4.4466552734375, 4.785400390625, 5.1241455078125, 5.462890625, 5.8016357421875, 6.140380859375, 6.4791259765625, 6.81787109375, 7.1566162109375, 7.495361328125, 7.8341064453125, 8.1728515625, 8.5115966796875, 8.850341796875, 9.1890869140625, 9.52783203125, 9.8665771484375, 10.205322265625, 10.5440673828125, 10.8828125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 6.0, 8.0, 11.0, 21.0, 23.0, 50.0, 69.0, 122.0, 176.0, 192.0, 110.0, 67.0, 44.0, 24.0, 16.0, 12.0, 9.0, 6.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0016088485717773438, -0.0015676170587539673, -0.0015263855457305908, -0.0014851540327072144, -0.0014439225196838379, -0.0014026910066604614, -0.001361459493637085, -0.0013202279806137085, -0.001278996467590332, -0.0012377649545669556, -0.001196533441543579, -0.0011553019285202026, -0.0011140704154968262, -0.0010728389024734497, -0.0010316073894500732, -0.0009903758764266968, -0.0009491443634033203, -0.0009079128503799438, -0.0008666813373565674, -0.0008254498243331909, -0.0007842183113098145, -0.000742986798286438, -0.0007017552852630615, -0.0006605237722396851, -0.0006192922592163086, -0.0005780607461929321, -0.0005368292331695557, -0.0004955977201461792, -0.00045436620712280273, -0.00041313469409942627, -0.0003719031810760498, -0.00033067166805267334, -0.0002894401550292969, -0.0002482086420059204, -0.00020697712898254395, -0.00016574561595916748, -0.00012451410293579102, -8.328258991241455e-05, -4.2051076889038086e-05, -8.195638656616211e-07, 4.0411949157714844e-05, 8.164346218109131e-05, 0.00012287497520446777, 0.00016410648822784424, 0.0002053380012512207, 0.00024656951427459717, 0.00028780102729797363, 0.0003290325403213501, 0.00037026405334472656, 0.00041149556636810303, 0.0004527270793914795, 0.000493958592414856, 0.0005351901054382324, 0.0005764216184616089, 0.0006176531314849854, 0.0006588846445083618, 0.0007001161575317383, 0.0007413476705551147, 0.0007825791835784912, 0.0008238106966018677, 0.0008650422096252441, 0.0009062737226486206, 0.0009475052356719971, 0.0009887367486953735, 0.00102996826171875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 6.0, 6.0, 10.0, 16.0, 17.0, 21.0, 41.0, 63.0, 83.0, 128.0, 224.0, 390.0, 697.0, 1324.0, 2861.0, 6350.0, 17446.0, 82265.0, 717788.0, 176477.0, 26281.0, 8637.0, 3623.0, 1682.0, 886.0, 462.0, 289.0, 158.0, 98.0, 68.0, 33.0, 34.0, 21.0, 14.0, 14.0, 8.0, 6.0, 2.0, 4.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.4296875, -6.22662353515625, -6.0235595703125, -5.82049560546875, -5.617431640625, -5.41436767578125, -5.2113037109375, -5.00823974609375, -4.80517578125, -4.60211181640625, -4.3990478515625, -4.19598388671875, -3.992919921875, -3.78985595703125, -3.5867919921875, -3.38372802734375, -3.1806640625, -2.97760009765625, -2.7745361328125, -2.57147216796875, -2.368408203125, -2.16534423828125, -1.9622802734375, -1.75921630859375, -1.55615234375, -1.35308837890625, -1.1500244140625, -0.94696044921875, -0.743896484375, -0.54083251953125, -0.3377685546875, -0.13470458984375, 0.068359375, 0.27142333984375, 0.4744873046875, 0.67755126953125, 0.880615234375, 1.08367919921875, 1.2867431640625, 1.48980712890625, 1.69287109375, 1.89593505859375, 2.0989990234375, 2.30206298828125, 2.505126953125, 2.70819091796875, 2.9112548828125, 3.11431884765625, 3.3173828125, 3.52044677734375, 3.7235107421875, 3.92657470703125, 4.129638671875, 4.33270263671875, 4.5357666015625, 4.73883056640625, 4.94189453125, 5.14495849609375, 5.3480224609375, 5.55108642578125, 5.754150390625, 5.95721435546875, 6.1602783203125, 6.36334228515625, 6.56640625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 5.0, 5.0, 10.0, 18.0, 27.0, 48.0, 62.0, 113.0, 150.0, 168.0, 128.0, 80.0, 51.0, 27.0, 28.0, 13.0, 8.0, 15.0, 2.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-7.91796875, -7.7109375, -7.50390625, -7.296875, -7.08984375, -6.8828125, -6.67578125, -6.46875, -6.26171875, -6.0546875, -5.84765625, -5.640625, -5.43359375, -5.2265625, -5.01953125, -4.8125, -4.60546875, -4.3984375, -4.19140625, -3.984375, -3.77734375, -3.5703125, -3.36328125, -3.15625, -2.94921875, -2.7421875, -2.53515625, -2.328125, -2.12109375, -1.9140625, -1.70703125, -1.5, -1.29296875, -1.0859375, -0.87890625, -0.671875, -0.46484375, -0.2578125, -0.05078125, 0.15625, 0.36328125, 0.5703125, 0.77734375, 0.984375, 1.19140625, 1.3984375, 1.60546875, 1.8125, 2.01953125, 2.2265625, 2.43359375, 2.640625, 2.84765625, 3.0546875, 3.26171875, 3.46875, 3.67578125, 3.8828125, 4.08984375, 4.296875, 4.50390625, 4.7109375, 4.91796875, 5.125, 5.33203125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 17.0, 53.0, 163.0, 342.0, 267.0, 104.0, 27.0, 8.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.76846313476562, -137.03875732421875, -131.30906677246094, -125.57936096191406, -119.84967041015625, -114.11996459960938, -108.39026641845703, -102.66056823730469, -96.93087005615234, -91.201171875, -85.47147369384766, -79.74177551269531, -74.01206970214844, -68.28237915039062, -62.55267333984375, -56.822975158691406, -51.09327697753906, -45.36357879638672, -39.633880615234375, -33.904178619384766, -28.174480438232422, -22.444782257080078, -16.71508026123047, -10.985382080078125, -5.255683898925781, 0.4740152359008789, 6.203714370727539, 11.933414459228516, 17.66311264038086, 23.392810821533203, 29.122512817382812, 34.852210998535156, 40.5819091796875, 46.311607360839844, 52.04130554199219, 57.7710075378418, 63.50070571899414, 69.23040771484375, 74.9601058959961, 80.68980407714844, 86.41950225830078, 92.14920043945312, 97.87889862060547, 103.60859680175781, 109.33830261230469, 115.0679931640625, 120.79769897460938, 126.52739715576172, 132.25709533691406, 137.98680114746094, 143.71649169921875, 149.44619750976562, 155.17588806152344, 160.9055938720703, 166.63528442382812, 172.364990234375, 178.09469604492188, 183.82440185546875, 189.55409240722656, 195.28379821777344, 201.01348876953125, 206.74319458007812, 212.472900390625, 218.2025909423828, 223.93228149414062]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 9.0, 8.0, 6.0, 13.0, 12.0, 16.0, 28.0, 24.0, 32.0, 32.0, 38.0, 50.0, 50.0, 53.0, 68.0, 61.0, 71.0, 73.0, 59.0, 42.0, 45.0, 36.0, 27.0, 33.0, 24.0, 16.0, 18.0, 15.0, 12.0, 11.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.93266296386719, -44.89108657836914, -42.849510192871094, -40.80793380737305, -38.766357421875, -36.72477722167969, -34.68320083618164, -32.641624450683594, -30.600048065185547, -28.5584716796875, -26.516895294189453, -24.475317001342773, -22.433740615844727, -20.39216423034668, -18.3505859375, -16.309009552001953, -14.267433166503906, -12.22585678100586, -10.184279441833496, -8.142702102661133, -6.101125717163086, -4.059549331665039, -2.017971992492676, 0.0236053466796875, 2.0651817321777344, 4.1067585945129395, 6.1483354568481445, 8.189912796020508, 10.231489181518555, 12.273065567016602, 14.314642906188965, 16.356220245361328, 18.397796630859375, 20.439373016357422, 22.48094940185547, 24.52252769470215, 26.564104080200195, 28.605680465698242, 30.647258758544922, 32.68883514404297, 34.730411529541016, 36.77198791503906, 38.81356430053711, 40.855140686035156, 42.89672088623047, 44.93829345703125, 46.97987365722656, 49.02145004272461, 51.063026428222656, 53.1046028137207, 55.14617919921875, 57.1877555847168, 59.229331970214844, 61.270912170410156, 63.3124885559082, 65.35406494140625, 67.39564514160156, 69.43722534179688, 71.47879791259766, 73.52037811279297, 75.56195068359375, 77.60353088378906, 79.64510345458984, 81.68668365478516, 83.72825622558594]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 19.0, 8.0, 19.0, 32.0, 57.0, 84.0, 156.0, 361.0, 691.0, 1590.0, 4138.0, 13077.0, 62015.0, 1362135.0, 2634877.0, 90149.0, 16042.0, 4913.0, 1922.0, 892.0, 478.0, 231.0, 134.0, 78.0, 54.0, 29.0, 29.0, 13.0, 14.0, 9.0, 4.0, 1.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.14007568359375, -6.8309326171875, -6.52178955078125, -6.212646484375, -5.90350341796875, -5.5943603515625, -5.28521728515625, -4.97607421875, -4.66693115234375, -4.3577880859375, -4.04864501953125, -3.739501953125, -3.43035888671875, -3.1212158203125, -2.81207275390625, -2.5029296875, -2.19378662109375, -1.8846435546875, -1.57550048828125, -1.266357421875, -0.95721435546875, -0.6480712890625, -0.33892822265625, -0.02978515625, 0.27935791015625, 0.5885009765625, 0.89764404296875, 1.206787109375, 1.51593017578125, 1.8250732421875, 2.13421630859375, 2.443359375, 2.75250244140625, 3.0616455078125, 3.37078857421875, 3.679931640625, 3.98907470703125, 4.2982177734375, 4.60736083984375, 4.91650390625, 5.22564697265625, 5.5347900390625, 5.84393310546875, 6.153076171875, 6.46221923828125, 6.7713623046875, 7.08050537109375, 7.3896484375, 7.69879150390625, 8.0079345703125, 8.31707763671875, 8.626220703125, 8.93536376953125, 9.2445068359375, 9.55364990234375, 9.86279296875, 10.17193603515625, 10.4810791015625, 10.79022216796875, 11.099365234375, 11.40850830078125, 11.7176513671875, 12.02679443359375, 12.3359375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 10.0, 9.0, 21.0, 26.0, 21.0, 37.0, 38.0, 37.0, 67.0, 53.0, 63.0, 77.0, 74.0, 67.0, 71.0, 58.0, 36.0, 51.0, 35.0, 39.0, 24.0, 21.0, 21.0, 10.0, 10.0, 9.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.09808349609375, -2.9539794921875, -2.80987548828125, -2.665771484375, -2.52166748046875, -2.3775634765625, -2.23345947265625, -2.08935546875, -1.94525146484375, -1.8011474609375, -1.65704345703125, -1.512939453125, -1.36883544921875, -1.2247314453125, -1.08062744140625, -0.9365234375, -0.79241943359375, -0.6483154296875, -0.50421142578125, -0.360107421875, -0.21600341796875, -0.0718994140625, 0.07220458984375, 0.21630859375, 0.36041259765625, 0.5045166015625, 0.64862060546875, 0.792724609375, 0.93682861328125, 1.0809326171875, 1.22503662109375, 1.369140625, 1.51324462890625, 1.6573486328125, 1.80145263671875, 1.945556640625, 2.08966064453125, 2.2337646484375, 2.37786865234375, 2.52197265625, 2.66607666015625, 2.8101806640625, 2.95428466796875, 3.098388671875, 3.24249267578125, 3.3865966796875, 3.53070068359375, 3.6748046875, 3.81890869140625, 3.9630126953125, 4.10711669921875, 4.251220703125, 4.39532470703125, 4.5394287109375, 4.68353271484375, 4.82763671875, 4.97174072265625, 5.1158447265625, 5.25994873046875, 5.404052734375, 5.54815673828125, 5.6922607421875, 5.83636474609375, 5.98046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 6.0, 13.0, 14.0, 27.0, 32.0, 47.0, 89.0, 163.0, 327.0, 665.0, 1796.0, 6790.0, 38480.0, 1041383.0, 3028656.0, 62699.0, 9495.0, 2269.0, 743.0, 282.0, 125.0, 67.0, 29.0, 24.0, 20.0, 9.0, 9.0, 4.0, 4.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-18.859375, -18.400634765625, -17.94189453125, -17.483154296875, -17.0244140625, -16.565673828125, -16.10693359375, -15.648193359375, -15.189453125, -14.730712890625, -14.27197265625, -13.813232421875, -13.3544921875, -12.895751953125, -12.43701171875, -11.978271484375, -11.51953125, -11.060791015625, -10.60205078125, -10.143310546875, -9.6845703125, -9.225830078125, -8.76708984375, -8.308349609375, -7.849609375, -7.390869140625, -6.93212890625, -6.473388671875, -6.0146484375, -5.555908203125, -5.09716796875, -4.638427734375, -4.1796875, -3.720947265625, -3.26220703125, -2.803466796875, -2.3447265625, -1.885986328125, -1.42724609375, -0.968505859375, -0.509765625, -0.051025390625, 0.40771484375, 0.866455078125, 1.3251953125, 1.783935546875, 2.24267578125, 2.701416015625, 3.16015625, 3.618896484375, 4.07763671875, 4.536376953125, 4.9951171875, 5.453857421875, 5.91259765625, 6.371337890625, 6.830078125, 7.288818359375, 7.74755859375, 8.206298828125, 8.6650390625, 9.123779296875, 9.58251953125, 10.041259765625, 10.5]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 3.0, 9.0, 11.0, 13.0, 16.0, 29.0, 57.0, 82.0, 153.0, 275.0, 723.0, 1107.0, 761.0, 367.0, 187.0, 79.0, 57.0, 31.0, 34.0, 25.0, 14.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-14.7734375, -14.410888671875, -14.04833984375, -13.685791015625, -13.3232421875, -12.960693359375, -12.59814453125, -12.235595703125, -11.873046875, -11.510498046875, -11.14794921875, -10.785400390625, -10.4228515625, -10.060302734375, -9.69775390625, -9.335205078125, -8.97265625, -8.610107421875, -8.24755859375, -7.885009765625, -7.5224609375, -7.159912109375, -6.79736328125, -6.434814453125, -6.072265625, -5.709716796875, -5.34716796875, -4.984619140625, -4.6220703125, -4.259521484375, -3.89697265625, -3.534423828125, -3.171875, -2.809326171875, -2.44677734375, -2.084228515625, -1.7216796875, -1.359130859375, -0.99658203125, -0.634033203125, -0.271484375, 0.091064453125, 0.45361328125, 0.816162109375, 1.1787109375, 1.541259765625, 1.90380859375, 2.266357421875, 2.62890625, 2.991455078125, 3.35400390625, 3.716552734375, 4.0791015625, 4.441650390625, 4.80419921875, 5.166748046875, 5.529296875, 5.891845703125, 6.25439453125, 6.616943359375, 6.9794921875, 7.342041015625, 7.70458984375, 8.067138671875, 8.4296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 2.0, 5.0, 9.0, 12.0, 14.0, 39.0, 62.0, 111.0, 149.0, 150.0, 146.0, 109.0, 97.0, 49.0, 11.0, 15.0, 6.0, 1.0, 4.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.57435607910156, -71.7668685913086, -68.95938110351562, -66.15189361572266, -63.34440231323242, -60.53691482543945, -57.72942352294922, -54.92193603515625, -52.11444854736328, -49.30696105957031, -46.499473571777344, -43.69198226928711, -40.88449478149414, -38.07700729370117, -35.26951599121094, -32.46202850341797, -29.654541015625, -26.84705352783203, -24.03956413269043, -21.232074737548828, -18.42458724975586, -15.617098808288574, -12.809610366821289, -10.002120971679688, -7.194633483886719, -4.387145042419434, -1.5796566009521484, 1.2278318405151367, 4.035320281982422, 6.842808723449707, 9.650297164916992, 12.457786560058594, 15.265266418457031, 18.07275390625, 20.8802433013916, 23.687732696533203, 26.495220184326172, 29.30270767211914, 32.110198974609375, 34.917686462402344, 37.72517395019531, 40.53266143798828, 43.34014892578125, 46.147640228271484, 48.95512771606445, 51.76261520385742, 54.570106506347656, 57.377593994140625, 60.185081481933594, 62.99256896972656, 65.80005645751953, 68.6075439453125, 71.4150390625, 74.22252655029297, 77.03001403808594, 79.8375015258789, 82.64498901367188, 85.45247650146484, 88.25996398925781, 91.06745147705078, 93.87493896484375, 96.68243408203125, 99.48992156982422, 102.29740905761719, 105.10489654541016]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 9.0, 4.0, 13.0, 9.0, 10.0, 19.0, 15.0, 27.0, 41.0, 23.0, 25.0, 42.0, 33.0, 33.0, 39.0, 52.0, 44.0, 46.0, 43.0, 37.0, 50.0, 50.0, 39.0, 33.0, 23.0, 37.0, 30.0, 17.0, 24.0, 13.0, 20.0, 19.0, 16.0, 13.0, 9.0, 4.0, 5.0, 3.0, 3.0, 0.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-42.422935485839844, -41.133819580078125, -39.844703674316406, -38.55559158325195, -37.266475677490234, -35.977359771728516, -34.68824768066406, -33.399131774902344, -32.110015869140625, -30.820899963378906, -29.53178596496582, -28.242671966552734, -26.953556060791016, -25.664440155029297, -24.37532615661621, -23.086212158203125, -21.797096252441406, -20.507980346679688, -19.2188663482666, -17.929752349853516, -16.640636444091797, -15.351521492004395, -14.062406539916992, -12.77329158782959, -11.484176635742188, -10.195061683654785, -8.905946731567383, -7.6168317794799805, -6.327716827392578, -5.038601875305176, -3.7494869232177734, -2.460371971130371, -1.1712570190429688, 0.1178579330444336, 1.406972885131836, 2.6960878372192383, 3.9852027893066406, 5.274317741394043, 6.563432693481445, 7.852547645568848, 9.14166259765625, 10.430777549743652, 11.719892501831055, 13.009007453918457, 14.29812240600586, 15.587237358093262, 16.876352310180664, 18.16546630859375, 19.45458221435547, 20.743698120117188, 22.032812118530273, 23.32192611694336, 24.611042022705078, 25.900157928466797, 27.189271926879883, 28.47838592529297, 29.767501831054688, 31.056617736816406, 32.345733642578125, 33.63484573364258, 34.9239616394043, 36.213077545166016, 37.50218963623047, 38.79130554199219, 40.080421447753906]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 6.0, 20.0, 18.0, 33.0, 42.0, 91.0, 129.0, 197.0, 363.0, 629.0, 1139.0, 2411.0, 5657.0, 15441.0, 46321.0, 139532.0, 353777.0, 309185.0, 113851.0, 37817.0, 12637.0, 4925.0, 2032.0, 961.0, 489.0, 316.0, 182.0, 112.0, 63.0, 45.0, 32.0, 25.0, 13.0, 14.0, 12.0, 4.0, 8.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.43359375, -6.18524169921875, -5.9368896484375, -5.68853759765625, -5.440185546875, -5.19183349609375, -4.9434814453125, -4.69512939453125, -4.44677734375, -4.19842529296875, -3.9500732421875, -3.70172119140625, -3.453369140625, -3.20501708984375, -2.9566650390625, -2.70831298828125, -2.4599609375, -2.21160888671875, -1.9632568359375, -1.71490478515625, -1.466552734375, -1.21820068359375, -0.9698486328125, -0.72149658203125, -0.47314453125, -0.22479248046875, 0.0235595703125, 0.27191162109375, 0.520263671875, 0.76861572265625, 1.0169677734375, 1.26531982421875, 1.513671875, 1.76202392578125, 2.0103759765625, 2.25872802734375, 2.507080078125, 2.75543212890625, 3.0037841796875, 3.25213623046875, 3.50048828125, 3.74884033203125, 3.9971923828125, 4.24554443359375, 4.493896484375, 4.74224853515625, 4.9906005859375, 5.23895263671875, 5.4873046875, 5.73565673828125, 5.9840087890625, 6.23236083984375, 6.480712890625, 6.72906494140625, 6.9774169921875, 7.22576904296875, 7.47412109375, 7.72247314453125, 7.9708251953125, 8.21917724609375, 8.467529296875, 8.71588134765625, 8.9642333984375, 9.21258544921875, 9.4609375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 6.0, 6.0, 8.0, 7.0, 15.0, 13.0, 18.0, 23.0, 20.0, 26.0, 36.0, 23.0, 38.0, 42.0, 43.0, 46.0, 38.0, 55.0, 45.0, 52.0, 38.0, 49.0, 46.0, 35.0, 51.0, 34.0, 27.0, 26.0, 23.0, 19.0, 20.0, 10.0, 11.0, 11.0, 6.0, 7.0, 5.0, 8.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.09375, -2.9923095703125, -2.890869140625, -2.7894287109375, -2.68798828125, -2.5865478515625, -2.485107421875, -2.3836669921875, -2.2822265625, -2.1807861328125, -2.079345703125, -1.9779052734375, -1.87646484375, -1.7750244140625, -1.673583984375, -1.5721435546875, -1.470703125, -1.3692626953125, -1.267822265625, -1.1663818359375, -1.06494140625, -0.9635009765625, -0.862060546875, -0.7606201171875, -0.6591796875, -0.5577392578125, -0.456298828125, -0.3548583984375, -0.25341796875, -0.1519775390625, -0.050537109375, 0.0509033203125, 0.15234375, 0.2537841796875, 0.355224609375, 0.4566650390625, 0.55810546875, 0.6595458984375, 0.760986328125, 0.8624267578125, 0.9638671875, 1.0653076171875, 1.166748046875, 1.2681884765625, 1.36962890625, 1.4710693359375, 1.572509765625, 1.6739501953125, 1.775390625, 1.8768310546875, 1.978271484375, 2.0797119140625, 2.18115234375, 2.2825927734375, 2.384033203125, 2.4854736328125, 2.5869140625, 2.6883544921875, 2.789794921875, 2.8912353515625, 2.99267578125, 3.0941162109375, 3.195556640625, 3.2969970703125, 3.3984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 14.0, 16.0, 16.0, 27.0, 29.0, 48.0, 73.0, 99.0, 162.0, 228.0, 352.0, 606.0, 1022.0, 2165.0, 6112.0, 28947.0, 281917.0, 658491.0, 53103.0, 9050.0, 2850.0, 1261.0, 666.0, 467.0, 279.0, 167.0, 117.0, 78.0, 44.0, 39.0, 22.0, 17.0, 16.0, 9.0, 9.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.984375, -18.428466796875, -17.87255859375, -17.316650390625, -16.7607421875, -16.204833984375, -15.64892578125, -15.093017578125, -14.537109375, -13.981201171875, -13.42529296875, -12.869384765625, -12.3134765625, -11.757568359375, -11.20166015625, -10.645751953125, -10.08984375, -9.533935546875, -8.97802734375, -8.422119140625, -7.8662109375, -7.310302734375, -6.75439453125, -6.198486328125, -5.642578125, -5.086669921875, -4.53076171875, -3.974853515625, -3.4189453125, -2.863037109375, -2.30712890625, -1.751220703125, -1.1953125, -0.639404296875, -0.08349609375, 0.472412109375, 1.0283203125, 1.584228515625, 2.14013671875, 2.696044921875, 3.251953125, 3.807861328125, 4.36376953125, 4.919677734375, 5.4755859375, 6.031494140625, 6.58740234375, 7.143310546875, 7.69921875, 8.255126953125, 8.81103515625, 9.366943359375, 9.9228515625, 10.478759765625, 11.03466796875, 11.590576171875, 12.146484375, 12.702392578125, 13.25830078125, 13.814208984375, 14.3701171875, 14.926025390625, 15.48193359375, 16.037841796875, 16.59375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 6.0, 8.0, 11.0, 12.0, 15.0, 19.0, 18.0, 17.0, 28.0, 46.0, 49.0, 34.0, 43.0, 53.0, 49.0, 50.0, 66.0, 57.0, 53.0, 50.0, 46.0, 35.0, 32.0, 29.0, 35.0, 22.0, 11.0, 22.0, 12.0, 16.0, 9.0, 11.0, 5.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.3046875, -14.7977294921875, -14.290771484375, -13.7838134765625, -13.27685546875, -12.7698974609375, -12.262939453125, -11.7559814453125, -11.2490234375, -10.7420654296875, -10.235107421875, -9.7281494140625, -9.22119140625, -8.7142333984375, -8.207275390625, -7.7003173828125, -7.193359375, -6.6864013671875, -6.179443359375, -5.6724853515625, -5.16552734375, -4.6585693359375, -4.151611328125, -3.6446533203125, -3.1376953125, -2.6307373046875, -2.123779296875, -1.6168212890625, -1.10986328125, -0.6029052734375, -0.095947265625, 0.4110107421875, 0.91796875, 1.4249267578125, 1.931884765625, 2.4388427734375, 2.94580078125, 3.4527587890625, 3.959716796875, 4.4666748046875, 4.9736328125, 5.4805908203125, 5.987548828125, 6.4945068359375, 7.00146484375, 7.5084228515625, 8.015380859375, 8.5223388671875, 9.029296875, 9.5362548828125, 10.043212890625, 10.5501708984375, 11.05712890625, 11.5640869140625, 12.071044921875, 12.5780029296875, 13.0849609375, 13.5919189453125, 14.098876953125, 14.6058349609375, 15.11279296875, 15.6197509765625, 16.126708984375, 16.6336669921875, 17.140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 7.0, 17.0, 21.0, 42.0, 44.0, 83.0, 137.0, 268.0, 626.0, 2379.0, 26497.0, 953305.0, 60131.0, 3469.0, 755.0, 324.0, 167.0, 96.0, 57.0, 35.0, 25.0, 12.0, 11.0, 10.0, 6.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.921875, -12.5589599609375, -12.196044921875, -11.8331298828125, -11.47021484375, -11.1072998046875, -10.744384765625, -10.3814697265625, -10.0185546875, -9.6556396484375, -9.292724609375, -8.9298095703125, -8.56689453125, -8.2039794921875, -7.841064453125, -7.4781494140625, -7.115234375, -6.7523193359375, -6.389404296875, -6.0264892578125, -5.66357421875, -5.3006591796875, -4.937744140625, -4.5748291015625, -4.2119140625, -3.8489990234375, -3.486083984375, -3.1231689453125, -2.76025390625, -2.3973388671875, -2.034423828125, -1.6715087890625, -1.30859375, -0.9456787109375, -0.582763671875, -0.2198486328125, 0.14306640625, 0.5059814453125, 0.868896484375, 1.2318115234375, 1.5947265625, 1.9576416015625, 2.320556640625, 2.6834716796875, 3.04638671875, 3.4093017578125, 3.772216796875, 4.1351318359375, 4.498046875, 4.8609619140625, 5.223876953125, 5.5867919921875, 5.94970703125, 6.3126220703125, 6.675537109375, 7.0384521484375, 7.4013671875, 7.7642822265625, 8.127197265625, 8.4901123046875, 8.85302734375, 9.2159423828125, 9.578857421875, 9.9417724609375, 10.3046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 11.0, 3.0, 7.0, 11.0, 21.0, 22.0, 26.0, 24.0, 31.0, 43.0, 41.0, 82.0, 140.0, 158.0, 111.0, 71.0, 42.0, 45.0, 23.0, 23.0, 13.0, 14.0, 11.0, 14.0, 5.0, 2.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011844635009765625, -0.0011500716209411621, -0.0011156797409057617, -0.0010812878608703613, -0.001046895980834961, -0.0010125041007995605, -0.0009781122207641602, -0.0009437203407287598, -0.0009093284606933594, -0.000874936580657959, -0.0008405447006225586, -0.0008061528205871582, -0.0007717609405517578, -0.0007373690605163574, -0.000702977180480957, -0.0006685853004455566, -0.0006341934204101562, -0.0005998015403747559, -0.0005654096603393555, -0.0005310177803039551, -0.0004966259002685547, -0.0004622340202331543, -0.0004278421401977539, -0.0003934502601623535, -0.0003590583801269531, -0.00032466650009155273, -0.00029027462005615234, -0.00025588274002075195, -0.00022149085998535156, -0.00018709897994995117, -0.00015270709991455078, -0.00011831521987915039, -8.392333984375e-05, -4.953145980834961e-05, -1.5139579772949219e-05, 1.9252300262451172e-05, 5.364418029785156e-05, 8.803606033325195e-05, 0.00012242794036865234, 0.00015681982040405273, 0.00019121170043945312, 0.00022560358047485352, 0.0002599954605102539, 0.0002943873405456543, 0.0003287792205810547, 0.0003631711006164551, 0.00039756298065185547, 0.00043195486068725586, 0.00046634674072265625, 0.0005007386207580566, 0.000535130500793457, 0.0005695223808288574, 0.0006039142608642578, 0.0006383061408996582, 0.0006726980209350586, 0.000707089900970459, 0.0007414817810058594, 0.0007758736610412598, 0.0008102655410766602, 0.0008446574211120605, 0.0008790493011474609, 0.0009134411811828613, 0.0009478330612182617, 0.0009822249412536621, 0.0010166168212890625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 13.0, 17.0, 11.0, 18.0, 28.0, 40.0, 44.0, 82.0, 102.0, 141.0, 247.0, 385.0, 662.0, 1108.0, 2272.0, 4382.0, 10498.0, 30993.0, 270029.0, 654073.0, 48183.0, 13487.0, 5562.0, 2707.0, 1313.0, 794.0, 461.0, 270.0, 187.0, 131.0, 89.0, 57.0, 45.0, 29.0, 26.0, 14.0, 15.0, 9.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.9453125, -5.75439453125, -5.5634765625, -5.37255859375, -5.181640625, -4.99072265625, -4.7998046875, -4.60888671875, -4.41796875, -4.22705078125, -4.0361328125, -3.84521484375, -3.654296875, -3.46337890625, -3.2724609375, -3.08154296875, -2.890625, -2.69970703125, -2.5087890625, -2.31787109375, -2.126953125, -1.93603515625, -1.7451171875, -1.55419921875, -1.36328125, -1.17236328125, -0.9814453125, -0.79052734375, -0.599609375, -0.40869140625, -0.2177734375, -0.02685546875, 0.1640625, 0.35498046875, 0.5458984375, 0.73681640625, 0.927734375, 1.11865234375, 1.3095703125, 1.50048828125, 1.69140625, 1.88232421875, 2.0732421875, 2.26416015625, 2.455078125, 2.64599609375, 2.8369140625, 3.02783203125, 3.21875, 3.40966796875, 3.6005859375, 3.79150390625, 3.982421875, 4.17333984375, 4.3642578125, 4.55517578125, 4.74609375, 4.93701171875, 5.1279296875, 5.31884765625, 5.509765625, 5.70068359375, 5.8916015625, 6.08251953125, 6.2734375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 8.0, 8.0, 13.0, 18.0, 19.0, 23.0, 52.0, 93.0, 121.0, 157.0, 137.0, 131.0, 77.0, 49.0, 24.0, 13.0, 7.0, 6.0, 6.0, 6.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2734375, -7.04486083984375, -6.8162841796875, -6.58770751953125, -6.359130859375, -6.13055419921875, -5.9019775390625, -5.67340087890625, -5.44482421875, -5.21624755859375, -4.9876708984375, -4.75909423828125, -4.530517578125, -4.30194091796875, -4.0733642578125, -3.84478759765625, -3.6162109375, -3.38763427734375, -3.1590576171875, -2.93048095703125, -2.701904296875, -2.47332763671875, -2.2447509765625, -2.01617431640625, -1.78759765625, -1.55902099609375, -1.3304443359375, -1.10186767578125, -0.873291015625, -0.64471435546875, -0.4161376953125, -0.18756103515625, 0.041015625, 0.26959228515625, 0.4981689453125, 0.72674560546875, 0.955322265625, 1.18389892578125, 1.4124755859375, 1.64105224609375, 1.86962890625, 2.09820556640625, 2.3267822265625, 2.55535888671875, 2.783935546875, 3.01251220703125, 3.2410888671875, 3.46966552734375, 3.6982421875, 3.92681884765625, 4.1553955078125, 4.38397216796875, 4.612548828125, 4.84112548828125, 5.0697021484375, 5.29827880859375, 5.52685546875, 5.75543212890625, 5.9840087890625, 6.21258544921875, 6.441162109375, 6.66973876953125, 6.8983154296875, 7.12689208984375, 7.35546875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 6.0, 14.0, 30.0, 53.0, 112.0, 222.0, 237.0, 135.0, 81.0, 45.0, 19.0, 11.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-132.78964233398438, -129.2099151611328, -125.63018035888672, -122.05044555664062, -118.47071838378906, -114.89098358154297, -111.31124877929688, -107.73152160644531, -104.15179443359375, -100.57205963134766, -96.9923324584961, -93.41259765625, -89.83287048339844, -86.25313568115234, -82.67340087890625, -79.09367370605469, -75.5139389038086, -71.9342041015625, -68.35447692871094, -64.77474212646484, -61.19501495361328, -57.61528015136719, -54.03554916381836, -50.45581817626953, -46.8760871887207, -43.296356201171875, -39.71662521362305, -36.13689422607422, -32.557159423828125, -28.97743034362793, -25.39769744873047, -21.81796646118164, -18.238235473632812, -14.658504486083984, -11.07877254486084, -7.499040603637695, -3.919309616088867, -0.33957862854003906, 3.240154266357422, 6.81988525390625, 10.399616241455078, 13.979347229003906, 17.559078216552734, 21.138811111450195, 24.718542098999023, 28.29827308654785, 31.878005981445312, 35.45773696899414, 39.03746795654297, 42.6171989440918, 46.196929931640625, 49.77666473388672, 53.35639190673828, 56.936126708984375, 60.5158576965332, 64.09558868408203, 67.67532348632812, 71.25505828857422, 74.83478546142578, 78.41452026367188, 81.99424743652344, 85.57398223876953, 89.15371704101562, 92.73344421386719, 96.31317138671875]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 7.0, 8.0, 10.0, 10.0, 7.0, 15.0, 26.0, 24.0, 17.0, 35.0, 33.0, 43.0, 34.0, 28.0, 54.0, 63.0, 64.0, 82.0, 63.0, 43.0, 48.0, 43.0, 26.0, 29.0, 26.0, 27.0, 27.0, 22.0, 13.0, 10.0, 9.0, 9.0, 12.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-64.6934814453125, -62.802001953125, -60.9105224609375, -59.01904296875, -57.1275634765625, -55.236083984375, -53.344600677490234, -51.453121185302734, -49.561641693115234, -47.670162200927734, -45.778682708740234, -43.887203216552734, -41.99571990966797, -40.10424041748047, -38.21276092529297, -36.32128143310547, -34.42980194091797, -32.53832244873047, -30.64684295654297, -28.755361557006836, -26.863882064819336, -24.972402572631836, -23.080921173095703, -21.189441680908203, -19.297962188720703, -17.406482696533203, -15.515002250671387, -13.62352180480957, -11.73204231262207, -9.84056282043457, -7.949082374572754, -6.0576019287109375, -4.1661224365234375, -2.2746424674987793, -0.3831624984741211, 1.508317470550537, 3.3997974395751953, 5.291276931762695, 7.182757377624512, 9.074237823486328, 10.965717315673828, 12.857196807861328, 14.748677253723145, 16.64015769958496, 18.53163719177246, 20.42311668395996, 22.314598083496094, 24.206077575683594, 26.097557067871094, 27.989036560058594, 29.880516052246094, 31.771997451782227, 33.663475036621094, 35.554954528808594, 37.44643783569336, 39.33791732788086, 41.22939682006836, 43.12087631225586, 45.01235580444336, 46.90383529663086, 48.795318603515625, 50.686798095703125, 52.578277587890625, 54.469757080078125, 56.361236572265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 10.0, 14.0, 30.0, 37.0, 38.0, 90.0, 131.0, 240.0, 483.0, 1378.0, 3949.0, 15076.0, 120541.0, 3663463.0, 356716.0, 23795.0, 5194.0, 1620.0, 660.0, 304.0, 163.0, 110.0, 60.0, 56.0, 24.0, 18.0, 22.0, 19.0, 13.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.1640625, -7.8187255859375, -7.473388671875, -7.1280517578125, -6.78271484375, -6.4373779296875, -6.092041015625, -5.7467041015625, -5.4013671875, -5.0560302734375, -4.710693359375, -4.3653564453125, -4.02001953125, -3.6746826171875, -3.329345703125, -2.9840087890625, -2.638671875, -2.2933349609375, -1.947998046875, -1.6026611328125, -1.25732421875, -0.9119873046875, -0.566650390625, -0.2213134765625, 0.1240234375, 0.4693603515625, 0.814697265625, 1.1600341796875, 1.50537109375, 1.8507080078125, 2.196044921875, 2.5413818359375, 2.88671875, 3.2320556640625, 3.577392578125, 3.9227294921875, 4.26806640625, 4.6134033203125, 4.958740234375, 5.3040771484375, 5.6494140625, 5.9947509765625, 6.340087890625, 6.6854248046875, 7.03076171875, 7.3760986328125, 7.721435546875, 8.0667724609375, 8.412109375, 8.7574462890625, 9.102783203125, 9.4481201171875, 9.79345703125, 10.1387939453125, 10.484130859375, 10.8294677734375, 11.1748046875, 11.5201416015625, 11.865478515625, 12.2108154296875, 12.55615234375, 12.9014892578125, 13.246826171875, 13.5921630859375, 13.9375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 5.0, 8.0, 15.0, 15.0, 22.0, 22.0, 27.0, 52.0, 42.0, 44.0, 70.0, 56.0, 64.0, 68.0, 78.0, 68.0, 52.0, 70.0, 52.0, 32.0, 36.0, 30.0, 18.0, 14.0, 12.0, 7.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.53515625, -5.37933349609375, -5.2235107421875, -5.06768798828125, -4.911865234375, -4.75604248046875, -4.6002197265625, -4.44439697265625, -4.28857421875, -4.13275146484375, -3.9769287109375, -3.82110595703125, -3.665283203125, -3.50946044921875, -3.3536376953125, -3.19781494140625, -3.0419921875, -2.88616943359375, -2.7303466796875, -2.57452392578125, -2.418701171875, -2.26287841796875, -2.1070556640625, -1.95123291015625, -1.79541015625, -1.63958740234375, -1.4837646484375, -1.32794189453125, -1.172119140625, -1.01629638671875, -0.8604736328125, -0.70465087890625, -0.548828125, -0.39300537109375, -0.2371826171875, -0.08135986328125, 0.074462890625, 0.23028564453125, 0.3861083984375, 0.54193115234375, 0.69775390625, 0.85357666015625, 1.0093994140625, 1.16522216796875, 1.321044921875, 1.47686767578125, 1.6326904296875, 1.78851318359375, 1.9443359375, 2.10015869140625, 2.2559814453125, 2.41180419921875, 2.567626953125, 2.72344970703125, 2.8792724609375, 3.03509521484375, 3.19091796875, 3.34674072265625, 3.5025634765625, 3.65838623046875, 3.814208984375, 3.97003173828125, 4.1258544921875, 4.28167724609375, 4.4375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 10.0, 10.0, 17.0, 33.0, 51.0, 78.0, 140.0, 173.0, 313.0, 538.0, 936.0, 2099.0, 6000.0, 22725.0, 172764.0, 3672652.0, 271182.0, 31098.0, 7868.0, 2640.0, 1232.0, 671.0, 384.0, 234.0, 157.0, 79.0, 67.0, 39.0, 23.0, 19.0, 12.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.05224609375, -8.6982421875, -8.34423828125, -7.990234375, -7.63623046875, -7.2822265625, -6.92822265625, -6.57421875, -6.22021484375, -5.8662109375, -5.51220703125, -5.158203125, -4.80419921875, -4.4501953125, -4.09619140625, -3.7421875, -3.38818359375, -3.0341796875, -2.68017578125, -2.326171875, -1.97216796875, -1.6181640625, -1.26416015625, -0.91015625, -0.55615234375, -0.2021484375, 0.15185546875, 0.505859375, 0.85986328125, 1.2138671875, 1.56787109375, 1.921875, 2.27587890625, 2.6298828125, 2.98388671875, 3.337890625, 3.69189453125, 4.0458984375, 4.39990234375, 4.75390625, 5.10791015625, 5.4619140625, 5.81591796875, 6.169921875, 6.52392578125, 6.8779296875, 7.23193359375, 7.5859375, 7.93994140625, 8.2939453125, 8.64794921875, 9.001953125, 9.35595703125, 9.7099609375, 10.06396484375, 10.41796875, 10.77197265625, 11.1259765625, 11.47998046875, 11.833984375, 12.18798828125, 12.5419921875, 12.89599609375, 13.25]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 6.0, 2.0, 11.0, 12.0, 12.0, 22.0, 49.0, 68.0, 152.0, 366.0, 866.0, 1279.0, 674.0, 251.0, 115.0, 60.0, 37.0, 28.0, 13.0, 19.0, 15.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1796875, -11.77880859375, -11.3779296875, -10.97705078125, -10.576171875, -10.17529296875, -9.7744140625, -9.37353515625, -8.97265625, -8.57177734375, -8.1708984375, -7.77001953125, -7.369140625, -6.96826171875, -6.5673828125, -6.16650390625, -5.765625, -5.36474609375, -4.9638671875, -4.56298828125, -4.162109375, -3.76123046875, -3.3603515625, -2.95947265625, -2.55859375, -2.15771484375, -1.7568359375, -1.35595703125, -0.955078125, -0.55419921875, -0.1533203125, 0.24755859375, 0.6484375, 1.04931640625, 1.4501953125, 1.85107421875, 2.251953125, 2.65283203125, 3.0537109375, 3.45458984375, 3.85546875, 4.25634765625, 4.6572265625, 5.05810546875, 5.458984375, 5.85986328125, 6.2607421875, 6.66162109375, 7.0625, 7.46337890625, 7.8642578125, 8.26513671875, 8.666015625, 9.06689453125, 9.4677734375, 9.86865234375, 10.26953125, 10.67041015625, 11.0712890625, 11.47216796875, 11.873046875, 12.27392578125, 12.6748046875, 13.07568359375, 13.4765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 25.0, 210.0, 481.0, 213.0, 41.0, 10.0, 5.0, 6.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-278.833984375, -271.5758972167969, -264.3178405761719, -257.05975341796875, -249.80166625976562, -242.54359436035156, -235.2855224609375, -228.02743530273438, -220.7693634033203, -213.51129150390625, -206.25320434570312, -198.99513244628906, -191.737060546875, -184.47897338867188, -177.2209014892578, -169.96282958984375, -162.70474243164062, -155.44667053222656, -148.18858337402344, -140.93051147460938, -133.67242431640625, -126.41435241699219, -119.15628051757812, -111.89820098876953, -104.64012145996094, -97.38204193115234, -90.12396240234375, -82.86589050292969, -75.6078109741211, -68.3497314453125, -61.09165573120117, -53.833580017089844, -46.57550048828125, -39.317420959472656, -32.05934524536133, -24.801267623901367, -17.543190002441406, -10.285110473632812, -3.0270347595214844, 4.231040954589844, 11.489120483398438, 18.7471981048584, 26.00527572631836, 33.26335144042969, 40.52143096923828, 47.779510498046875, 55.0375862121582, 62.29566192626953, 69.55374145507812, 76.81182098388672, 84.06990051269531, 91.32797241210938, 98.58605194091797, 105.84413146972656, 113.10220336914062, 120.36028289794922, 127.61836242675781, 134.87643432617188, 142.134521484375, 149.39259338378906, 156.65066528320312, 163.90875244140625, 171.1668243408203, 178.42489624023438, 185.6829833984375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 10.0, 7.0, 19.0, 19.0, 32.0, 39.0, 59.0, 62.0, 79.0, 123.0, 104.0, 95.0, 83.0, 59.0, 65.0, 39.0, 42.0, 19.0, 24.0, 13.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.65884399414062, -90.26581573486328, -87.87278747558594, -85.47976684570312, -83.08673858642578, -80.69371032714844, -78.30068969726562, -75.90766143798828, -73.51463317871094, -71.1216049194336, -68.72857666015625, -66.33555603027344, -63.942527770996094, -61.54949951171875, -59.15647506713867, -56.763450622558594, -54.37042236328125, -51.977394104003906, -49.58436965942383, -47.19134521484375, -44.798316955566406, -42.40528869628906, -40.012264251708984, -37.619239807128906, -35.22621154785156, -32.83318328857422, -30.44015884399414, -28.04713249206543, -25.65410614013672, -23.261079788208008, -20.868053436279297, -18.475027084350586, -16.08200454711914, -13.68897819519043, -11.295951843261719, -8.902925491333008, -6.509899139404297, -4.116872787475586, -1.723846435546875, 0.6691799163818359, 3.062206268310547, 5.455232620239258, 7.848258972167969, 10.24128532409668, 12.63431167602539, 15.027338027954102, 17.420364379882812, 19.813390731811523, 22.206417083740234, 24.599443435668945, 26.992469787597656, 29.385496139526367, 31.778522491455078, 34.171546936035156, 36.5645751953125, 38.957603454589844, 41.35062789916992, 43.74365234375, 46.136680603027344, 48.52970886230469, 50.922733306884766, 53.315757751464844, 55.70878601074219, 58.10181427001953, 60.49483871459961]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 6.0, 9.0, 15.0, 17.0, 23.0, 40.0, 35.0, 72.0, 92.0, 169.0, 247.0, 389.0, 755.0, 1975.0, 7558.0, 36795.0, 212154.0, 594730.0, 156761.0, 27516.0, 5725.0, 1727.0, 715.0, 376.0, 224.0, 145.0, 86.0, 64.0, 42.0, 22.0, 15.0, 17.0, 8.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.234375, -15.811767578125, -15.38916015625, -14.966552734375, -14.5439453125, -14.121337890625, -13.69873046875, -13.276123046875, -12.853515625, -12.430908203125, -12.00830078125, -11.585693359375, -11.1630859375, -10.740478515625, -10.31787109375, -9.895263671875, -9.47265625, -9.050048828125, -8.62744140625, -8.204833984375, -7.7822265625, -7.359619140625, -6.93701171875, -6.514404296875, -6.091796875, -5.669189453125, -5.24658203125, -4.823974609375, -4.4013671875, -3.978759765625, -3.55615234375, -3.133544921875, -2.7109375, -2.288330078125, -1.86572265625, -1.443115234375, -1.0205078125, -0.597900390625, -0.17529296875, 0.247314453125, 0.669921875, 1.092529296875, 1.51513671875, 1.937744140625, 2.3603515625, 2.782958984375, 3.20556640625, 3.628173828125, 4.05078125, 4.473388671875, 4.89599609375, 5.318603515625, 5.7412109375, 6.163818359375, 6.58642578125, 7.009033203125, 7.431640625, 7.854248046875, 8.27685546875, 8.699462890625, 9.1220703125, 9.544677734375, 9.96728515625, 10.389892578125, 10.8125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 10.0, 7.0, 11.0, 12.0, 14.0, 20.0, 18.0, 37.0, 32.0, 37.0, 46.0, 39.0, 49.0, 43.0, 56.0, 61.0, 74.0, 59.0, 50.0, 56.0, 47.0, 43.0, 38.0, 20.0, 34.0, 23.0, 14.0, 19.0, 8.0, 8.0, 9.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.05859375, -3.926513671875, -3.79443359375, -3.662353515625, -3.5302734375, -3.398193359375, -3.26611328125, -3.134033203125, -3.001953125, -2.869873046875, -2.73779296875, -2.605712890625, -2.4736328125, -2.341552734375, -2.20947265625, -2.077392578125, -1.9453125, -1.813232421875, -1.68115234375, -1.549072265625, -1.4169921875, -1.284912109375, -1.15283203125, -1.020751953125, -0.888671875, -0.756591796875, -0.62451171875, -0.492431640625, -0.3603515625, -0.228271484375, -0.09619140625, 0.035888671875, 0.16796875, 0.300048828125, 0.43212890625, 0.564208984375, 0.6962890625, 0.828369140625, 0.96044921875, 1.092529296875, 1.224609375, 1.356689453125, 1.48876953125, 1.620849609375, 1.7529296875, 1.885009765625, 2.01708984375, 2.149169921875, 2.28125, 2.413330078125, 2.54541015625, 2.677490234375, 2.8095703125, 2.941650390625, 3.07373046875, 3.205810546875, 3.337890625, 3.469970703125, 3.60205078125, 3.734130859375, 3.8662109375, 3.998291015625, 4.13037109375, 4.262451171875, 4.39453125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 12.0, 14.0, 23.0, 20.0, 33.0, 57.0, 89.0, 132.0, 269.0, 483.0, 931.0, 2147.0, 5949.0, 34056.0, 716285.0, 261906.0, 18488.0, 4325.0, 1628.0, 727.0, 350.0, 219.0, 139.0, 84.0, 46.0, 36.0, 15.0, 12.0, 14.0, 18.0, 6.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.296875, -23.5341796875, -22.771484375, -22.0087890625, -21.24609375, -20.4833984375, -19.720703125, -18.9580078125, -18.1953125, -17.4326171875, -16.669921875, -15.9072265625, -15.14453125, -14.3818359375, -13.619140625, -12.8564453125, -12.09375, -11.3310546875, -10.568359375, -9.8056640625, -9.04296875, -8.2802734375, -7.517578125, -6.7548828125, -5.9921875, -5.2294921875, -4.466796875, -3.7041015625, -2.94140625, -2.1787109375, -1.416015625, -0.6533203125, 0.109375, 0.8720703125, 1.634765625, 2.3974609375, 3.16015625, 3.9228515625, 4.685546875, 5.4482421875, 6.2109375, 6.9736328125, 7.736328125, 8.4990234375, 9.26171875, 10.0244140625, 10.787109375, 11.5498046875, 12.3125, 13.0751953125, 13.837890625, 14.6005859375, 15.36328125, 16.1259765625, 16.888671875, 17.6513671875, 18.4140625, 19.1767578125, 19.939453125, 20.7021484375, 21.46484375, 22.2275390625, 22.990234375, 23.7529296875, 24.515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 9.0, 20.0, 26.0, 32.0, 51.0, 57.0, 76.0, 88.0, 73.0, 128.0, 90.0, 86.0, 68.0, 72.0, 41.0, 30.0, 16.0, 11.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.34375, -31.47900390625, -30.6142578125, -29.74951171875, -28.884765625, -28.02001953125, -27.1552734375, -26.29052734375, -25.42578125, -24.56103515625, -23.6962890625, -22.83154296875, -21.966796875, -21.10205078125, -20.2373046875, -19.37255859375, -18.5078125, -17.64306640625, -16.7783203125, -15.91357421875, -15.048828125, -14.18408203125, -13.3193359375, -12.45458984375, -11.58984375, -10.72509765625, -9.8603515625, -8.99560546875, -8.130859375, -7.26611328125, -6.4013671875, -5.53662109375, -4.671875, -3.80712890625, -2.9423828125, -2.07763671875, -1.212890625, -0.34814453125, 0.5166015625, 1.38134765625, 2.24609375, 3.11083984375, 3.9755859375, 4.84033203125, 5.705078125, 6.56982421875, 7.4345703125, 8.29931640625, 9.1640625, 10.02880859375, 10.8935546875, 11.75830078125, 12.623046875, 13.48779296875, 14.3525390625, 15.21728515625, 16.08203125, 16.94677734375, 17.8115234375, 18.67626953125, 19.541015625, 20.40576171875, 21.2705078125, 22.13525390625, 23.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 7.0, 3.0, 8.0, 5.0, 7.0, 4.0, 14.0, 17.0, 15.0, 43.0, 49.0, 94.0, 203.0, 484.0, 1973.0, 18135.0, 953989.0, 68198.0, 3976.0, 754.0, 227.0, 129.0, 60.0, 47.0, 37.0, 15.0, 8.0, 11.0, 6.0, 2.0, 11.0, 3.0, 5.0, 4.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.53125, -14.0577392578125, -13.584228515625, -13.1107177734375, -12.63720703125, -12.1636962890625, -11.690185546875, -11.2166748046875, -10.7431640625, -10.2696533203125, -9.796142578125, -9.3226318359375, -8.84912109375, -8.3756103515625, -7.902099609375, -7.4285888671875, -6.955078125, -6.4815673828125, -6.008056640625, -5.5345458984375, -5.06103515625, -4.5875244140625, -4.114013671875, -3.6405029296875, -3.1669921875, -2.6934814453125, -2.219970703125, -1.7464599609375, -1.27294921875, -0.7994384765625, -0.325927734375, 0.1475830078125, 0.62109375, 1.0946044921875, 1.568115234375, 2.0416259765625, 2.51513671875, 2.9886474609375, 3.462158203125, 3.9356689453125, 4.4091796875, 4.8826904296875, 5.356201171875, 5.8297119140625, 6.30322265625, 6.7767333984375, 7.250244140625, 7.7237548828125, 8.197265625, 8.6707763671875, 9.144287109375, 9.6177978515625, 10.09130859375, 10.5648193359375, 11.038330078125, 11.5118408203125, 11.9853515625, 12.4588623046875, 12.932373046875, 13.4058837890625, 13.87939453125, 14.3529052734375, 14.826416015625, 15.2999267578125, 15.7734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 9.0, 8.0, 16.0, 10.0, 19.0, 30.0, 59.0, 104.0, 219.0, 229.0, 111.0, 59.0, 29.0, 32.0, 13.0, 14.0, 8.0, 5.0, 8.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00125885009765625, -0.0012066066265106201, -0.0011543631553649902, -0.0011021196842193604, -0.0010498762130737305, -0.0009976327419281006, -0.0009453892707824707, -0.0008931457996368408, -0.0008409023284912109, -0.0007886588573455811, -0.0007364153861999512, -0.0006841719150543213, -0.0006319284439086914, -0.0005796849727630615, -0.0005274415016174316, -0.00047519803047180176, -0.0004229545593261719, -0.000370711088180542, -0.0003184676170349121, -0.0002662241458892822, -0.00021398067474365234, -0.00016173720359802246, -0.00010949373245239258, -5.7250261306762695e-05, -5.0067901611328125e-06, 4.723668098449707e-05, 9.948015213012695e-05, 0.00015172362327575684, 0.00020396709442138672, 0.0002562105655670166, 0.0003084540367126465, 0.00036069750785827637, 0.00041294097900390625, 0.00046518445014953613, 0.000517427921295166, 0.0005696713924407959, 0.0006219148635864258, 0.0006741583347320557, 0.0007264018058776855, 0.0007786452770233154, 0.0008308887481689453, 0.0008831322193145752, 0.0009353756904602051, 0.000987619161605835, 0.0010398626327514648, 0.0010921061038970947, 0.0011443495750427246, 0.0011965930461883545, 0.0012488365173339844, 0.0013010799884796143, 0.0013533234596252441, 0.001405566930770874, 0.001457810401916504, 0.0015100538730621338, 0.0015622973442077637, 0.0016145408153533936, 0.0016667842864990234, 0.0017190277576446533, 0.0017712712287902832, 0.001823514699935913, 0.001875758171081543, 0.0019280016422271729, 0.0019802451133728027, 0.0020324885845184326, 0.0020847320556640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 12.0, 12.0, 18.0, 27.0, 44.0, 51.0, 92.0, 127.0, 271.0, 439.0, 903.0, 2230.0, 5820.0, 19107.0, 138240.0, 806383.0, 55323.0, 12081.0, 4155.0, 1602.0, 727.0, 362.0, 174.0, 127.0, 76.0, 54.0, 32.0, 22.0, 17.0, 8.0, 1.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5234375, -8.28875732421875, -8.0540771484375, -7.81939697265625, -7.584716796875, -7.35003662109375, -7.1153564453125, -6.88067626953125, -6.64599609375, -6.41131591796875, -6.1766357421875, -5.94195556640625, -5.707275390625, -5.47259521484375, -5.2379150390625, -5.00323486328125, -4.7685546875, -4.53387451171875, -4.2991943359375, -4.06451416015625, -3.829833984375, -3.59515380859375, -3.3604736328125, -3.12579345703125, -2.89111328125, -2.65643310546875, -2.4217529296875, -2.18707275390625, -1.952392578125, -1.71771240234375, -1.4830322265625, -1.24835205078125, -1.013671875, -0.77899169921875, -0.5443115234375, -0.30963134765625, -0.074951171875, 0.15972900390625, 0.3944091796875, 0.62908935546875, 0.86376953125, 1.09844970703125, 1.3331298828125, 1.56781005859375, 1.802490234375, 2.03717041015625, 2.2718505859375, 2.50653076171875, 2.7412109375, 2.97589111328125, 3.2105712890625, 3.44525146484375, 3.679931640625, 3.91461181640625, 4.1492919921875, 4.38397216796875, 4.61865234375, 4.85333251953125, 5.0880126953125, 5.32269287109375, 5.557373046875, 5.79205322265625, 6.0267333984375, 6.26141357421875, 6.49609375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 8.0, 9.0, 11.0, 7.0, 12.0, 23.0, 41.0, 40.0, 87.0, 134.0, 151.0, 138.0, 105.0, 52.0, 45.0, 20.0, 12.0, 13.0, 14.0, 10.0, 9.0, 8.0, 5.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.99609375, -5.818359375, -5.640625, -5.462890625, -5.28515625, -5.107421875, -4.9296875, -4.751953125, -4.57421875, -4.396484375, -4.21875, -4.041015625, -3.86328125, -3.685546875, -3.5078125, -3.330078125, -3.15234375, -2.974609375, -2.796875, -2.619140625, -2.44140625, -2.263671875, -2.0859375, -1.908203125, -1.73046875, -1.552734375, -1.375, -1.197265625, -1.01953125, -0.841796875, -0.6640625, -0.486328125, -0.30859375, -0.130859375, 0.046875, 0.224609375, 0.40234375, 0.580078125, 0.7578125, 0.935546875, 1.11328125, 1.291015625, 1.46875, 1.646484375, 1.82421875, 2.001953125, 2.1796875, 2.357421875, 2.53515625, 2.712890625, 2.890625, 3.068359375, 3.24609375, 3.423828125, 3.6015625, 3.779296875, 3.95703125, 4.134765625, 4.3125, 4.490234375, 4.66796875, 4.845703125, 5.0234375, 5.201171875, 5.37890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 18.0, 41.0, 114.0, 288.0, 302.0, 128.0, 43.0, 22.0, 13.0, 6.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.38447570800781, -83.46348571777344, -78.54249572753906, -73.62150573730469, -68.70051574707031, -63.77952194213867, -58.85852813720703, -53.937538146972656, -49.01654815673828, -44.095558166503906, -39.17456817626953, -34.25357437133789, -29.332584381103516, -24.41159439086914, -19.490602493286133, -14.569610595703125, -9.64862060546875, -4.727629661560059, 0.1933612823486328, 5.114352226257324, 10.035343170166016, 14.95633316040039, 19.8773250579834, 24.798316955566406, 29.71930694580078, 34.640296936035156, 39.56128692626953, 44.48228073120117, 49.40327072143555, 54.32426071166992, 59.24525451660156, 64.16624450683594, 69.08721923828125, 74.00820922851562, 78.92919921875, 83.85018920898438, 88.77117919921875, 93.69216918945312, 98.61316680908203, 103.5341567993164, 108.45514678955078, 113.37613677978516, 118.29712677001953, 123.2181167602539, 128.1391143798828, 133.0601043701172, 137.98109436035156, 142.90208435058594, 147.8230743408203, 152.7440643310547, 157.66505432128906, 162.58604431152344, 167.5070343017578, 172.4280242919922, 177.34901428222656, 182.27001953125, 187.19100952148438, 192.11199951171875, 197.03298950195312, 201.9539794921875, 206.87496948242188, 211.79595947265625, 216.71694946289062, 221.637939453125, 226.55892944335938]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 10.0, 14.0, 13.0, 20.0, 36.0, 26.0, 54.0, 52.0, 60.0, 84.0, 105.0, 94.0, 98.0, 83.0, 50.0, 50.0, 29.0, 33.0, 24.0, 19.0, 9.0, 13.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-100.71033477783203, -97.87418365478516, -95.03803253173828, -92.2018814086914, -89.36573028564453, -86.52957916259766, -83.69342803955078, -80.8572769165039, -78.02112579345703, -75.18497467041016, -72.34882354736328, -69.5126724243164, -66.67652130126953, -63.840370178222656, -61.00421905517578, -58.168067932128906, -55.33191680908203, -52.495765686035156, -49.65961456298828, -46.823463439941406, -43.98731231689453, -41.151161193847656, -38.31501007080078, -35.478858947753906, -32.64270782470703, -29.806556701660156, -26.97040557861328, -24.134254455566406, -21.29810333251953, -18.461952209472656, -15.625801086425781, -12.789649963378906, -9.9534912109375, -7.117340087890625, -4.28118896484375, -1.445037841796875, 1.39111328125, 4.227264404296875, 7.06341552734375, 9.899566650390625, 12.7357177734375, 15.571868896484375, 18.40802001953125, 21.244171142578125, 24.080322265625, 26.916473388671875, 29.75262451171875, 32.588775634765625, 35.4249267578125, 38.261077880859375, 41.09722900390625, 43.933380126953125, 46.76953125, 49.605682373046875, 52.44183349609375, 55.277984619140625, 58.1141357421875, 60.950286865234375, 63.78643798828125, 66.62258911132812, 69.458740234375, 72.29489135742188, 75.13104248046875, 77.96719360351562, 80.8033447265625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 9.0, 12.0, 17.0, 21.0, 33.0, 53.0, 95.0, 170.0, 326.0, 658.0, 1818.0, 5588.0, 27609.0, 1860149.0, 2260511.0, 28972.0, 5233.0, 1586.0, 635.0, 311.0, 158.0, 94.0, 62.0, 40.0, 22.0, 17.0, 18.0, 8.0, 9.0, 5.0, 11.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.859375, -12.400390625, -11.94140625, -11.482421875, -11.0234375, -10.564453125, -10.10546875, -9.646484375, -9.1875, -8.728515625, -8.26953125, -7.810546875, -7.3515625, -6.892578125, -6.43359375, -5.974609375, -5.515625, -5.056640625, -4.59765625, -4.138671875, -3.6796875, -3.220703125, -2.76171875, -2.302734375, -1.84375, -1.384765625, -0.92578125, -0.466796875, -0.0078125, 0.451171875, 0.91015625, 1.369140625, 1.828125, 2.287109375, 2.74609375, 3.205078125, 3.6640625, 4.123046875, 4.58203125, 5.041015625, 5.5, 5.958984375, 6.41796875, 6.876953125, 7.3359375, 7.794921875, 8.25390625, 8.712890625, 9.171875, 9.630859375, 10.08984375, 10.548828125, 11.0078125, 11.466796875, 11.92578125, 12.384765625, 12.84375, 13.302734375, 13.76171875, 14.220703125, 14.6796875, 15.138671875, 15.59765625, 16.056640625, 16.515625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 8.0, 10.0, 20.0, 22.0, 55.0, 56.0, 68.0, 89.0, 92.0, 117.0, 101.0, 96.0, 90.0, 67.0, 48.0, 29.0, 19.0, 11.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44921875, -6.21575927734375, -5.9822998046875, -5.74884033203125, -5.515380859375, -5.28192138671875, -5.0484619140625, -4.81500244140625, -4.58154296875, -4.34808349609375, -4.1146240234375, -3.88116455078125, -3.647705078125, -3.41424560546875, -3.1807861328125, -2.94732666015625, -2.7138671875, -2.48040771484375, -2.2469482421875, -2.01348876953125, -1.780029296875, -1.54656982421875, -1.3131103515625, -1.07965087890625, -0.84619140625, -0.61273193359375, -0.3792724609375, -0.14581298828125, 0.087646484375, 0.32110595703125, 0.5545654296875, 0.78802490234375, 1.021484375, 1.25494384765625, 1.4884033203125, 1.72186279296875, 1.955322265625, 2.18878173828125, 2.4222412109375, 2.65570068359375, 2.88916015625, 3.12261962890625, 3.3560791015625, 3.58953857421875, 3.822998046875, 4.05645751953125, 4.2899169921875, 4.52337646484375, 4.7568359375, 4.99029541015625, 5.2237548828125, 5.45721435546875, 5.690673828125, 5.92413330078125, 6.1575927734375, 6.39105224609375, 6.62451171875, 6.85797119140625, 7.0914306640625, 7.32489013671875, 7.558349609375, 7.79180908203125, 8.0252685546875, 8.25872802734375, 8.4921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 9.0, 14.0, 20.0, 40.0, 69.0, 120.0, 175.0, 249.0, 508.0, 960.0, 1995.0, 5650.0, 41694.0, 3973014.0, 155708.0, 9274.0, 2431.0, 1064.0, 568.0, 320.0, 153.0, 84.0, 48.0, 29.0, 29.0, 13.0, 12.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.328125, -19.643310546875, -18.95849609375, -18.273681640625, -17.5888671875, -16.904052734375, -16.21923828125, -15.534423828125, -14.849609375, -14.164794921875, -13.47998046875, -12.795166015625, -12.1103515625, -11.425537109375, -10.74072265625, -10.055908203125, -9.37109375, -8.686279296875, -8.00146484375, -7.316650390625, -6.6318359375, -5.947021484375, -5.26220703125, -4.577392578125, -3.892578125, -3.207763671875, -2.52294921875, -1.838134765625, -1.1533203125, -0.468505859375, 0.21630859375, 0.901123046875, 1.5859375, 2.270751953125, 2.95556640625, 3.640380859375, 4.3251953125, 5.010009765625, 5.69482421875, 6.379638671875, 7.064453125, 7.749267578125, 8.43408203125, 9.118896484375, 9.8037109375, 10.488525390625, 11.17333984375, 11.858154296875, 12.54296875, 13.227783203125, 13.91259765625, 14.597412109375, 15.2822265625, 15.967041015625, 16.65185546875, 17.336669921875, 18.021484375, 18.706298828125, 19.39111328125, 20.075927734375, 20.7607421875, 21.445556640625, 22.13037109375, 22.815185546875, 23.5]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 6.0, 9.0, 30.0, 48.0, 165.0, 1187.0, 2217.0, 313.0, 53.0, 23.0, 14.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.9375, -36.04052734375, -35.1435546875, -34.24658203125, -33.349609375, -32.45263671875, -31.5556640625, -30.65869140625, -29.76171875, -28.86474609375, -27.9677734375, -27.07080078125, -26.173828125, -25.27685546875, -24.3798828125, -23.48291015625, -22.5859375, -21.68896484375, -20.7919921875, -19.89501953125, -18.998046875, -18.10107421875, -17.2041015625, -16.30712890625, -15.41015625, -14.51318359375, -13.6162109375, -12.71923828125, -11.822265625, -10.92529296875, -10.0283203125, -9.13134765625, -8.234375, -7.33740234375, -6.4404296875, -5.54345703125, -4.646484375, -3.74951171875, -2.8525390625, -1.95556640625, -1.05859375, -0.16162109375, 0.7353515625, 1.63232421875, 2.529296875, 3.42626953125, 4.3232421875, 5.22021484375, 6.1171875, 7.01416015625, 7.9111328125, 8.80810546875, 9.705078125, 10.60205078125, 11.4990234375, 12.39599609375, 13.29296875, 14.18994140625, 15.0869140625, 15.98388671875, 16.880859375, 17.77783203125, 18.6748046875, 19.57177734375, 20.46875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 31.0, 197.0, 505.0, 197.0, 33.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-330.3117980957031, -322.5531311035156, -314.7944641113281, -307.03582763671875, -299.27716064453125, -291.51849365234375, -283.75982666015625, -276.00115966796875, -268.2425231933594, -260.4838562011719, -252.72520446777344, -244.96653747558594, -237.2078857421875, -229.44921875, -221.6905517578125, -213.93190002441406, -206.17323303222656, -198.41456604003906, -190.65591430664062, -182.89724731445312, -175.1385955810547, -167.3799285888672, -159.62127685546875, -151.86260986328125, -144.10394287109375, -136.34527587890625, -128.5866241455078, -120.82795715332031, -113.06930541992188, -105.31063842773438, -97.5519790649414, -89.79331970214844, -82.03466796875, -74.27600860595703, -66.51734924316406, -58.75868606567383, -51.00002670288086, -43.24136734008789, -35.482704162597656, -27.724044799804688, -19.96538543701172, -12.206725120544434, -4.448064804077148, 3.310596466064453, 11.069255828857422, 18.82791519165039, 26.586578369140625, 34.345237731933594, 42.10389709472656, 49.86255645751953, 57.6212158203125, 65.3798828125, 73.13853454589844, 80.89720153808594, 88.6558609008789, 96.41452026367188, 104.17317962646484, 111.93183898925781, 119.69049835205078, 127.44915771484375, 135.20782470703125, 142.9664764404297, 150.7251434326172, 158.48379516601562, 166.24246215820312]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 45.0, 94.0, 142.0, 166.0, 175.0, 177.0, 100.0, 55.0, 26.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.42202758789062, -178.0589141845703, -173.69580078125, -169.3326873779297, -164.96957397460938, -160.60647583007812, -156.2433624267578, -151.8802490234375, -147.5171356201172, -143.15402221679688, -138.79090881347656, -134.42779541015625, -130.064697265625, -125.70157623291016, -121.33847045898438, -116.97535705566406, -112.61224365234375, -108.24913024902344, -103.88601684570312, -99.52291107177734, -95.15979766845703, -90.79668426513672, -86.43357849121094, -82.07046508789062, -77.70735168457031, -73.34423828125, -68.98112487792969, -64.6180191040039, -60.254905700683594, -55.89179229736328, -51.528682708740234, -47.16557312011719, -42.802467346191406, -38.439353942871094, -34.07624435424805, -29.713132858276367, -25.350021362304688, -20.986909866333008, -16.623798370361328, -12.260686874389648, -7.897575378417969, -3.534463882446289, 0.8286476135253906, 5.19175910949707, 9.55487060546875, 13.91798210144043, 18.28109359741211, 22.64420509338379, 27.00731658935547, 31.37042808532715, 35.73353958129883, 40.096649169921875, 44.45976257324219, 48.8228759765625, 53.18598556518555, 57.549095153808594, 61.912208557128906, 66.27532196044922, 70.638427734375, 75.00154113769531, 79.36465454101562, 83.72776794433594, 88.09088134765625, 92.45398712158203, 96.81710052490234]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 15.0, 21.0, 30.0, 37.0, 48.0, 86.0, 147.0, 267.0, 498.0, 1111.0, 3865.0, 19724.0, 147288.0, 654211.0, 189484.0, 24495.0, 4679.0, 1269.0, 506.0, 272.0, 171.0, 97.0, 61.0, 42.0, 34.0, 19.0, 13.0, 9.0, 6.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-16.3125, -15.878173828125, -15.44384765625, -15.009521484375, -14.5751953125, -14.140869140625, -13.70654296875, -13.272216796875, -12.837890625, -12.403564453125, -11.96923828125, -11.534912109375, -11.1005859375, -10.666259765625, -10.23193359375, -9.797607421875, -9.36328125, -8.928955078125, -8.49462890625, -8.060302734375, -7.6259765625, -7.191650390625, -6.75732421875, -6.322998046875, -5.888671875, -5.454345703125, -5.02001953125, -4.585693359375, -4.1513671875, -3.717041015625, -3.28271484375, -2.848388671875, -2.4140625, -1.979736328125, -1.54541015625, -1.111083984375, -0.6767578125, -0.242431640625, 0.19189453125, 0.626220703125, 1.060546875, 1.494873046875, 1.92919921875, 2.363525390625, 2.7978515625, 3.232177734375, 3.66650390625, 4.100830078125, 4.53515625, 4.969482421875, 5.40380859375, 5.838134765625, 6.2724609375, 6.706787109375, 7.14111328125, 7.575439453125, 8.009765625, 8.444091796875, 8.87841796875, 9.312744140625, 9.7470703125, 10.181396484375, 10.61572265625, 11.050048828125, 11.484375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 24.0, 19.0, 35.0, 50.0, 71.0, 76.0, 101.0, 102.0, 109.0, 101.0, 83.0, 66.0, 46.0, 42.0, 34.0, 15.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.64508056640625, -5.4190673828125, -5.19305419921875, -4.967041015625, -4.74102783203125, -4.5150146484375, -4.28900146484375, -4.06298828125, -3.83697509765625, -3.6109619140625, -3.38494873046875, -3.158935546875, -2.93292236328125, -2.7069091796875, -2.48089599609375, -2.2548828125, -2.02886962890625, -1.8028564453125, -1.57684326171875, -1.350830078125, -1.12481689453125, -0.8988037109375, -0.67279052734375, -0.44677734375, -0.22076416015625, 0.0052490234375, 0.23126220703125, 0.457275390625, 0.68328857421875, 0.9093017578125, 1.13531494140625, 1.361328125, 1.58734130859375, 1.8133544921875, 2.03936767578125, 2.265380859375, 2.49139404296875, 2.7174072265625, 2.94342041015625, 3.16943359375, 3.39544677734375, 3.6214599609375, 3.84747314453125, 4.073486328125, 4.29949951171875, 4.5255126953125, 4.75152587890625, 4.9775390625, 5.20355224609375, 5.4295654296875, 5.65557861328125, 5.881591796875, 6.10760498046875, 6.3336181640625, 6.55963134765625, 6.78564453125, 7.01165771484375, 7.2376708984375, 7.46368408203125, 7.689697265625, 7.91571044921875, 8.1417236328125, 8.36773681640625, 8.59375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 6.0, 9.0, 16.0, 11.0, 28.0, 42.0, 57.0, 66.0, 76.0, 122.0, 200.0, 396.0, 649.0, 1348.0, 3019.0, 7457.0, 20871.0, 67771.0, 253475.0, 529922.0, 111669.0, 32309.0, 10901.0, 4281.0, 1703.0, 851.0, 496.0, 260.0, 155.0, 110.0, 70.0, 49.0, 33.0, 30.0, 20.0, 19.0, 15.0, 5.0, 6.0, 4.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.4296875, -7.1751708984375, -6.920654296875, -6.6661376953125, -6.41162109375, -6.1571044921875, -5.902587890625, -5.6480712890625, -5.3935546875, -5.1390380859375, -4.884521484375, -4.6300048828125, -4.37548828125, -4.1209716796875, -3.866455078125, -3.6119384765625, -3.357421875, -3.1029052734375, -2.848388671875, -2.5938720703125, -2.33935546875, -2.0848388671875, -1.830322265625, -1.5758056640625, -1.3212890625, -1.0667724609375, -0.812255859375, -0.5577392578125, -0.30322265625, -0.0487060546875, 0.205810546875, 0.4603271484375, 0.71484375, 0.9693603515625, 1.223876953125, 1.4783935546875, 1.73291015625, 1.9874267578125, 2.241943359375, 2.4964599609375, 2.7509765625, 3.0054931640625, 3.260009765625, 3.5145263671875, 3.76904296875, 4.0235595703125, 4.278076171875, 4.5325927734375, 4.787109375, 5.0416259765625, 5.296142578125, 5.5506591796875, 5.80517578125, 6.0596923828125, 6.314208984375, 6.5687255859375, 6.8232421875, 7.0777587890625, 7.332275390625, 7.5867919921875, 7.84130859375, 8.0958251953125, 8.350341796875, 8.6048583984375, 8.859375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 4.0, 5.0, 8.0, 8.0, 13.0, 8.0, 17.0, 15.0, 22.0, 29.0, 24.0, 29.0, 36.0, 37.0, 48.0, 46.0, 40.0, 42.0, 60.0, 53.0, 53.0, 40.0, 40.0, 40.0, 39.0, 27.0, 42.0, 27.0, 29.0, 17.0, 21.0, 16.0, 17.0, 10.0, 11.0, 5.0, 8.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.53125, -10.1435546875, -9.755859375, -9.3681640625, -8.98046875, -8.5927734375, -8.205078125, -7.8173828125, -7.4296875, -7.0419921875, -6.654296875, -6.2666015625, -5.87890625, -5.4912109375, -5.103515625, -4.7158203125, -4.328125, -3.9404296875, -3.552734375, -3.1650390625, -2.77734375, -2.3896484375, -2.001953125, -1.6142578125, -1.2265625, -0.8388671875, -0.451171875, -0.0634765625, 0.32421875, 0.7119140625, 1.099609375, 1.4873046875, 1.875, 2.2626953125, 2.650390625, 3.0380859375, 3.42578125, 3.8134765625, 4.201171875, 4.5888671875, 4.9765625, 5.3642578125, 5.751953125, 6.1396484375, 6.52734375, 6.9150390625, 7.302734375, 7.6904296875, 8.078125, 8.4658203125, 8.853515625, 9.2412109375, 9.62890625, 10.0166015625, 10.404296875, 10.7919921875, 11.1796875, 11.5673828125, 11.955078125, 12.3427734375, 12.73046875, 13.1181640625, 13.505859375, 13.8935546875, 14.28125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 7.0, 8.0, 13.0, 15.0, 29.0, 48.0, 80.0, 171.0, 433.0, 1125.0, 4055.0, 17602.0, 110747.0, 764554.0, 124065.0, 19078.0, 4372.0, 1295.0, 425.0, 202.0, 105.0, 46.0, 26.0, 16.0, 18.0, 8.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.0859375, -3.9375, -3.7890625, -3.640625, -3.4921875, -3.34375, -3.1953125, -3.046875, -2.8984375, -2.75, -2.6015625, -2.453125, -2.3046875, -2.15625, -2.0078125, -1.859375, -1.7109375, -1.5625, -1.4140625, -1.265625, -1.1171875, -0.96875, -0.8203125, -0.671875, -0.5234375, -0.375, -0.2265625, -0.078125, 0.0703125, 0.21875, 0.3671875, 0.515625, 0.6640625, 0.8125, 0.9609375, 1.109375, 1.2578125, 1.40625, 1.5546875, 1.703125, 1.8515625, 2.0, 2.1484375, 2.296875, 2.4453125, 2.59375, 2.7421875, 2.890625, 3.0390625, 3.1875, 3.3359375, 3.484375, 3.6328125, 3.78125, 3.9296875, 4.078125, 4.2265625, 4.375, 4.5234375, 4.671875, 4.8203125, 4.96875, 5.1171875, 5.265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 7.0, 10.0, 18.0, 27.0, 29.0, 45.0, 73.0, 91.0, 115.0, 144.0, 116.0, 90.0, 76.0, 27.0, 29.0, 29.0, 9.0, 11.0, 5.0, 10.0, 6.0, 5.0, 3.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010929107666015625, -0.001061178743839264, -0.0010294467210769653, -0.0009977146983146667, -0.0009659826755523682, -0.0009342506527900696, -0.000902518630027771, -0.0008707866072654724, -0.0008390545845031738, -0.0008073225617408752, -0.0007755905389785767, -0.0007438585162162781, -0.0007121264934539795, -0.0006803944706916809, -0.0006486624479293823, -0.0006169304251670837, -0.0005851984024047852, -0.0005534663796424866, -0.000521734356880188, -0.0004900023341178894, -0.0004582703113555908, -0.00042653828859329224, -0.00039480626583099365, -0.00036307424306869507, -0.0003313422203063965, -0.0002996101975440979, -0.0002678781747817993, -0.00023614615201950073, -0.00020441412925720215, -0.00017268210649490356, -0.00014095008373260498, -0.0001092180609703064, -7.748603820800781e-05, -4.575401544570923e-05, -1.4021992683410645e-05, 1.771003007888794e-05, 4.9442052841186523e-05, 8.117407560348511e-05, 0.00011290609836578369, 0.00014463812112808228, 0.00017637014389038086, 0.00020810216665267944, 0.00023983418941497803, 0.0002715662121772766, 0.0003032982349395752, 0.0003350302577018738, 0.00036676228046417236, 0.00039849430322647095, 0.00043022632598876953, 0.0004619583487510681, 0.0004936903715133667, 0.0005254223942756653, 0.0005571544170379639, 0.0005888864398002625, 0.000620618462562561, 0.0006523504853248596, 0.0006840825080871582, 0.0007158145308494568, 0.0007475465536117554, 0.000779278576374054, 0.0008110105991363525, 0.0008427426218986511, 0.0008744746446609497, 0.0009062066674232483, 0.0009379386901855469]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 10.0, 9.0, 16.0, 23.0, 35.0, 57.0, 62.0, 136.0, 208.0, 384.0, 795.0, 1726.0, 3939.0, 10364.0, 33388.0, 140019.0, 640676.0, 160682.0, 36846.0, 11363.0, 4253.0, 1773.0, 823.0, 410.0, 208.0, 137.0, 79.0, 45.0, 30.0, 22.0, 7.0, 16.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.2734375, -3.162628173828125, -3.05181884765625, -2.941009521484375, -2.8302001953125, -2.719390869140625, -2.60858154296875, -2.497772216796875, -2.386962890625, -2.276153564453125, -2.16534423828125, -2.054534912109375, -1.9437255859375, -1.832916259765625, -1.72210693359375, -1.611297607421875, -1.50048828125, -1.389678955078125, -1.27886962890625, -1.168060302734375, -1.0572509765625, -0.946441650390625, -0.83563232421875, -0.724822998046875, -0.614013671875, -0.503204345703125, -0.39239501953125, -0.281585693359375, -0.1707763671875, -0.059967041015625, 0.05084228515625, 0.161651611328125, 0.2724609375, 0.383270263671875, 0.49407958984375, 0.604888916015625, 0.7156982421875, 0.826507568359375, 0.93731689453125, 1.048126220703125, 1.158935546875, 1.269744873046875, 1.38055419921875, 1.491363525390625, 1.6021728515625, 1.712982177734375, 1.82379150390625, 1.934600830078125, 2.04541015625, 2.156219482421875, 2.26702880859375, 2.377838134765625, 2.4886474609375, 2.599456787109375, 2.71026611328125, 2.821075439453125, 2.931884765625, 3.042694091796875, 3.15350341796875, 3.264312744140625, 3.3751220703125, 3.485931396484375, 3.59674072265625, 3.707550048828125, 3.818359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 6.0, 3.0, 5.0, 4.0, 12.0, 16.0, 17.0, 29.0, 30.0, 44.0, 48.0, 55.0, 74.0, 91.0, 102.0, 79.0, 79.0, 71.0, 59.0, 37.0, 43.0, 19.0, 22.0, 10.0, 8.0, 13.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.21875, -3.116912841796875, -3.01507568359375, -2.913238525390625, -2.8114013671875, -2.709564208984375, -2.60772705078125, -2.505889892578125, -2.404052734375, -2.302215576171875, -2.20037841796875, -2.098541259765625, -1.9967041015625, -1.894866943359375, -1.79302978515625, -1.691192626953125, -1.58935546875, -1.487518310546875, -1.38568115234375, -1.283843994140625, -1.1820068359375, -1.080169677734375, -0.97833251953125, -0.876495361328125, -0.774658203125, -0.672821044921875, -0.57098388671875, -0.469146728515625, -0.3673095703125, -0.265472412109375, -0.16363525390625, -0.061798095703125, 0.0400390625, 0.141876220703125, 0.24371337890625, 0.345550537109375, 0.4473876953125, 0.549224853515625, 0.65106201171875, 0.752899169921875, 0.854736328125, 0.956573486328125, 1.05841064453125, 1.160247802734375, 1.2620849609375, 1.363922119140625, 1.46575927734375, 1.567596435546875, 1.66943359375, 1.771270751953125, 1.87310791015625, 1.974945068359375, 2.0767822265625, 2.178619384765625, 2.28045654296875, 2.382293701171875, 2.484130859375, 2.585968017578125, 2.68780517578125, 2.789642333984375, 2.8914794921875, 2.993316650390625, 3.09515380859375, 3.196990966796875, 3.298828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 10.0, 7.0, 18.0, 37.0, 55.0, 129.0, 206.0, 240.0, 141.0, 73.0, 35.0, 25.0, 12.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.13380432128906, -81.34127807617188, -78.54875183105469, -75.7562255859375, -72.96369934082031, -70.1711654663086, -67.3786392211914, -64.58611297607422, -61.79358673095703, -59.001060485839844, -56.208534240722656, -53.4160041809082, -50.623477935791016, -47.83095169067383, -45.038421630859375, -42.24589538574219, -39.453369140625, -36.66084289550781, -33.868316650390625, -31.075786590576172, -28.283260345458984, -25.490734100341797, -22.698205947875977, -19.905677795410156, -17.11315155029297, -14.320624351501465, -11.528097152709961, -8.735569953918457, -5.943042755126953, -3.150515556335449, -0.3579883575439453, 2.434539794921875, 5.2270660400390625, 8.019593238830566, 10.81212043762207, 13.604647636413574, 16.397174835205078, 19.189701080322266, 21.982229232788086, 24.774757385253906, 27.567283630371094, 30.35980987548828, 33.15233612060547, 35.94486618041992, 38.73739242553711, 41.5299186706543, 44.32244873046875, 47.11497497558594, 49.907501220703125, 52.70002746582031, 55.4925537109375, 58.28508377075195, 61.07761001586914, 63.87013626098633, 66.66266632080078, 69.45519256591797, 72.24771881103516, 75.04024505615234, 77.83277130126953, 80.62529754638672, 83.41783142089844, 86.21035766601562, 89.00288391113281, 91.79541015625, 94.58793640136719]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 7.0, 16.0, 15.0, 25.0, 29.0, 33.0, 43.0, 57.0, 66.0, 79.0, 124.0, 132.0, 85.0, 51.0, 44.0, 49.0, 33.0, 29.0, 28.0, 16.0, 14.0, 8.0, 6.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.0905990600586, -94.52985382080078, -91.9691162109375, -89.40837097167969, -86.8476333618164, -84.2868881225586, -81.72615051269531, -79.1654052734375, -76.60466003417969, -74.04391479492188, -71.4831771850586, -68.92243194580078, -66.3616943359375, -63.80094909667969, -61.24020767211914, -58.679466247558594, -56.11872863769531, -53.557987213134766, -50.99724578857422, -48.43650436401367, -45.875762939453125, -43.31501770019531, -40.754276275634766, -38.19353485107422, -35.63279342651367, -33.072052001953125, -30.511310577392578, -27.9505672454834, -25.38982582092285, -22.829084396362305, -20.268341064453125, -17.707599639892578, -15.1468505859375, -12.586109161376953, -10.02536678314209, -7.464624881744385, -4.90388298034668, -2.343141555786133, 0.21760082244873047, 2.7783432006835938, 5.339084625244141, 7.899826526641846, 10.46056842803955, 13.021310806274414, 15.582052230834961, 18.142793655395508, 20.703536987304688, 23.264278411865234, 25.82501983642578, 28.385761260986328, 30.946502685546875, 33.50724411010742, 36.06798553466797, 38.62873077392578, 41.18947219848633, 43.750213623046875, 46.31095504760742, 48.87169647216797, 51.432437896728516, 53.99317932128906, 56.553924560546875, 59.114662170410156, 61.67540740966797, 64.23614501953125, 66.79689025878906]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 5.0, 4.0, 12.0, 18.0, 21.0, 29.0, 43.0, 82.0, 196.0, 403.0, 913.0, 2432.0, 7380.0, 32944.0, 1604548.0, 2489635.0, 43256.0, 8166.0, 2492.0, 929.0, 379.0, 160.0, 81.0, 42.0, 28.0, 23.0, 21.0, 4.0, 8.0, 2.0, 6.0, 8.0, 2.0, 0.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6953125, -10.3271484375, -9.958984375, -9.5908203125, -9.22265625, -8.8544921875, -8.486328125, -8.1181640625, -7.75, -7.3818359375, -7.013671875, -6.6455078125, -6.27734375, -5.9091796875, -5.541015625, -5.1728515625, -4.8046875, -4.4365234375, -4.068359375, -3.7001953125, -3.33203125, -2.9638671875, -2.595703125, -2.2275390625, -1.859375, -1.4912109375, -1.123046875, -0.7548828125, -0.38671875, -0.0185546875, 0.349609375, 0.7177734375, 1.0859375, 1.4541015625, 1.822265625, 2.1904296875, 2.55859375, 2.9267578125, 3.294921875, 3.6630859375, 4.03125, 4.3994140625, 4.767578125, 5.1357421875, 5.50390625, 5.8720703125, 6.240234375, 6.6083984375, 6.9765625, 7.3447265625, 7.712890625, 8.0810546875, 8.44921875, 8.8173828125, 9.185546875, 9.5537109375, 9.921875, 10.2900390625, 10.658203125, 11.0263671875, 11.39453125, 11.7626953125, 12.130859375, 12.4990234375, 12.8671875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 6.0, 13.0, 9.0, 18.0, 26.0, 29.0, 36.0, 48.0, 61.0, 64.0, 70.0, 63.0, 88.0, 89.0, 73.0, 71.0, 62.0, 50.0, 44.0, 27.0, 16.0, 15.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9921875, -5.82647705078125, -5.6607666015625, -5.49505615234375, -5.329345703125, -5.16363525390625, -4.9979248046875, -4.83221435546875, -4.66650390625, -4.50079345703125, -4.3350830078125, -4.16937255859375, -4.003662109375, -3.83795166015625, -3.6722412109375, -3.50653076171875, -3.3408203125, -3.17510986328125, -3.0093994140625, -2.84368896484375, -2.677978515625, -2.51226806640625, -2.3465576171875, -2.18084716796875, -2.01513671875, -1.84942626953125, -1.6837158203125, -1.51800537109375, -1.352294921875, -1.18658447265625, -1.0208740234375, -0.85516357421875, -0.689453125, -0.52374267578125, -0.3580322265625, -0.19232177734375, -0.026611328125, 0.13909912109375, 0.3048095703125, 0.47052001953125, 0.63623046875, 0.80194091796875, 0.9676513671875, 1.13336181640625, 1.299072265625, 1.46478271484375, 1.6304931640625, 1.79620361328125, 1.9619140625, 2.12762451171875, 2.2933349609375, 2.45904541015625, 2.624755859375, 2.79046630859375, 2.9561767578125, 3.12188720703125, 3.28759765625, 3.45330810546875, 3.6190185546875, 3.78472900390625, 3.950439453125, 4.11614990234375, 4.2818603515625, 4.44757080078125, 4.61328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 12.0, 27.0, 57.0, 111.0, 195.0, 797.0, 7020.0, 2205293.0, 1972867.0, 6739.0, 718.0, 240.0, 111.0, 49.0, 24.0, 11.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.34375, -29.451171875, -28.55859375, -27.666015625, -26.7734375, -25.880859375, -24.98828125, -24.095703125, -23.203125, -22.310546875, -21.41796875, -20.525390625, -19.6328125, -18.740234375, -17.84765625, -16.955078125, -16.0625, -15.169921875, -14.27734375, -13.384765625, -12.4921875, -11.599609375, -10.70703125, -9.814453125, -8.921875, -8.029296875, -7.13671875, -6.244140625, -5.3515625, -4.458984375, -3.56640625, -2.673828125, -1.78125, -0.888671875, 0.00390625, 0.896484375, 1.7890625, 2.681640625, 3.57421875, 4.466796875, 5.359375, 6.251953125, 7.14453125, 8.037109375, 8.9296875, 9.822265625, 10.71484375, 11.607421875, 12.5, 13.392578125, 14.28515625, 15.177734375, 16.0703125, 16.962890625, 17.85546875, 18.748046875, 19.640625, 20.533203125, 21.42578125, 22.318359375, 23.2109375, 24.103515625, 24.99609375, 25.888671875, 26.78125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 10.0, 21.0, 29.0, 33.0, 61.0, 119.0, 322.0, 749.0, 1293.0, 813.0, 328.0, 127.0, 69.0, 31.0, 20.0, 15.0, 11.0, 9.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.578125, -7.209716796875, -6.84130859375, -6.472900390625, -6.1044921875, -5.736083984375, -5.36767578125, -4.999267578125, -4.630859375, -4.262451171875, -3.89404296875, -3.525634765625, -3.1572265625, -2.788818359375, -2.42041015625, -2.052001953125, -1.68359375, -1.315185546875, -0.94677734375, -0.578369140625, -0.2099609375, 0.158447265625, 0.52685546875, 0.895263671875, 1.263671875, 1.632080078125, 2.00048828125, 2.368896484375, 2.7373046875, 3.105712890625, 3.47412109375, 3.842529296875, 4.2109375, 4.579345703125, 4.94775390625, 5.316162109375, 5.6845703125, 6.052978515625, 6.42138671875, 6.789794921875, 7.158203125, 7.526611328125, 7.89501953125, 8.263427734375, 8.6318359375, 9.000244140625, 9.36865234375, 9.737060546875, 10.10546875, 10.473876953125, 10.84228515625, 11.210693359375, 11.5791015625, 11.947509765625, 12.31591796875, 12.684326171875, 13.052734375, 13.421142578125, 13.78955078125, 14.157958984375, 14.5263671875, 14.894775390625, 15.26318359375, 15.631591796875, 16.0]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 10.0, 12.0, 36.0, 51.0, 128.0, 162.0, 225.0, 175.0, 115.0, 47.0, 19.0, 9.0, 11.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-113.14717102050781, -110.3585205078125, -107.56987762451172, -104.7812271118164, -101.99258422851562, -99.20393371582031, -96.415283203125, -93.62663269042969, -90.8379898071289, -88.0493392944336, -85.26069641113281, -82.4720458984375, -79.68339538574219, -76.8947525024414, -74.1061019897461, -71.31745910644531, -68.52880859375, -65.74015808105469, -62.951515197753906, -60.162864685058594, -57.37421798706055, -54.5855712890625, -51.79692077636719, -49.00827407836914, -46.219627380371094, -43.43098068237305, -40.642333984375, -37.85368347167969, -35.06503677368164, -32.276390075683594, -29.487741470336914, -26.699092864990234, -23.910446166992188, -21.12179946899414, -18.33315086364746, -15.544503211975098, -12.755855560302734, -9.967207908630371, -7.178560256958008, -4.389911651611328, -1.6012649536132812, 1.187382698059082, 3.9760303497314453, 6.764678001403809, 9.553325653076172, 12.341973304748535, 15.130620956420898, 17.919269561767578, 20.707916259765625, 23.496562957763672, 26.28521156311035, 29.07386016845703, 31.862506866455078, 34.651153564453125, 37.43980407714844, 40.228450775146484, 43.01709747314453, 45.80574417114258, 48.594390869140625, 51.38304138183594, 54.171688079833984, 56.96033477783203, 59.748985290527344, 62.53763198852539, 65.32627868652344]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 8.0, 10.0, 7.0, 11.0, 14.0, 19.0, 16.0, 17.0, 26.0, 31.0, 34.0, 41.0, 48.0, 35.0, 46.0, 52.0, 44.0, 43.0, 44.0, 36.0, 40.0, 32.0, 38.0, 32.0, 56.0, 41.0, 27.0, 31.0, 23.0, 22.0, 22.0, 12.0, 13.0, 10.0, 7.0, 2.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.988800048828125, -30.03738021850586, -29.08595848083496, -28.134538650512695, -27.18311882019043, -26.23169708251953, -25.280277252197266, -24.328857421875, -23.377437591552734, -22.42601776123047, -21.47459602355957, -20.523176193237305, -19.57175636291504, -18.62033462524414, -17.668914794921875, -16.71749496459961, -15.766074180603027, -14.814653396606445, -13.86323356628418, -12.911812782287598, -11.960392951965332, -11.00897216796875, -10.057552337646484, -9.106131553649902, -8.15471076965332, -7.2032904624938965, -6.251870155334473, -5.300449371337891, -4.349029541015625, -3.397608757019043, -2.446188449859619, -1.4947681427001953, -0.5433483123779297, 0.4080720543861389, 1.3594924211502075, 2.310912847518921, 3.2623331546783447, 4.213753700256348, 5.1651740074157715, 6.116594314575195, 7.068014621734619, 8.019434928894043, 8.970855712890625, 9.92227554321289, 10.873696327209473, 11.825117111206055, 12.77653694152832, 13.727956771850586, 14.679377555847168, 15.63079833984375, 16.582218170166016, 17.53363800048828, 18.48505973815918, 19.436479568481445, 20.38789939880371, 21.33932113647461, 22.290740966796875, 23.24216079711914, 24.19358253479004, 25.145002365112305, 26.09642219543457, 27.04784393310547, 27.999263763427734, 28.95068359375, 29.902103424072266]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 5.0, 13.0, 5.0, 11.0, 20.0, 9.0, 18.0, 25.0, 59.0, 92.0, 125.0, 223.0, 422.0, 795.0, 1832.0, 4904.0, 15918.0, 62281.0, 275733.0, 497015.0, 140785.0, 33194.0, 9235.0, 3101.0, 1249.0, 621.0, 335.0, 164.0, 105.0, 78.0, 58.0, 30.0, 29.0, 17.0, 9.0, 11.0, 0.0, 9.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.359375, -9.078125, -8.796875, -8.515625, -8.234375, -7.953125, -7.671875, -7.390625, -7.109375, -6.828125, -6.546875, -6.265625, -5.984375, -5.703125, -5.421875, -5.140625, -4.859375, -4.578125, -4.296875, -4.015625, -3.734375, -3.453125, -3.171875, -2.890625, -2.609375, -2.328125, -2.046875, -1.765625, -1.484375, -1.203125, -0.921875, -0.640625, -0.359375, -0.078125, 0.203125, 0.484375, 0.765625, 1.046875, 1.328125, 1.609375, 1.890625, 2.171875, 2.453125, 2.734375, 3.015625, 3.296875, 3.578125, 3.859375, 4.140625, 4.421875, 4.703125, 4.984375, 5.265625, 5.546875, 5.828125, 6.109375, 6.390625, 6.671875, 6.953125, 7.234375, 7.515625, 7.796875, 8.078125, 8.359375, 8.640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 1.0, 8.0, 7.0, 15.0, 17.0, 15.0, 25.0, 37.0, 41.0, 52.0, 59.0, 65.0, 59.0, 80.0, 86.0, 59.0, 75.0, 70.0, 50.0, 48.0, 34.0, 29.0, 23.0, 17.0, 12.0, 12.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.87921142578125, -5.7115478515625, -5.54388427734375, -5.376220703125, -5.20855712890625, -5.0408935546875, -4.87322998046875, -4.70556640625, -4.53790283203125, -4.3702392578125, -4.20257568359375, -4.034912109375, -3.86724853515625, -3.6995849609375, -3.53192138671875, -3.3642578125, -3.19659423828125, -3.0289306640625, -2.86126708984375, -2.693603515625, -2.52593994140625, -2.3582763671875, -2.19061279296875, -2.02294921875, -1.85528564453125, -1.6876220703125, -1.51995849609375, -1.352294921875, -1.18463134765625, -1.0169677734375, -0.84930419921875, -0.681640625, -0.51397705078125, -0.3463134765625, -0.17864990234375, -0.010986328125, 0.15667724609375, 0.3243408203125, 0.49200439453125, 0.65966796875, 0.82733154296875, 0.9949951171875, 1.16265869140625, 1.330322265625, 1.49798583984375, 1.6656494140625, 1.83331298828125, 2.0009765625, 2.16864013671875, 2.3363037109375, 2.50396728515625, 2.671630859375, 2.83929443359375, 3.0069580078125, 3.17462158203125, 3.34228515625, 3.50994873046875, 3.6776123046875, 3.84527587890625, 4.012939453125, 4.18060302734375, 4.3482666015625, 4.51593017578125, 4.68359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 5.0, 5.0, 6.0, 8.0, 7.0, 20.0, 24.0, 35.0, 46.0, 77.0, 119.0, 209.0, 310.0, 578.0, 1294.0, 4123.0, 20125.0, 179005.0, 761569.0, 66577.0, 9808.0, 2503.0, 967.0, 429.0, 239.0, 167.0, 102.0, 59.0, 45.0, 31.0, 18.0, 7.0, 13.0, 8.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.109375, -12.661865234375, -12.21435546875, -11.766845703125, -11.3193359375, -10.871826171875, -10.42431640625, -9.976806640625, -9.529296875, -9.081787109375, -8.63427734375, -8.186767578125, -7.7392578125, -7.291748046875, -6.84423828125, -6.396728515625, -5.94921875, -5.501708984375, -5.05419921875, -4.606689453125, -4.1591796875, -3.711669921875, -3.26416015625, -2.816650390625, -2.369140625, -1.921630859375, -1.47412109375, -1.026611328125, -0.5791015625, -0.131591796875, 0.31591796875, 0.763427734375, 1.2109375, 1.658447265625, 2.10595703125, 2.553466796875, 3.0009765625, 3.448486328125, 3.89599609375, 4.343505859375, 4.791015625, 5.238525390625, 5.68603515625, 6.133544921875, 6.5810546875, 7.028564453125, 7.47607421875, 7.923583984375, 8.37109375, 8.818603515625, 9.26611328125, 9.713623046875, 10.1611328125, 10.608642578125, 11.05615234375, 11.503662109375, 11.951171875, 12.398681640625, 12.84619140625, 13.293701171875, 13.7412109375, 14.188720703125, 14.63623046875, 15.083740234375, 15.53125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 2.0, 9.0, 10.0, 10.0, 12.0, 17.0, 16.0, 18.0, 14.0, 27.0, 32.0, 41.0, 38.0, 44.0, 48.0, 44.0, 46.0, 44.0, 54.0, 47.0, 54.0, 50.0, 24.0, 31.0, 29.0, 45.0, 30.0, 20.0, 22.0, 13.0, 20.0, 17.0, 15.0, 5.0, 3.0, 9.0, 7.0, 6.0, 5.0, 6.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-12.984375, -12.61376953125, -12.2431640625, -11.87255859375, -11.501953125, -11.13134765625, -10.7607421875, -10.39013671875, -10.01953125, -9.64892578125, -9.2783203125, -8.90771484375, -8.537109375, -8.16650390625, -7.7958984375, -7.42529296875, -7.0546875, -6.68408203125, -6.3134765625, -5.94287109375, -5.572265625, -5.20166015625, -4.8310546875, -4.46044921875, -4.08984375, -3.71923828125, -3.3486328125, -2.97802734375, -2.607421875, -2.23681640625, -1.8662109375, -1.49560546875, -1.125, -0.75439453125, -0.3837890625, -0.01318359375, 0.357421875, 0.72802734375, 1.0986328125, 1.46923828125, 1.83984375, 2.21044921875, 2.5810546875, 2.95166015625, 3.322265625, 3.69287109375, 4.0634765625, 4.43408203125, 4.8046875, 5.17529296875, 5.5458984375, 5.91650390625, 6.287109375, 6.65771484375, 7.0283203125, 7.39892578125, 7.76953125, 8.14013671875, 8.5107421875, 8.88134765625, 9.251953125, 9.62255859375, 9.9931640625, 10.36376953125, 10.734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 14.0, 10.0, 9.0, 19.0, 22.0, 40.0, 49.0, 92.0, 161.0, 324.0, 677.0, 1517.0, 4059.0, 12363.0, 56700.0, 769972.0, 166891.0, 24469.0, 6725.0, 2347.0, 987.0, 467.0, 244.0, 137.0, 91.0, 43.0, 32.0, 21.0, 17.0, 7.0, 10.0, 8.0, 4.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-4.8359375, -4.692626953125, -4.54931640625, -4.406005859375, -4.2626953125, -4.119384765625, -3.97607421875, -3.832763671875, -3.689453125, -3.546142578125, -3.40283203125, -3.259521484375, -3.1162109375, -2.972900390625, -2.82958984375, -2.686279296875, -2.54296875, -2.399658203125, -2.25634765625, -2.113037109375, -1.9697265625, -1.826416015625, -1.68310546875, -1.539794921875, -1.396484375, -1.253173828125, -1.10986328125, -0.966552734375, -0.8232421875, -0.679931640625, -0.53662109375, -0.393310546875, -0.25, -0.106689453125, 0.03662109375, 0.179931640625, 0.3232421875, 0.466552734375, 0.60986328125, 0.753173828125, 0.896484375, 1.039794921875, 1.18310546875, 1.326416015625, 1.4697265625, 1.613037109375, 1.75634765625, 1.899658203125, 2.04296875, 2.186279296875, 2.32958984375, 2.472900390625, 2.6162109375, 2.759521484375, 2.90283203125, 3.046142578125, 3.189453125, 3.332763671875, 3.47607421875, 3.619384765625, 3.7626953125, 3.906005859375, 4.04931640625, 4.192626953125, 4.3359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 7.0, 4.0, 1.0, 14.0, 12.0, 17.0, 17.0, 27.0, 40.0, 54.0, 58.0, 114.0, 147.0, 126.0, 97.0, 68.0, 47.0, 42.0, 23.0, 14.0, 14.0, 10.0, 7.0, 4.0, 6.0, 5.0, 5.0, 6.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007371902465820312, -0.0007107481360435486, -0.0006843060255050659, -0.0006578639149665833, -0.0006314218044281006, -0.0006049796938896179, -0.0005785375833511353, -0.0005520954728126526, -0.0005256533622741699, -0.0004992112517356873, -0.0004727691411972046, -0.0004463270306587219, -0.00041988492012023926, -0.0003934428095817566, -0.0003670006990432739, -0.00034055858850479126, -0.0003141164779663086, -0.00028767436742782593, -0.00026123225688934326, -0.0002347901463508606, -0.00020834803581237793, -0.00018190592527389526, -0.0001554638147354126, -0.00012902170419692993, -0.00010257959365844727, -7.61374831199646e-05, -4.9695372581481934e-05, -2.3253262042999268e-05, 3.1888484954833984e-06, 2.9630959033966064e-05, 5.607306957244873e-05, 8.25151801109314e-05, 0.00010895729064941406, 0.00013539940118789673, 0.0001618415117263794, 0.00018828362226486206, 0.00021472573280334473, 0.0002411678433418274, 0.00026760995388031006, 0.0002940520644187927, 0.0003204941749572754, 0.00034693628549575806, 0.0003733783960342407, 0.0003998205065727234, 0.00042626261711120605, 0.0004527047276496887, 0.0004791468381881714, 0.000505588948726654, 0.0005320310592651367, 0.0005584731698036194, 0.000584915280342102, 0.0006113573908805847, 0.0006377995014190674, 0.00066424161195755, 0.0006906837224960327, 0.0007171258330345154, 0.000743567943572998, 0.0007700100541114807, 0.0007964521646499634, 0.000822894275188446, 0.0008493363857269287, 0.0008757784962654114, 0.000902220606803894, 0.0009286627173423767, 0.0009551048278808594]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 3.0, 8.0, 10.0, 9.0, 17.0, 17.0, 28.0, 47.0, 58.0, 97.0, 116.0, 218.0, 395.0, 657.0, 1206.0, 2418.0, 5525.0, 15258.0, 59284.0, 662581.0, 242959.0, 37893.0, 11044.0, 4306.0, 2024.0, 987.0, 528.0, 307.0, 183.0, 132.0, 73.0, 53.0, 35.0, 26.0, 14.0, 13.0, 11.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.779296875, -2.657684326171875, -2.53607177734375, -2.414459228515625, -2.2928466796875, -2.171234130859375, -2.04962158203125, -1.928009033203125, -1.806396484375, -1.684783935546875, -1.56317138671875, -1.441558837890625, -1.3199462890625, -1.198333740234375, -1.07672119140625, -0.955108642578125, -0.83349609375, -0.711883544921875, -0.59027099609375, -0.468658447265625, -0.3470458984375, -0.225433349609375, -0.10382080078125, 0.017791748046875, 0.139404296875, 0.261016845703125, 0.38262939453125, 0.504241943359375, 0.6258544921875, 0.747467041015625, 0.86907958984375, 0.990692138671875, 1.1123046875, 1.233917236328125, 1.35552978515625, 1.477142333984375, 1.5987548828125, 1.720367431640625, 1.84197998046875, 1.963592529296875, 2.085205078125, 2.206817626953125, 2.32843017578125, 2.450042724609375, 2.5716552734375, 2.693267822265625, 2.81488037109375, 2.936492919921875, 3.05810546875, 3.179718017578125, 3.30133056640625, 3.422943115234375, 3.5445556640625, 3.666168212890625, 3.78778076171875, 3.909393310546875, 4.031005859375, 4.152618408203125, 4.27423095703125, 4.395843505859375, 4.5174560546875, 4.639068603515625, 4.76068115234375, 4.882293701171875, 5.00390625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 10.0, 11.0, 11.0, 12.0, 14.0, 28.0, 26.0, 52.0, 71.0, 120.0, 168.0, 144.0, 102.0, 61.0, 38.0, 41.0, 14.0, 18.0, 13.0, 8.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.01953125, -3.889404296875, -3.75927734375, -3.629150390625, -3.4990234375, -3.368896484375, -3.23876953125, -3.108642578125, -2.978515625, -2.848388671875, -2.71826171875, -2.588134765625, -2.4580078125, -2.327880859375, -2.19775390625, -2.067626953125, -1.9375, -1.807373046875, -1.67724609375, -1.547119140625, -1.4169921875, -1.286865234375, -1.15673828125, -1.026611328125, -0.896484375, -0.766357421875, -0.63623046875, -0.506103515625, -0.3759765625, -0.245849609375, -0.11572265625, 0.014404296875, 0.14453125, 0.274658203125, 0.40478515625, 0.534912109375, 0.6650390625, 0.795166015625, 0.92529296875, 1.055419921875, 1.185546875, 1.315673828125, 1.44580078125, 1.575927734375, 1.7060546875, 1.836181640625, 1.96630859375, 2.096435546875, 2.2265625, 2.356689453125, 2.48681640625, 2.616943359375, 2.7470703125, 2.877197265625, 3.00732421875, 3.137451171875, 3.267578125, 3.397705078125, 3.52783203125, 3.657958984375, 3.7880859375, 3.918212890625, 4.04833984375, 4.178466796875, 4.30859375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 20.0, 84.0, 245.0, 474.0, 114.0, 26.0, 13.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.65943908691406, -107.09862518310547, -101.5378189086914, -95.97700500488281, -90.41619873046875, -84.85538482666016, -79.29457092285156, -73.7337646484375, -68.1729507446289, -62.61214065551758, -57.05133056640625, -51.490516662597656, -45.92970657348633, -40.368896484375, -34.808082580566406, -29.247272491455078, -23.68646240234375, -18.125652313232422, -12.564840316772461, -7.0040283203125, -1.4432182312011719, 4.117591857910156, 9.67840576171875, 15.239215850830078, 20.800025939941406, 26.360836029052734, 31.921648025512695, 37.482460021972656, 43.043270111083984, 48.60408020019531, 54.164894104003906, 59.725704193115234, 65.2864990234375, 70.8473129272461, 76.40811920166016, 81.96893310546875, 87.52973937988281, 93.0905532836914, 98.6513671875, 104.21217346191406, 109.77298736572266, 115.33380126953125, 120.89460754394531, 126.4554214477539, 132.0162353515625, 137.57704162597656, 143.13784790039062, 148.69866943359375, 154.2594757080078, 159.82028198242188, 165.381103515625, 170.94190979003906, 176.50271606445312, 182.06353759765625, 187.6243438720703, 193.18515014648438, 198.7459716796875, 204.30677795410156, 209.8675994873047, 215.42840576171875, 220.9892120361328, 226.55001831054688, 232.11083984375, 237.67164611816406, 243.23245239257812]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 7.0, 4.0, 3.0, 9.0, 8.0, 16.0, 14.0, 9.0, 7.0, 14.0, 19.0, 34.0, 34.0, 32.0, 48.0, 56.0, 66.0, 107.0, 112.0, 87.0, 47.0, 33.0, 38.0, 35.0, 23.0, 24.0, 18.0, 22.0, 18.0, 11.0, 11.0, 5.0, 6.0, 9.0, 8.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.681907653808594, -40.984588623046875, -39.287269592285156, -37.5899543762207, -35.892635345458984, -34.195316314697266, -32.49799728393555, -30.80068016052246, -29.103363037109375, -27.406044006347656, -25.70872688293457, -24.01140785217285, -22.314090728759766, -20.616771697998047, -18.919452667236328, -17.222135543823242, -15.524816513061523, -13.827498435974121, -12.130180358886719, -10.432861328125, -8.735544204711914, -7.038225173950195, -5.340907096862793, -3.6435890197753906, -1.9462709426879883, -0.2489527463912964, 1.4483654499053955, 3.145683765411377, 4.843001842498779, 6.54032039642334, 8.237638473510742, 9.934956550598145, 11.632274627685547, 13.32959270477295, 15.026910781860352, 16.72422981262207, 18.421546936035156, 20.118865966796875, 21.816184997558594, 23.51350212097168, 25.210819244384766, 26.908138275146484, 28.60545539855957, 30.30277442932129, 32.000091552734375, 33.697410583496094, 35.39472961425781, 37.09204864501953, 38.78936767578125, 40.48668670654297, 42.18400573730469, 43.88132095336914, 45.57863998413086, 47.27595901489258, 48.9732780456543, 50.67059326171875, 52.36791229248047, 54.06523132324219, 55.762550354003906, 57.45986557006836, 59.15718460083008, 60.8545036315918, 62.551822662353516, 64.24913787841797, 65.94645690917969]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 13.0, 10.0, 19.0, 36.0, 66.0, 100.0, 159.0, 330.0, 609.0, 1390.0, 3275.0, 9501.0, 41609.0, 951651.0, 3046369.0, 115393.0, 15654.0, 4597.0, 1726.0, 775.0, 365.0, 209.0, 131.0, 63.0, 56.0, 48.0, 23.0, 21.0, 14.0, 12.0, 11.0, 5.0, 4.0, 3.0, 6.0, 3.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.6484375, -8.341796875, -8.03515625, -7.728515625, -7.421875, -7.115234375, -6.80859375, -6.501953125, -6.1953125, -5.888671875, -5.58203125, -5.275390625, -4.96875, -4.662109375, -4.35546875, -4.048828125, -3.7421875, -3.435546875, -3.12890625, -2.822265625, -2.515625, -2.208984375, -1.90234375, -1.595703125, -1.2890625, -0.982421875, -0.67578125, -0.369140625, -0.0625, 0.244140625, 0.55078125, 0.857421875, 1.1640625, 1.470703125, 1.77734375, 2.083984375, 2.390625, 2.697265625, 3.00390625, 3.310546875, 3.6171875, 3.923828125, 4.23046875, 4.537109375, 4.84375, 5.150390625, 5.45703125, 5.763671875, 6.0703125, 6.376953125, 6.68359375, 6.990234375, 7.296875, 7.603515625, 7.91015625, 8.216796875, 8.5234375, 8.830078125, 9.13671875, 9.443359375, 9.75, 10.056640625, 10.36328125, 10.669921875, 10.9765625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 2.0, 6.0, 13.0, 11.0, 11.0, 14.0, 20.0, 28.0, 27.0, 33.0, 41.0, 49.0, 50.0, 54.0, 64.0, 57.0, 68.0, 70.0, 65.0, 64.0, 38.0, 58.0, 31.0, 26.0, 29.0, 14.0, 16.0, 15.0, 8.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.583404541015625, -4.44805908203125, -4.312713623046875, -4.1773681640625, -4.042022705078125, -3.90667724609375, -3.771331787109375, -3.635986328125, -3.500640869140625, -3.36529541015625, -3.229949951171875, -3.0946044921875, -2.959259033203125, -2.82391357421875, -2.688568115234375, -2.55322265625, -2.417877197265625, -2.28253173828125, -2.147186279296875, -2.0118408203125, -1.876495361328125, -1.74114990234375, -1.605804443359375, -1.470458984375, -1.335113525390625, -1.19976806640625, -1.064422607421875, -0.9290771484375, -0.793731689453125, -0.65838623046875, -0.523040771484375, -0.3876953125, -0.252349853515625, -0.11700439453125, 0.018341064453125, 0.1536865234375, 0.289031982421875, 0.42437744140625, 0.559722900390625, 0.695068359375, 0.830413818359375, 0.96575927734375, 1.101104736328125, 1.2364501953125, 1.371795654296875, 1.50714111328125, 1.642486572265625, 1.77783203125, 1.913177490234375, 2.04852294921875, 2.183868408203125, 2.3192138671875, 2.454559326171875, 2.58990478515625, 2.725250244140625, 2.860595703125, 2.995941162109375, 3.13128662109375, 3.266632080078125, 3.4019775390625, 3.537322998046875, 3.67266845703125, 3.808013916015625, 3.943359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 8.0, 6.0, 4.0, 7.0, 8.0, 7.0, 17.0, 17.0, 27.0, 20.0, 62.0, 96.0, 164.0, 403.0, 1145.0, 4246.0, 24411.0, 823291.0, 3286214.0, 45197.0, 6437.0, 1551.0, 476.0, 179.0, 98.0, 56.0, 34.0, 28.0, 20.0, 15.0, 10.0, 14.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.921875, -14.45751953125, -13.9931640625, -13.52880859375, -13.064453125, -12.60009765625, -12.1357421875, -11.67138671875, -11.20703125, -10.74267578125, -10.2783203125, -9.81396484375, -9.349609375, -8.88525390625, -8.4208984375, -7.95654296875, -7.4921875, -7.02783203125, -6.5634765625, -6.09912109375, -5.634765625, -5.17041015625, -4.7060546875, -4.24169921875, -3.77734375, -3.31298828125, -2.8486328125, -2.38427734375, -1.919921875, -1.45556640625, -0.9912109375, -0.52685546875, -0.0625, 0.40185546875, 0.8662109375, 1.33056640625, 1.794921875, 2.25927734375, 2.7236328125, 3.18798828125, 3.65234375, 4.11669921875, 4.5810546875, 5.04541015625, 5.509765625, 5.97412109375, 6.4384765625, 6.90283203125, 7.3671875, 7.83154296875, 8.2958984375, 8.76025390625, 9.224609375, 9.68896484375, 10.1533203125, 10.61767578125, 11.08203125, 11.54638671875, 12.0107421875, 12.47509765625, 12.939453125, 13.40380859375, 13.8681640625, 14.33251953125, 14.796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 10.0, 6.0, 13.0, 13.0, 22.0, 23.0, 31.0, 51.0, 94.0, 137.0, 293.0, 449.0, 732.0, 847.0, 563.0, 304.0, 170.0, 85.0, 70.0, 50.0, 29.0, 17.0, 10.0, 12.0, 10.0, 6.0, 5.0, 1.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.4921875, -9.2056884765625, -8.919189453125, -8.6326904296875, -8.34619140625, -8.0596923828125, -7.773193359375, -7.4866943359375, -7.2001953125, -6.9136962890625, -6.627197265625, -6.3406982421875, -6.05419921875, -5.7677001953125, -5.481201171875, -5.1947021484375, -4.908203125, -4.6217041015625, -4.335205078125, -4.0487060546875, -3.76220703125, -3.4757080078125, -3.189208984375, -2.9027099609375, -2.6162109375, -2.3297119140625, -2.043212890625, -1.7567138671875, -1.47021484375, -1.1837158203125, -0.897216796875, -0.6107177734375, -0.32421875, -0.0377197265625, 0.248779296875, 0.5352783203125, 0.82177734375, 1.1082763671875, 1.394775390625, 1.6812744140625, 1.9677734375, 2.2542724609375, 2.540771484375, 2.8272705078125, 3.11376953125, 3.4002685546875, 3.686767578125, 3.9732666015625, 4.259765625, 4.5462646484375, 4.832763671875, 5.1192626953125, 5.40576171875, 5.6922607421875, 5.978759765625, 6.2652587890625, 6.5517578125, 6.8382568359375, 7.124755859375, 7.4112548828125, 7.69775390625, 7.9842529296875, 8.270751953125, 8.5572509765625, 8.84375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 8.0, 7.0, 9.0, 18.0, 28.0, 69.0, 108.0, 130.0, 180.0, 167.0, 137.0, 69.0, 32.0, 21.0, 5.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-99.88106536865234, -97.49269104003906, -95.10430908203125, -92.71592712402344, -90.32755279541016, -87.93917846679688, -85.55079650878906, -83.16241455078125, -80.77404022216797, -78.38566589355469, -75.99728393554688, -73.60890197753906, -71.22052764892578, -68.8321533203125, -66.44377136230469, -64.05538940429688, -61.667015075683594, -59.27863693237305, -56.8902587890625, -54.50188064575195, -52.113502502441406, -49.72512435913086, -47.33674621582031, -44.948368072509766, -42.55998992919922, -40.17161178588867, -37.783233642578125, -35.39485549926758, -33.00647735595703, -30.618099212646484, -28.229721069335938, -25.84134292602539, -23.452972412109375, -21.064594268798828, -18.67621612548828, -16.287837982177734, -13.899459838867188, -11.51108169555664, -9.122703552246094, -6.734325408935547, -4.345947265625, -1.9575691223144531, 0.43080902099609375, 2.8191871643066406, 5.2075653076171875, 7.595943450927734, 9.984321594238281, 12.372699737548828, 14.761077880859375, 17.149456024169922, 19.53783416748047, 21.926212310791016, 24.314590454101562, 26.70296859741211, 29.091346740722656, 31.479724884033203, 33.86810302734375, 36.2564811706543, 38.644859313964844, 41.03323745727539, 43.42161560058594, 45.809993743896484, 48.19837188720703, 50.58675003051758, 52.975128173828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 9.0, 6.0, 6.0, 4.0, 11.0, 13.0, 10.0, 18.0, 21.0, 21.0, 21.0, 22.0, 29.0, 30.0, 46.0, 46.0, 42.0, 48.0, 59.0, 60.0, 57.0, 51.0, 44.0, 48.0, 35.0, 38.0, 45.0, 33.0, 20.0, 20.0, 12.0, 14.0, 12.0, 8.0, 12.0, 8.0, 4.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.42815399169922, -31.290611267089844, -30.1530704498291, -29.01552963256836, -27.877986907958984, -26.74044418334961, -25.602903366088867, -24.465362548828125, -23.32781982421875, -22.190277099609375, -21.052736282348633, -19.91519546508789, -18.777652740478516, -17.64011001586914, -16.5025691986084, -15.36502742767334, -14.227485656738281, -13.089943885803223, -11.952402114868164, -10.814860343933105, -9.677318572998047, -8.539776802062988, -7.40223503112793, -6.264693260192871, -5.1271514892578125, -3.989609718322754, -2.8520679473876953, -1.7145261764526367, -0.5769844055175781, 0.5605573654174805, 1.698099136352539, 2.8356409072875977, 3.9731788635253906, 5.110720634460449, 6.248262405395508, 7.385804176330566, 8.523345947265625, 9.660887718200684, 10.798429489135742, 11.9359712600708, 13.07351303100586, 14.211054801940918, 15.348596572875977, 16.48613739013672, 17.623680114746094, 18.76122283935547, 19.89876365661621, 21.036304473876953, 22.173847198486328, 23.311389923095703, 24.448930740356445, 25.586471557617188, 26.724014282226562, 27.861557006835938, 28.99909782409668, 30.136638641357422, 31.274181365966797, 32.41172409057617, 33.54926300048828, 34.686805725097656, 35.82434844970703, 36.961891174316406, 38.09943389892578, 39.23697280883789, 40.374515533447266]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 9.0, 12.0, 18.0, 33.0, 53.0, 85.0, 120.0, 208.0, 407.0, 846.0, 1670.0, 4189.0, 11495.0, 35518.0, 132499.0, 462850.0, 291641.0, 73402.0, 20977.0, 7230.0, 2787.0, 1190.0, 576.0, 317.0, 148.0, 93.0, 58.0, 32.0, 15.0, 16.0, 7.0, 4.0, 5.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.96875, -6.7178955078125, -6.467041015625, -6.2161865234375, -5.96533203125, -5.7144775390625, -5.463623046875, -5.2127685546875, -4.9619140625, -4.7110595703125, -4.460205078125, -4.2093505859375, -3.95849609375, -3.7076416015625, -3.456787109375, -3.2059326171875, -2.955078125, -2.7042236328125, -2.453369140625, -2.2025146484375, -1.95166015625, -1.7008056640625, -1.449951171875, -1.1990966796875, -0.9482421875, -0.6973876953125, -0.446533203125, -0.1956787109375, 0.05517578125, 0.3060302734375, 0.556884765625, 0.8077392578125, 1.05859375, 1.3094482421875, 1.560302734375, 1.8111572265625, 2.06201171875, 2.3128662109375, 2.563720703125, 2.8145751953125, 3.0654296875, 3.3162841796875, 3.567138671875, 3.8179931640625, 4.06884765625, 4.3197021484375, 4.570556640625, 4.8214111328125, 5.072265625, 5.3231201171875, 5.573974609375, 5.8248291015625, 6.07568359375, 6.3265380859375, 6.577392578125, 6.8282470703125, 7.0791015625, 7.3299560546875, 7.580810546875, 7.8316650390625, 8.08251953125, 8.3333740234375, 8.584228515625, 8.8350830078125, 9.0859375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 6.0, 4.0, 9.0, 10.0, 5.0, 14.0, 28.0, 23.0, 26.0, 36.0, 31.0, 39.0, 57.0, 57.0, 48.0, 51.0, 61.0, 65.0, 56.0, 54.0, 59.0, 48.0, 52.0, 32.0, 27.0, 24.0, 21.0, 24.0, 6.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7109375, -4.5745849609375, -4.438232421875, -4.3018798828125, -4.16552734375, -4.0291748046875, -3.892822265625, -3.7564697265625, -3.6201171875, -3.4837646484375, -3.347412109375, -3.2110595703125, -3.07470703125, -2.9383544921875, -2.802001953125, -2.6656494140625, -2.529296875, -2.3929443359375, -2.256591796875, -2.1202392578125, -1.98388671875, -1.8475341796875, -1.711181640625, -1.5748291015625, -1.4384765625, -1.3021240234375, -1.165771484375, -1.0294189453125, -0.89306640625, -0.7567138671875, -0.620361328125, -0.4840087890625, -0.34765625, -0.2113037109375, -0.074951171875, 0.0614013671875, 0.19775390625, 0.3341064453125, 0.470458984375, 0.6068115234375, 0.7431640625, 0.8795166015625, 1.015869140625, 1.1522216796875, 1.28857421875, 1.4249267578125, 1.561279296875, 1.6976318359375, 1.833984375, 1.9703369140625, 2.106689453125, 2.2430419921875, 2.37939453125, 2.5157470703125, 2.652099609375, 2.7884521484375, 2.9248046875, 3.0611572265625, 3.197509765625, 3.3338623046875, 3.47021484375, 3.6065673828125, 3.742919921875, 3.8792724609375, 4.015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 16.0, 12.0, 35.0, 53.0, 62.0, 94.0, 165.0, 262.0, 451.0, 944.0, 2282.0, 9783.0, 154041.0, 846007.0, 27732.0, 3825.0, 1287.0, 594.0, 343.0, 196.0, 130.0, 84.0, 46.0, 33.0, 24.0, 12.0, 11.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1796875, -14.6009521484375, -14.022216796875, -13.4434814453125, -12.86474609375, -12.2860107421875, -11.707275390625, -11.1285400390625, -10.5498046875, -9.9710693359375, -9.392333984375, -8.8135986328125, -8.23486328125, -7.6561279296875, -7.077392578125, -6.4986572265625, -5.919921875, -5.3411865234375, -4.762451171875, -4.1837158203125, -3.60498046875, -3.0262451171875, -2.447509765625, -1.8687744140625, -1.2900390625, -0.7113037109375, -0.132568359375, 0.4461669921875, 1.02490234375, 1.6036376953125, 2.182373046875, 2.7611083984375, 3.33984375, 3.9185791015625, 4.497314453125, 5.0760498046875, 5.65478515625, 6.2335205078125, 6.812255859375, 7.3909912109375, 7.9697265625, 8.5484619140625, 9.127197265625, 9.7059326171875, 10.28466796875, 10.8634033203125, 11.442138671875, 12.0208740234375, 12.599609375, 13.1783447265625, 13.757080078125, 14.3358154296875, 14.91455078125, 15.4932861328125, 16.072021484375, 16.6507568359375, 17.2294921875, 17.8082275390625, 18.386962890625, 18.9656982421875, 19.54443359375, 20.1231689453125, 20.701904296875, 21.2806396484375, 21.859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 8.0, 9.0, 25.0, 18.0, 27.0, 44.0, 46.0, 47.0, 62.0, 62.0, 71.0, 76.0, 80.0, 60.0, 71.0, 60.0, 37.0, 38.0, 35.0, 30.0, 14.0, 16.0, 16.0, 5.0, 12.0, 10.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.758056640625, -21.18798828125, -20.617919921875, -20.0478515625, -19.477783203125, -18.90771484375, -18.337646484375, -17.767578125, -17.197509765625, -16.62744140625, -16.057373046875, -15.4873046875, -14.917236328125, -14.34716796875, -13.777099609375, -13.20703125, -12.636962890625, -12.06689453125, -11.496826171875, -10.9267578125, -10.356689453125, -9.78662109375, -9.216552734375, -8.646484375, -8.076416015625, -7.50634765625, -6.936279296875, -6.3662109375, -5.796142578125, -5.22607421875, -4.656005859375, -4.0859375, -3.515869140625, -2.94580078125, -2.375732421875, -1.8056640625, -1.235595703125, -0.66552734375, -0.095458984375, 0.474609375, 1.044677734375, 1.61474609375, 2.184814453125, 2.7548828125, 3.324951171875, 3.89501953125, 4.465087890625, 5.03515625, 5.605224609375, 6.17529296875, 6.745361328125, 7.3154296875, 7.885498046875, 8.45556640625, 9.025634765625, 9.595703125, 10.165771484375, 10.73583984375, 11.305908203125, 11.8759765625, 12.446044921875, 13.01611328125, 13.586181640625, 14.15625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 8.0, 5.0, 7.0, 7.0, 12.0, 6.0, 12.0, 19.0, 15.0, 17.0, 31.0, 26.0, 41.0, 49.0, 54.0, 104.0, 146.0, 217.0, 447.0, 1054.0, 2954.0, 14086.0, 841545.0, 174718.0, 8781.0, 2268.0, 846.0, 365.0, 191.0, 126.0, 103.0, 59.0, 48.0, 43.0, 26.0, 22.0, 18.0, 15.0, 15.0, 13.0, 10.0, 3.0, 9.0, 3.0, 2.0, 5.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-7.06640625, -6.8577880859375, -6.649169921875, -6.4405517578125, -6.23193359375, -6.0233154296875, -5.814697265625, -5.6060791015625, -5.3974609375, -5.1888427734375, -4.980224609375, -4.7716064453125, -4.56298828125, -4.3543701171875, -4.145751953125, -3.9371337890625, -3.728515625, -3.5198974609375, -3.311279296875, -3.1026611328125, -2.89404296875, -2.6854248046875, -2.476806640625, -2.2681884765625, -2.0595703125, -1.8509521484375, -1.642333984375, -1.4337158203125, -1.22509765625, -1.0164794921875, -0.807861328125, -0.5992431640625, -0.390625, -0.1820068359375, 0.026611328125, 0.2352294921875, 0.44384765625, 0.6524658203125, 0.861083984375, 1.0697021484375, 1.2783203125, 1.4869384765625, 1.695556640625, 1.9041748046875, 2.11279296875, 2.3214111328125, 2.530029296875, 2.7386474609375, 2.947265625, 3.1558837890625, 3.364501953125, 3.5731201171875, 3.78173828125, 3.9903564453125, 4.198974609375, 4.4075927734375, 4.6162109375, 4.8248291015625, 5.033447265625, 5.2420654296875, 5.45068359375, 5.6593017578125, 5.867919921875, 6.0765380859375, 6.28515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 3.0, 7.0, 20.0, 23.0, 38.0, 51.0, 112.0, 212.0, 221.0, 114.0, 59.0, 31.0, 28.0, 17.0, 6.0, 6.0, 4.0, 9.0, 2.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00102996826171875, -0.0009988471865653992, -0.0009677261114120483, -0.0009366050362586975, -0.0009054839611053467, -0.0008743628859519958, -0.000843241810798645, -0.0008121207356452942, -0.0007809996604919434, -0.0007498785853385925, -0.0007187575101852417, -0.0006876364350318909, -0.00065651535987854, -0.0006253942847251892, -0.0005942732095718384, -0.0005631521344184875, -0.0005320310592651367, -0.0005009099841117859, -0.00046978890895843506, -0.00043866783380508423, -0.0004075467586517334, -0.00037642568349838257, -0.00034530460834503174, -0.0003141835331916809, -0.0002830624580383301, -0.00025194138288497925, -0.00022082030773162842, -0.0001896992325782776, -0.00015857815742492676, -0.00012745708227157593, -9.63360071182251e-05, -6.521493196487427e-05, -3.409385681152344e-05, -2.9727816581726074e-06, 2.8148293495178223e-05, 5.926936864852905e-05, 9.039044380187988e-05, 0.00012151151895523071, 0.00015263259410858154, 0.00018375366926193237, 0.0002148747444152832, 0.00024599581956863403, 0.00027711689472198486, 0.0003082379698753357, 0.0003393590450286865, 0.00037048012018203735, 0.0004016011953353882, 0.000432722270488739, 0.00046384334564208984, 0.0004949644207954407, 0.0005260854959487915, 0.0005572065711021423, 0.0005883276462554932, 0.000619448721408844, 0.0006505697965621948, 0.0006816908717155457, 0.0007128119468688965, 0.0007439330220222473, 0.0007750540971755981, 0.000806175172328949, 0.0008372962474822998, 0.0008684173226356506, 0.0008995383977890015, 0.0009306594729423523, 0.0009617805480957031]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 0.0, 5.0, 7.0, 4.0, 7.0, 3.0, 7.0, 18.0, 14.0, 14.0, 35.0, 54.0, 58.0, 84.0, 110.0, 127.0, 209.0, 388.0, 641.0, 1322.0, 2798.0, 6759.0, 28674.0, 698922.0, 275441.0, 21788.0, 5909.0, 2422.0, 1137.0, 615.0, 312.0, 203.0, 127.0, 83.0, 50.0, 47.0, 40.0, 26.0, 20.0, 18.0, 14.0, 6.0, 7.0, 4.0, 5.0, 8.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.3203125, -4.1890869140625, -4.057861328125, -3.9266357421875, -3.79541015625, -3.6641845703125, -3.532958984375, -3.4017333984375, -3.2705078125, -3.1392822265625, -3.008056640625, -2.8768310546875, -2.74560546875, -2.6143798828125, -2.483154296875, -2.3519287109375, -2.220703125, -2.0894775390625, -1.958251953125, -1.8270263671875, -1.69580078125, -1.5645751953125, -1.433349609375, -1.3021240234375, -1.1708984375, -1.0396728515625, -0.908447265625, -0.7772216796875, -0.64599609375, -0.5147705078125, -0.383544921875, -0.2523193359375, -0.12109375, 0.0101318359375, 0.141357421875, 0.2725830078125, 0.40380859375, 0.5350341796875, 0.666259765625, 0.7974853515625, 0.9287109375, 1.0599365234375, 1.191162109375, 1.3223876953125, 1.45361328125, 1.5848388671875, 1.716064453125, 1.8472900390625, 1.978515625, 2.1097412109375, 2.240966796875, 2.3721923828125, 2.50341796875, 2.6346435546875, 2.765869140625, 2.8970947265625, 3.0283203125, 3.1595458984375, 3.290771484375, 3.4219970703125, 3.55322265625, 3.6844482421875, 3.815673828125, 3.9468994140625, 4.078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 8.0, 13.0, 18.0, 47.0, 46.0, 104.0, 166.0, 209.0, 163.0, 107.0, 61.0, 22.0, 9.0, 6.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8515625, -5.6763916015625, -5.501220703125, -5.3260498046875, -5.15087890625, -4.9757080078125, -4.800537109375, -4.6253662109375, -4.4501953125, -4.2750244140625, -4.099853515625, -3.9246826171875, -3.74951171875, -3.5743408203125, -3.399169921875, -3.2239990234375, -3.048828125, -2.8736572265625, -2.698486328125, -2.5233154296875, -2.34814453125, -2.1729736328125, -1.997802734375, -1.8226318359375, -1.6474609375, -1.4722900390625, -1.297119140625, -1.1219482421875, -0.94677734375, -0.7716064453125, -0.596435546875, -0.4212646484375, -0.24609375, -0.0709228515625, 0.104248046875, 0.2794189453125, 0.45458984375, 0.6297607421875, 0.804931640625, 0.9801025390625, 1.1552734375, 1.3304443359375, 1.505615234375, 1.6807861328125, 1.85595703125, 2.0311279296875, 2.206298828125, 2.3814697265625, 2.556640625, 2.7318115234375, 2.906982421875, 3.0821533203125, 3.25732421875, 3.4324951171875, 3.607666015625, 3.7828369140625, 3.9580078125, 4.1331787109375, 4.308349609375, 4.4835205078125, 4.65869140625, 4.8338623046875, 5.009033203125, 5.1842041015625, 5.359375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 21.0, 82.0, 496.0, 295.0, 73.0, 12.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.68496704101562, -192.44651794433594, -186.20806884765625, -179.9696044921875, -173.7311553955078, -167.49270629882812, -161.25425720214844, -155.01580810546875, -148.77734375, -142.5388946533203, -136.30044555664062, -130.06198120117188, -123.82353210449219, -117.5850830078125, -111.34663391113281, -105.10818481445312, -98.86973571777344, -92.63128662109375, -86.39282989501953, -80.15438079833984, -73.91592407226562, -67.67747497558594, -61.43902587890625, -55.2005729675293, -48.962120056152344, -42.72366714477539, -36.48521423339844, -30.24676513671875, -24.008312225341797, -17.769859313964844, -11.531410217285156, -5.292957305908203, 0.9455108642578125, 7.183962821960449, 13.422414779663086, 19.660865783691406, 25.89931869506836, 32.13777160644531, 38.376220703125, 44.61467361450195, 50.853126525878906, 57.09157943725586, 63.33003234863281, 69.5684814453125, 75.80693054199219, 82.0453872680664, 88.2838363647461, 94.52229309082031, 100.7607421875, 106.99919128417969, 113.2376480102539, 119.4760971069336, 125.71455383300781, 131.9530029296875, 138.1914520263672, 144.42990112304688, 150.66836547851562, 156.9068145751953, 163.145263671875, 169.38372802734375, 175.62217712402344, 181.86062622070312, 188.0990753173828, 194.3375244140625, 200.5759735107422]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 8.0, 11.0, 6.0, 16.0, 13.0, 14.0, 18.0, 31.0, 29.0, 16.0, 30.0, 21.0, 35.0, 39.0, 65.0, 132.0, 130.0, 64.0, 42.0, 33.0, 32.0, 24.0, 27.0, 27.0, 18.0, 19.0, 13.0, 9.0, 11.0, 17.0, 7.0, 10.0, 6.0, 3.0, 7.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.74113464355469, -45.06919860839844, -43.39726257324219, -41.72532272338867, -40.05338668823242, -38.38145065307617, -36.709510803222656, -35.037574768066406, -33.365638732910156, -31.693702697753906, -30.021764755249023, -28.34982681274414, -26.67789077758789, -25.00595474243164, -23.334016799926758, -21.662078857421875, -19.990142822265625, -18.318206787109375, -16.646268844604492, -14.974331855773926, -13.30239486694336, -11.630457878112793, -9.958520889282227, -8.28658390045166, -6.614646911621094, -4.942709922790527, -3.270772933959961, -1.5988359451293945, 0.07310104370117188, 1.7450380325317383, 3.4169750213623047, 5.088912010192871, 6.760852813720703, 8.43278980255127, 10.104726791381836, 11.776663780212402, 13.448600769042969, 15.120537757873535, 16.7924747467041, 18.464412689208984, 20.136348724365234, 21.808284759521484, 23.480222702026367, 25.15216064453125, 26.8240966796875, 28.49603271484375, 30.167970657348633, 31.839908599853516, 33.511844635009766, 35.183780670166016, 36.85572052001953, 38.52765655517578, 40.19959259033203, 41.87152862548828, 43.54346466064453, 45.21540451049805, 46.8873405456543, 48.55927658081055, 50.23121643066406, 51.90315246582031, 53.57508850097656, 55.24702453613281, 56.91896057128906, 58.59090042114258, 60.26283645629883]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 14.0, 11.0, 9.0, 23.0, 32.0, 42.0, 56.0, 94.0, 152.0, 321.0, 579.0, 1182.0, 2628.0, 7029.0, 23784.0, 158460.0, 2147354.0, 1695105.0, 126133.0, 20570.0, 6034.0, 2365.0, 1025.0, 474.0, 252.0, 162.0, 102.0, 69.0, 61.0, 34.0, 21.0, 22.0, 21.0, 13.0, 8.0, 11.0, 6.0, 2.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.4276123046875, -8.136474609375, -7.8453369140625, -7.55419921875, -7.2630615234375, -6.971923828125, -6.6807861328125, -6.3896484375, -6.0985107421875, -5.807373046875, -5.5162353515625, -5.22509765625, -4.9339599609375, -4.642822265625, -4.3516845703125, -4.060546875, -3.7694091796875, -3.478271484375, -3.1871337890625, -2.89599609375, -2.6048583984375, -2.313720703125, -2.0225830078125, -1.7314453125, -1.4403076171875, -1.149169921875, -0.8580322265625, -0.56689453125, -0.2757568359375, 0.015380859375, 0.3065185546875, 0.59765625, 0.8887939453125, 1.179931640625, 1.4710693359375, 1.76220703125, 2.0533447265625, 2.344482421875, 2.6356201171875, 2.9267578125, 3.2178955078125, 3.509033203125, 3.8001708984375, 4.09130859375, 4.3824462890625, 4.673583984375, 4.9647216796875, 5.255859375, 5.5469970703125, 5.838134765625, 6.1292724609375, 6.42041015625, 6.7115478515625, 7.002685546875, 7.2938232421875, 7.5849609375, 7.8760986328125, 8.167236328125, 8.4583740234375, 8.74951171875, 9.0406494140625, 9.331787109375, 9.6229248046875, 9.9140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 10.0, 1.0, 5.0, 10.0, 14.0, 16.0, 20.0, 16.0, 22.0, 22.0, 21.0, 31.0, 53.0, 45.0, 45.0, 38.0, 43.0, 49.0, 38.0, 55.0, 51.0, 59.0, 47.0, 48.0, 40.0, 50.0, 28.0, 29.0, 19.0, 19.0, 15.0, 8.0, 8.0, 10.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5703125, -3.463165283203125, -3.35601806640625, -3.248870849609375, -3.1417236328125, -3.034576416015625, -2.92742919921875, -2.820281982421875, -2.713134765625, -2.605987548828125, -2.49884033203125, -2.391693115234375, -2.2845458984375, -2.177398681640625, -2.07025146484375, -1.963104248046875, -1.85595703125, -1.748809814453125, -1.64166259765625, -1.534515380859375, -1.4273681640625, -1.320220947265625, -1.21307373046875, -1.105926513671875, -0.998779296875, -0.891632080078125, -0.78448486328125, -0.677337646484375, -0.5701904296875, -0.463043212890625, -0.35589599609375, -0.248748779296875, -0.1416015625, -0.034454345703125, 0.07269287109375, 0.179840087890625, 0.2869873046875, 0.394134521484375, 0.50128173828125, 0.608428955078125, 0.715576171875, 0.822723388671875, 0.92987060546875, 1.037017822265625, 1.1441650390625, 1.251312255859375, 1.35845947265625, 1.465606689453125, 1.57275390625, 1.679901123046875, 1.78704833984375, 1.894195556640625, 2.0013427734375, 2.108489990234375, 2.21563720703125, 2.322784423828125, 2.429931640625, 2.537078857421875, 2.64422607421875, 2.751373291015625, 2.8585205078125, 2.965667724609375, 3.07281494140625, 3.179962158203125, 3.287109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 9.0, 11.0, 18.0, 16.0, 29.0, 52.0, 81.0, 120.0, 241.0, 402.0, 839.0, 1859.0, 5710.0, 46639.0, 3937414.0, 186944.0, 9298.0, 2384.0, 1043.0, 488.0, 266.0, 147.0, 91.0, 42.0, 38.0, 26.0, 16.0, 12.0, 10.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.5, -22.78076171875, -22.0615234375, -21.34228515625, -20.623046875, -19.90380859375, -19.1845703125, -18.46533203125, -17.74609375, -17.02685546875, -16.3076171875, -15.58837890625, -14.869140625, -14.14990234375, -13.4306640625, -12.71142578125, -11.9921875, -11.27294921875, -10.5537109375, -9.83447265625, -9.115234375, -8.39599609375, -7.6767578125, -6.95751953125, -6.23828125, -5.51904296875, -4.7998046875, -4.08056640625, -3.361328125, -2.64208984375, -1.9228515625, -1.20361328125, -0.484375, 0.23486328125, 0.9541015625, 1.67333984375, 2.392578125, 3.11181640625, 3.8310546875, 4.55029296875, 5.26953125, 5.98876953125, 6.7080078125, 7.42724609375, 8.146484375, 8.86572265625, 9.5849609375, 10.30419921875, 11.0234375, 11.74267578125, 12.4619140625, 13.18115234375, 13.900390625, 14.61962890625, 15.3388671875, 16.05810546875, 16.77734375, 17.49658203125, 18.2158203125, 18.93505859375, 19.654296875, 20.37353515625, 21.0927734375, 21.81201171875, 22.53125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 8.0, 15.0, 18.0, 21.0, 34.0, 48.0, 77.0, 117.0, 168.0, 260.0, 416.0, 642.0, 795.0, 517.0, 337.0, 220.0, 121.0, 97.0, 50.0, 32.0, 28.0, 17.0, 7.0, 10.0, 8.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.375, -16.955322265625, -16.53564453125, -16.115966796875, -15.6962890625, -15.276611328125, -14.85693359375, -14.437255859375, -14.017578125, -13.597900390625, -13.17822265625, -12.758544921875, -12.3388671875, -11.919189453125, -11.49951171875, -11.079833984375, -10.66015625, -10.240478515625, -9.82080078125, -9.401123046875, -8.9814453125, -8.561767578125, -8.14208984375, -7.722412109375, -7.302734375, -6.883056640625, -6.46337890625, -6.043701171875, -5.6240234375, -5.204345703125, -4.78466796875, -4.364990234375, -3.9453125, -3.525634765625, -3.10595703125, -2.686279296875, -2.2666015625, -1.846923828125, -1.42724609375, -1.007568359375, -0.587890625, -0.168212890625, 0.25146484375, 0.671142578125, 1.0908203125, 1.510498046875, 1.93017578125, 2.349853515625, 2.76953125, 3.189208984375, 3.60888671875, 4.028564453125, 4.4482421875, 4.867919921875, 5.28759765625, 5.707275390625, 6.126953125, 6.546630859375, 6.96630859375, 7.385986328125, 7.8056640625, 8.225341796875, 8.64501953125, 9.064697265625, 9.484375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 10.0, 14.0, 30.0, 38.0, 77.0, 140.0, 232.0, 213.0, 105.0, 56.0, 35.0, 9.0, 8.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.79296112060547, -113.8218994140625, -108.85083770751953, -103.87977600097656, -98.9087142944336, -93.93765258789062, -88.96659851074219, -83.99552917480469, -79.02447509765625, -74.05341339111328, -69.08235168457031, -64.11128997802734, -59.140228271484375, -54.169166564941406, -49.1981086730957, -44.227046966552734, -39.2559814453125, -34.28491973876953, -29.313858032226562, -24.342798233032227, -19.371736526489258, -14.400674819946289, -9.429615020751953, -4.458553314208984, 0.5125083923339844, 5.483569622039795, 10.454630851745605, 15.425691604614258, 20.396753311157227, 25.367815017700195, 30.33887481689453, 35.3099365234375, 40.28099060058594, 45.252052307128906, 50.223114013671875, 55.194175720214844, 60.16523742675781, 65.13629913330078, 70.10736083984375, 75.07841491699219, 80.04948425292969, 85.02054595947266, 89.99160766601562, 94.9626693725586, 99.93373107910156, 104.90479278564453, 109.8758544921875, 114.84690856933594, 119.8179702758789, 124.78903198242188, 129.7600860595703, 134.7311553955078, 139.70220947265625, 144.67327880859375, 149.6443328857422, 154.6154022216797, 159.58645629882812, 164.55751037597656, 169.52857971191406, 174.4996337890625, 179.470703125, 184.44175720214844, 189.41282653808594, 194.38388061523438, 199.35494995117188]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 9.0, 9.0, 14.0, 18.0, 20.0, 21.0, 27.0, 38.0, 44.0, 41.0, 47.0, 72.0, 69.0, 68.0, 63.0, 58.0, 48.0, 60.0, 46.0, 43.0, 29.0, 25.0, 29.0, 21.0, 17.0, 16.0, 12.0, 11.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.29485321044922, -63.03205490112305, -60.769256591796875, -58.50645446777344, -56.243656158447266, -53.980857849121094, -51.718055725097656, -49.455257415771484, -47.19245910644531, -44.92966079711914, -42.66686248779297, -40.40406036376953, -38.14126205444336, -35.87846374511719, -33.61566162109375, -31.352863311767578, -29.090065002441406, -26.827266693115234, -24.56446647644043, -22.301666259765625, -20.038867950439453, -17.77606964111328, -15.513269424438477, -13.250470161437988, -10.9876708984375, -8.724871635437012, -6.462072372436523, -4.199273109436035, -1.9364738464355469, 0.3263254165649414, 2.5891246795654297, 4.851923942565918, 7.114723205566406, 9.377522468566895, 11.640321731567383, 13.903120994567871, 16.16592025756836, 18.42871856689453, 20.691518783569336, 22.95431900024414, 25.217117309570312, 27.479915618896484, 29.74271583557129, 32.005516052246094, 34.268314361572266, 36.53111267089844, 38.793914794921875, 41.05671310424805, 43.31951141357422, 45.58230972290039, 47.84510803222656, 50.10791015625, 52.37070846557617, 54.633506774902344, 56.89630889892578, 59.15910720825195, 61.421905517578125, 63.6847038269043, 65.94750213623047, 68.2103042602539, 70.47309875488281, 72.73590087890625, 74.99870300292969, 77.2614974975586, 79.52429962158203]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 4.0, 7.0, 16.0, 16.0, 36.0, 76.0, 141.0, 312.0, 797.0, 2308.0, 7472.0, 32387.0, 276624.0, 654898.0, 57137.0, 11173.0, 3209.0, 1122.0, 425.0, 167.0, 79.0, 57.0, 22.0, 25.0, 15.0, 9.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.9195556640625, -7.604736328125, -7.2899169921875, -6.97509765625, -6.6602783203125, -6.345458984375, -6.0306396484375, -5.7158203125, -5.4010009765625, -5.086181640625, -4.7713623046875, -4.45654296875, -4.1417236328125, -3.826904296875, -3.5120849609375, -3.197265625, -2.8824462890625, -2.567626953125, -2.2528076171875, -1.93798828125, -1.6231689453125, -1.308349609375, -0.9935302734375, -0.6787109375, -0.3638916015625, -0.049072265625, 0.2657470703125, 0.58056640625, 0.8953857421875, 1.210205078125, 1.5250244140625, 1.83984375, 2.1546630859375, 2.469482421875, 2.7843017578125, 3.09912109375, 3.4139404296875, 3.728759765625, 4.0435791015625, 4.3583984375, 4.6732177734375, 4.988037109375, 5.3028564453125, 5.61767578125, 5.9324951171875, 6.247314453125, 6.5621337890625, 6.876953125, 7.1917724609375, 7.506591796875, 7.8214111328125, 8.13623046875, 8.4510498046875, 8.765869140625, 9.0806884765625, 9.3955078125, 9.7103271484375, 10.025146484375, 10.3399658203125, 10.65478515625, 10.9696044921875, 11.284423828125, 11.5992431640625, 11.9140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 13.0, 13.0, 9.0, 17.0, 21.0, 18.0, 23.0, 29.0, 40.0, 46.0, 50.0, 62.0, 57.0, 56.0, 56.0, 64.0, 62.0, 62.0, 41.0, 48.0, 39.0, 49.0, 27.0, 23.0, 20.0, 13.0, 9.0, 9.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.9415283203125, -4.789306640625, -4.6370849609375, -4.48486328125, -4.3326416015625, -4.180419921875, -4.0281982421875, -3.8759765625, -3.7237548828125, -3.571533203125, -3.4193115234375, -3.26708984375, -3.1148681640625, -2.962646484375, -2.8104248046875, -2.658203125, -2.5059814453125, -2.353759765625, -2.2015380859375, -2.04931640625, -1.8970947265625, -1.744873046875, -1.5926513671875, -1.4404296875, -1.2882080078125, -1.135986328125, -0.9837646484375, -0.83154296875, -0.6793212890625, -0.527099609375, -0.3748779296875, -0.22265625, -0.0704345703125, 0.081787109375, 0.2340087890625, 0.38623046875, 0.5384521484375, 0.690673828125, 0.8428955078125, 0.9951171875, 1.1473388671875, 1.299560546875, 1.4517822265625, 1.60400390625, 1.7562255859375, 1.908447265625, 2.0606689453125, 2.212890625, 2.3651123046875, 2.517333984375, 2.6695556640625, 2.82177734375, 2.9739990234375, 3.126220703125, 3.2784423828125, 3.4306640625, 3.5828857421875, 3.735107421875, 3.8873291015625, 4.03955078125, 4.1917724609375, 4.343994140625, 4.4962158203125, 4.6484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 6.0, 6.0, 6.0, 5.0, 6.0, 10.0, 15.0, 18.0, 20.0, 46.0, 57.0, 87.0, 157.0, 248.0, 464.0, 1023.0, 3420.0, 24724.0, 909942.0, 97488.0, 7663.0, 1642.0, 615.0, 345.0, 202.0, 107.0, 80.0, 48.0, 27.0, 18.0, 18.0, 12.0, 9.0, 8.0, 7.0, 1.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3203125, -8.9581298828125, -8.595947265625, -8.2337646484375, -7.87158203125, -7.5093994140625, -7.147216796875, -6.7850341796875, -6.4228515625, -6.0606689453125, -5.698486328125, -5.3363037109375, -4.97412109375, -4.6119384765625, -4.249755859375, -3.8875732421875, -3.525390625, -3.1632080078125, -2.801025390625, -2.4388427734375, -2.07666015625, -1.7144775390625, -1.352294921875, -0.9901123046875, -0.6279296875, -0.2657470703125, 0.096435546875, 0.4586181640625, 0.82080078125, 1.1829833984375, 1.545166015625, 1.9073486328125, 2.26953125, 2.6317138671875, 2.993896484375, 3.3560791015625, 3.71826171875, 4.0804443359375, 4.442626953125, 4.8048095703125, 5.1669921875, 5.5291748046875, 5.891357421875, 6.2535400390625, 6.61572265625, 6.9779052734375, 7.340087890625, 7.7022705078125, 8.064453125, 8.4266357421875, 8.788818359375, 9.1510009765625, 9.51318359375, 9.8753662109375, 10.237548828125, 10.5997314453125, 10.9619140625, 11.3240966796875, 11.686279296875, 12.0484619140625, 12.41064453125, 12.7728271484375, 13.135009765625, 13.4971923828125, 13.859375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 7.0, 5.0, 9.0, 11.0, 11.0, 18.0, 19.0, 17.0, 24.0, 31.0, 34.0, 34.0, 51.0, 79.0, 88.0, 89.0, 71.0, 73.0, 64.0, 36.0, 39.0, 33.0, 22.0, 17.0, 22.0, 19.0, 18.0, 10.0, 9.0, 6.0, 2.0, 4.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.59375, -14.066162109375, -13.53857421875, -13.010986328125, -12.4833984375, -11.955810546875, -11.42822265625, -10.900634765625, -10.373046875, -9.845458984375, -9.31787109375, -8.790283203125, -8.2626953125, -7.735107421875, -7.20751953125, -6.679931640625, -6.15234375, -5.624755859375, -5.09716796875, -4.569580078125, -4.0419921875, -3.514404296875, -2.98681640625, -2.459228515625, -1.931640625, -1.404052734375, -0.87646484375, -0.348876953125, 0.1787109375, 0.706298828125, 1.23388671875, 1.761474609375, 2.2890625, 2.816650390625, 3.34423828125, 3.871826171875, 4.3994140625, 4.927001953125, 5.45458984375, 5.982177734375, 6.509765625, 7.037353515625, 7.56494140625, 8.092529296875, 8.6201171875, 9.147705078125, 9.67529296875, 10.202880859375, 10.73046875, 11.258056640625, 11.78564453125, 12.313232421875, 12.8408203125, 13.368408203125, 13.89599609375, 14.423583984375, 14.951171875, 15.478759765625, 16.00634765625, 16.533935546875, 17.0615234375, 17.589111328125, 18.11669921875, 18.644287109375, 19.171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 7.0, 7.0, 4.0, 5.0, 17.0, 12.0, 4.0, 16.0, 15.0, 34.0, 36.0, 72.0, 98.0, 171.0, 305.0, 704.0, 1848.0, 6899.0, 42700.0, 922267.0, 60966.0, 8406.0, 2291.0, 776.0, 343.0, 163.0, 125.0, 96.0, 40.0, 30.0, 22.0, 7.0, 7.0, 9.0, 7.0, 9.0, 9.0, 7.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.810546875, -1.7549591064453125, -1.699371337890625, -1.6437835693359375, -1.58819580078125, -1.5326080322265625, -1.477020263671875, -1.4214324951171875, -1.3658447265625, -1.3102569580078125, -1.254669189453125, -1.1990814208984375, -1.14349365234375, -1.0879058837890625, -1.032318115234375, -0.9767303466796875, -0.921142578125, -0.8655548095703125, -0.809967041015625, -0.7543792724609375, -0.69879150390625, -0.6432037353515625, -0.587615966796875, -0.5320281982421875, -0.4764404296875, -0.4208526611328125, -0.365264892578125, -0.3096771240234375, -0.25408935546875, -0.1985015869140625, -0.142913818359375, -0.0873260498046875, -0.03173828125, 0.0238494873046875, 0.079437255859375, 0.1350250244140625, 0.19061279296875, 0.2462005615234375, 0.301788330078125, 0.3573760986328125, 0.4129638671875, 0.4685516357421875, 0.524139404296875, 0.5797271728515625, 0.63531494140625, 0.6909027099609375, 0.746490478515625, 0.8020782470703125, 0.857666015625, 0.9132537841796875, 0.968841552734375, 1.0244293212890625, 1.08001708984375, 1.1356048583984375, 1.191192626953125, 1.2467803955078125, 1.3023681640625, 1.3579559326171875, 1.413543701171875, 1.4691314697265625, 1.52471923828125, 1.5803070068359375, 1.635894775390625, 1.6914825439453125, 1.7470703125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 7.0, 5.0, 12.0, 9.0, 15.0, 16.0, 23.0, 17.0, 28.0, 35.0, 45.0, 62.0, 104.0, 105.0, 120.0, 90.0, 57.0, 49.0, 38.0, 24.0, 20.0, 19.0, 20.0, 19.0, 4.0, 13.0, 7.0, 4.0, 5.0, 4.0, 1.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002646446228027344, -0.0002555251121520996, -0.00024640560150146484, -0.00023728609085083008, -0.0002281665802001953, -0.00021904706954956055, -0.00020992755889892578, -0.00020080804824829102, -0.00019168853759765625, -0.00018256902694702148, -0.00017344951629638672, -0.00016433000564575195, -0.0001552104949951172, -0.00014609098434448242, -0.00013697147369384766, -0.0001278519630432129, -0.00011873245239257812, -0.00010961294174194336, -0.0001004934310913086, -9.137392044067383e-05, -8.225440979003906e-05, -7.31348991394043e-05, -6.401538848876953e-05, -5.4895877838134766e-05, -4.57763671875e-05, -3.6656856536865234e-05, -2.753734588623047e-05, -1.8417835235595703e-05, -9.298324584960938e-06, -1.7881393432617188e-07, 8.940696716308594e-06, 1.806020736694336e-05, 2.7179718017578125e-05, 3.629922866821289e-05, 4.5418739318847656e-05, 5.453824996948242e-05, 6.365776062011719e-05, 7.277727127075195e-05, 8.189678192138672e-05, 9.101629257202148e-05, 0.00010013580322265625, 0.00010925531387329102, 0.00011837482452392578, 0.00012749433517456055, 0.0001366138458251953, 0.00014573335647583008, 0.00015485286712646484, 0.0001639723777770996, 0.00017309188842773438, 0.00018221139907836914, 0.0001913309097290039, 0.00020045042037963867, 0.00020956993103027344, 0.0002186894416809082, 0.00022780895233154297, 0.00023692846298217773, 0.0002460479736328125, 0.00025516748428344727, 0.00026428699493408203, 0.0002734065055847168, 0.00028252601623535156, 0.00029164552688598633, 0.0003007650375366211, 0.00030988454818725586, 0.0003190040588378906]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 4.0, 5.0, 4.0, 5.0, 10.0, 11.0, 20.0, 23.0, 29.0, 49.0, 113.0, 155.0, 293.0, 525.0, 1040.0, 2366.0, 5917.0, 18845.0, 102298.0, 836525.0, 58790.0, 13352.0, 4435.0, 1876.0, 834.0, 451.0, 239.0, 136.0, 70.0, 36.0, 38.0, 26.0, 8.0, 13.0, 4.0, 6.0, 4.0, 1.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3076171875, -1.264556884765625, -1.22149658203125, -1.178436279296875, -1.1353759765625, -1.092315673828125, -1.04925537109375, -1.006195068359375, -0.963134765625, -0.920074462890625, -0.87701416015625, -0.833953857421875, -0.7908935546875, -0.747833251953125, -0.70477294921875, -0.661712646484375, -0.61865234375, -0.575592041015625, -0.53253173828125, -0.489471435546875, -0.4464111328125, -0.403350830078125, -0.36029052734375, -0.317230224609375, -0.274169921875, -0.231109619140625, -0.18804931640625, -0.144989013671875, -0.1019287109375, -0.058868408203125, -0.01580810546875, 0.027252197265625, 0.0703125, 0.113372802734375, 0.15643310546875, 0.199493408203125, 0.2425537109375, 0.285614013671875, 0.32867431640625, 0.371734619140625, 0.414794921875, 0.457855224609375, 0.50091552734375, 0.543975830078125, 0.5870361328125, 0.630096435546875, 0.67315673828125, 0.716217041015625, 0.75927734375, 0.802337646484375, 0.84539794921875, 0.888458251953125, 0.9315185546875, 0.974578857421875, 1.01763916015625, 1.060699462890625, 1.103759765625, 1.146820068359375, 1.18988037109375, 1.232940673828125, 1.2760009765625, 1.319061279296875, 1.36212158203125, 1.405181884765625, 1.4482421875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 8.0, 4.0, 8.0, 4.0, 6.0, 8.0, 6.0, 6.0, 7.0, 14.0, 30.0, 25.0, 30.0, 45.0, 61.0, 99.0, 113.0, 111.0, 121.0, 75.0, 55.0, 30.0, 34.0, 26.0, 19.0, 12.0, 12.0, 8.0, 3.0, 5.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3369140625, -1.292449951171875, -1.24798583984375, -1.203521728515625, -1.1590576171875, -1.114593505859375, -1.07012939453125, -1.025665283203125, -0.981201171875, -0.936737060546875, -0.89227294921875, -0.847808837890625, -0.8033447265625, -0.758880615234375, -0.71441650390625, -0.669952392578125, -0.62548828125, -0.581024169921875, -0.53656005859375, -0.492095947265625, -0.4476318359375, -0.403167724609375, -0.35870361328125, -0.314239501953125, -0.269775390625, -0.225311279296875, -0.18084716796875, -0.136383056640625, -0.0919189453125, -0.047454833984375, -0.00299072265625, 0.041473388671875, 0.0859375, 0.130401611328125, 0.17486572265625, 0.219329833984375, 0.2637939453125, 0.308258056640625, 0.35272216796875, 0.397186279296875, 0.441650390625, 0.486114501953125, 0.53057861328125, 0.575042724609375, 0.6195068359375, 0.663970947265625, 0.70843505859375, 0.752899169921875, 0.79736328125, 0.841827392578125, 0.88629150390625, 0.930755615234375, 0.9752197265625, 1.019683837890625, 1.06414794921875, 1.108612060546875, 1.153076171875, 1.197540283203125, 1.24200439453125, 1.286468505859375, 1.3309326171875, 1.375396728515625, 1.41986083984375, 1.464324951171875, 1.5087890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 14.0, 9.0, 11.0, 34.0, 31.0, 77.0, 235.0, 357.0, 93.0, 46.0, 30.0, 21.0, 15.0, 6.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.122108459472656, -54.56947708129883, -53.016845703125, -51.46421432495117, -49.911582946777344, -48.358951568603516, -46.80632019042969, -45.253692626953125, -43.70105743408203, -42.1484260559082, -40.595794677734375, -39.04316329956055, -37.49053192138672, -35.93790054321289, -34.38526916503906, -32.8326416015625, -31.280010223388672, -29.727378845214844, -28.174747467041016, -26.622116088867188, -25.06948471069336, -23.51685333251953, -21.964223861694336, -20.411592483520508, -18.85896110534668, -17.30632972717285, -15.753698348999023, -14.201067924499512, -12.648436546325684, -11.095805168151855, -9.543174743652344, -7.990543365478516, -6.437915802001953, -4.885284423828125, -3.332653522491455, -1.7800226211547852, -0.22739124298095703, 1.325240135192871, 2.877870559692383, 4.430501937866211, 5.983133316040039, 7.535764694213867, 9.088396072387695, 10.641026496887207, 12.193657875061035, 13.746289253234863, 15.298919677734375, 16.851551055908203, 18.40418243408203, 19.95681381225586, 21.509445190429688, 23.062076568603516, 24.614707946777344, 26.167339324951172, 27.719968795776367, 29.272600173950195, 30.825231552124023, 32.37786102294922, 33.93049240112305, 35.483123779296875, 37.0357551574707, 38.58838653564453, 40.14101791381836, 41.69364929199219, 43.246280670166016]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [6.0, 3.0, 1.0, 5.0, 4.0, 15.0, 6.0, 9.0, 15.0, 18.0, 22.0, 20.0, 26.0, 28.0, 29.0, 97.0, 210.0, 189.0, 91.0, 29.0, 30.0, 25.0, 11.0, 22.0, 16.0, 21.0, 17.0, 17.0, 7.0, 5.0, 6.0, 2.0, 5.0, 1.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.048458099365234, -24.511716842651367, -22.9749755859375, -21.438236236572266, -19.9014949798584, -18.36475372314453, -16.828014373779297, -15.29127311706543, -13.754531860351562, -12.217790603637695, -10.681050300598145, -9.144309997558594, -7.607568740844727, -6.070827960968018, -4.534087181091309, -2.997346878051758, -1.4606056213378906, 0.07613515853881836, 1.6128759384155273, 3.1496167182922363, 4.686357498168945, 6.223098278045654, 7.759839057922363, 9.296579360961914, 10.833320617675781, 12.370061874389648, 13.9068021774292, 15.44354248046875, 16.980283737182617, 18.517024993896484, 20.05376434326172, 21.590505599975586, 23.12725067138672, 24.663991928100586, 26.200733184814453, 27.737472534179688, 29.274213790893555, 30.810955047607422, 32.347694396972656, 33.884437561035156, 35.42117691040039, 36.957916259765625, 38.494659423828125, 40.03139877319336, 41.568138122558594, 43.104881286621094, 44.64162063598633, 46.17835998535156, 47.71510314941406, 49.2518424987793, 50.7885856628418, 52.32532501220703, 53.86206817626953, 55.398807525634766, 56.935546875, 58.4722900390625, 60.009029388427734, 61.54576873779297, 63.08251190185547, 64.61925506591797, 66.15599060058594, 67.69273376464844, 69.22947692871094, 70.7662124633789, 72.3029556274414]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 1.0, 12.0, 16.0, 17.0, 24.0, 28.0, 50.0, 49.0, 69.0, 262.0, 199.0, 64.0, 57.0, 37.0, 33.0, 21.0, 22.0, 13.0, 7.0, 8.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1875, -4.961181640625, -4.73486328125, -4.508544921875, -4.2822265625, -4.055908203125, -3.82958984375, -3.603271484375, -3.376953125, -3.150634765625, -2.92431640625, -2.697998046875, -2.4716796875, -2.245361328125, -2.01904296875, -1.792724609375, -1.56640625, -1.340087890625, -1.11376953125, -0.887451171875, -0.6611328125, -0.434814453125, -0.20849609375, 0.017822265625, 0.244140625, 0.470458984375, 0.69677734375, 0.923095703125, 1.1494140625, 1.375732421875, 1.60205078125, 1.828369140625, 2.0546875, 2.281005859375, 2.50732421875, 2.733642578125, 2.9599609375, 3.186279296875, 3.41259765625, 3.638916015625, 3.865234375, 4.091552734375, 4.31787109375, 4.544189453125, 4.7705078125, 4.996826171875, 5.22314453125, 5.449462890625, 5.67578125, 5.902099609375, 6.12841796875, 6.354736328125, 6.5810546875, 6.807373046875, 7.03369140625, 7.260009765625, 7.486328125, 7.712646484375, 7.93896484375, 8.165283203125, 8.3916015625, 8.617919921875, 8.84423828125, 9.070556640625, 9.296875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 10.0, 18.0, 46.0, 71.0, 257.0, 1674.0, 8332157.0, 52909.0, 1111.0, 185.0, 61.0, 33.0, 32.0, 8.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-182.10321044921875, -178.22169494628906, -174.3401641845703, -170.45864868164062, -166.57713317871094, -162.6956024169922, -158.8140869140625, -154.93255615234375, -151.05104064941406, -147.16952514648438, -143.28799438476562, -139.40647888183594, -135.52496337890625, -131.6434326171875, -127.76191711425781, -123.8803939819336, -119.99887084960938, -116.11734771728516, -112.23583221435547, -108.35430908203125, -104.47278594970703, -100.59126281738281, -96.70974731445312, -92.8282241821289, -88.94670867919922, -85.065185546875, -81.18367004394531, -77.3021469116211, -73.42062377929688, -69.53910827636719, -65.65758514404297, -61.77606201171875, -57.89453887939453, -54.01301956176758, -50.13149642944336, -46.249977111816406, -42.36845397949219, -38.486934661865234, -34.60541534423828, -30.723892211914062, -26.842370986938477, -22.96084976196289, -19.079328536987305, -15.197808265686035, -11.31628704071045, -7.43476676940918, -3.5532455444335938, 0.3282756805419922, 4.209796905517578, 8.091318130493164, 11.97283935546875, 15.85435962677002, 19.735881805419922, 23.617401123046875, 27.49892234802246, 31.380443572998047, 35.261962890625, 39.14348220825195, 43.02500534057617, 46.906524658203125, 50.788047790527344, 54.6695671081543, 58.55108642578125, 62.43260955810547, 66.31413269042969]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 4.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 8.0, 5.0, 3.0, 5.0, 7.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-148.4525604248047, -144.3014373779297, -140.15029907226562, -135.99917602539062, -131.84805297851562, -127.69692993164062, -123.5457992553711, -119.39466857910156, -115.24354553222656, -111.09242248535156, -106.94129180908203, -102.7901611328125, -98.6390380859375, -94.4879150390625, -90.33678436279297, -86.18565368652344, -82.03453063964844, -77.88340759277344, -73.7322769165039, -69.58114624023438, -65.43002319335938, -61.27889633178711, -57.127769470214844, -52.97664260864258, -48.82551574707031, -44.67438888549805, -40.52326202392578, -36.372135162353516, -32.22100830078125, -28.069881439208984, -23.91875457763672, -19.767627716064453, -15.61651611328125, -11.465389251708984, -7.314262390136719, -3.163135528564453, 0.9879913330078125, 5.139118194580078, 9.290245056152344, 13.44137191772461, 17.592498779296875, 21.74362564086914, 25.894752502441406, 30.045879364013672, 34.19700622558594, 38.3481330871582, 42.49925994873047, 46.650386810302734, 50.801513671875, 54.952640533447266, 59.10376739501953, 63.2548942565918, 67.40602111816406, 71.55714416503906, 75.7082748413086, 79.85940551757812, 84.01052856445312, 88.16165161132812, 92.31278228759766, 96.46391296386719, 100.61503601074219, 104.76615905761719, 108.91728973388672, 113.06842041015625, 117.21954345703125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 11.0, 7.0, 29.0, 51.0, 128.0, 252.0, 670.0, 2136.0, 10366.0, 84306.0, 350611.0, 64366.0, 8312.0, 1874.0, 604.0, 255.0, 130.0, 68.0, 41.0, 14.0, 13.0, 8.0, 4.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.3125, -67.8408203125, -65.369140625, -62.8974609375, -60.42578125, -57.9541015625, -55.482421875, -53.0107421875, -50.5390625, -48.0673828125, -45.595703125, -43.1240234375, -40.65234375, -38.1806640625, -35.708984375, -33.2373046875, -30.765625, -28.2939453125, -25.822265625, -23.3505859375, -20.87890625, -18.4072265625, -15.935546875, -13.4638671875, -10.9921875, -8.5205078125, -6.048828125, -3.5771484375, -1.10546875, 1.3662109375, 3.837890625, 6.3095703125, 8.78125, 11.2529296875, 13.724609375, 16.1962890625, 18.66796875, 21.1396484375, 23.611328125, 26.0830078125, 28.5546875, 31.0263671875, 33.498046875, 35.9697265625, 38.44140625, 40.9130859375, 43.384765625, 45.8564453125, 48.328125, 50.7998046875, 53.271484375, 55.7431640625, 58.21484375, 60.6865234375, 63.158203125, 65.6298828125, 68.1015625, 70.5732421875, 73.044921875, 75.5166015625, 77.98828125, 80.4599609375, 82.931640625, 85.4033203125, 87.875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 6.0, 3.0, 4.0, 8.0, 14.0, 15.0, 21.0, 16.0, 21.0, 20.0, 27.0, 37.0, 38.0, 49.0, 69.0, 79.0, 60.0, 83.0, 72.0, 80.0, 49.0, 47.0, 35.0, 22.0, 28.0, 12.0, 15.0, 12.0, 10.0, 17.0, 6.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5546875, -4.39349365234375, -4.2322998046875, -4.07110595703125, -3.909912109375, -3.74871826171875, -3.5875244140625, -3.42633056640625, -3.26513671875, -3.10394287109375, -2.9427490234375, -2.78155517578125, -2.620361328125, -2.45916748046875, -2.2979736328125, -2.13677978515625, -1.9755859375, -1.81439208984375, -1.6531982421875, -1.49200439453125, -1.330810546875, -1.16961669921875, -1.0084228515625, -0.84722900390625, -0.68603515625, -0.52484130859375, -0.3636474609375, -0.20245361328125, -0.041259765625, 0.11993408203125, 0.2811279296875, 0.44232177734375, 0.603515625, 0.76470947265625, 0.9259033203125, 1.08709716796875, 1.248291015625, 1.40948486328125, 1.5706787109375, 1.73187255859375, 1.89306640625, 2.05426025390625, 2.2154541015625, 2.37664794921875, 2.537841796875, 2.69903564453125, 2.8602294921875, 3.02142333984375, 3.1826171875, 3.34381103515625, 3.5050048828125, 3.66619873046875, 3.827392578125, 3.98858642578125, 4.1497802734375, 4.31097412109375, 4.47216796875, 4.63336181640625, 4.7945556640625, 4.95574951171875, 5.116943359375, 5.27813720703125, 5.4393310546875, 5.60052490234375, 5.76171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 7.0, 11.0, 11.0, 14.0, 10.0, 28.0, 30.0, 42.0, 57.0, 61.0, 46.0, 41.0, 25.0, 32.0, 13.0, 10.0, 5.0, 5.0, 4.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.920490264892578, -25.069591522216797, -24.218692779541016, -23.3677921295166, -22.51689338684082, -21.66599464416504, -20.815093994140625, -19.964195251464844, -19.113296508789062, -18.26239776611328, -17.4114990234375, -16.560598373413086, -15.709699630737305, -14.858800888061523, -14.007901191711426, -13.157001495361328, -12.306102752685547, -11.455204010009766, -10.604304313659668, -9.75340461730957, -8.902505874633789, -8.051607131958008, -7.20070743560791, -6.349808216094971, -5.498908996582031, -4.648009777069092, -3.7971105575561523, -2.946211338043213, -2.0953121185302734, -1.244412899017334, -0.39351367950439453, 0.4573855400085449, 1.3082847595214844, 2.159183979034424, 3.0100831985473633, 3.8609824180603027, 4.711881637573242, 5.562780857086182, 6.413680076599121, 7.2645792961120605, 8.115478515625, 8.966377258300781, 9.817276954650879, 10.668176651000977, 11.519075393676758, 12.369974136352539, 13.220873832702637, 14.071773529052734, 14.922672271728516, 15.773571014404297, 16.624469757080078, 17.475370407104492, 18.326269149780273, 19.177167892456055, 20.02806854248047, 20.87896728515625, 21.72986602783203, 22.580764770507812, 23.431663513183594, 24.282564163208008, 25.13346290588379, 25.98436164855957, 26.835262298583984, 27.686161041259766, 28.537059783935547]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 2.0, 3.0, 10.0, 8.0, 15.0, 34.0, 60.0, 68.0, 83.0, 69.0, 49.0, 20.0, 12.0, 8.0, 5.0, 6.0, 7.0, 10.0, 1.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-40.37859344482422, -39.307743072509766, -38.23689270019531, -37.16604232788086, -36.095191955566406, -35.02434539794922, -33.953495025634766, -32.88264465332031, -31.81179428100586, -30.740943908691406, -29.670093536376953, -28.599245071411133, -27.52839469909668, -26.457544326782227, -25.386695861816406, -24.315845489501953, -23.2449951171875, -22.174144744873047, -21.103294372558594, -20.032445907592773, -18.96159553527832, -17.890745162963867, -16.819896697998047, -15.749046325683594, -14.67819595336914, -13.607345581054688, -12.53649616241455, -11.465646743774414, -10.394796371459961, -9.323945999145508, -8.253096580505371, -7.182246685028076, -6.111396789550781, -5.040546894073486, -3.9696969985961914, -2.8988471031188965, -1.8279972076416016, -0.7571473121643066, 0.3137025833129883, 1.3845524787902832, 2.455402374267578, 3.526252269744873, 4.597102165222168, 5.667952060699463, 6.738801956176758, 7.809651851654053, 8.880501747131348, 9.951351165771484, 11.022201538085938, 12.09305191040039, 13.163901329040527, 14.234750747680664, 15.305601119995117, 16.37645149230957, 17.44729995727539, 18.518150329589844, 19.589000701904297, 20.65985107421875, 21.730701446533203, 22.801549911499023, 23.872400283813477, 24.94325065612793, 26.01409912109375, 27.084949493408203, 28.155799865722656]}, "eval/loss": 5.21882963180542, "eval/wer": 0.9237653034902871, "eval/runtime": 426.2702, "eval/samples_per_second": 6.198, "eval/steps_per_second": 0.389, "train/train_runtime": 83793.5909, "train/train_samples_per_second": 6.811, "train/train_steps_per_second": 0.053, "train/total_flos": 0.0, "train/train_loss": 5.624244330977111} \ No newline at end of file