diff --git "a/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" "b/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" --- "a/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" +++ "b/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.0162, "train/learning_rate": 8.907363420427554e-09, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 108038, "_timestamp": 1647482580, "_step": 17851, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 8.0, 12.0, 6.0, 8.0, 6.0, 12.0, 15.0, 17.0, 22.0, 35.0, 43.0, 41.0, 53.0, 54.0, 47.0, 56.0, 65.0, 50.0, 58.0, 50.0, 53.0, 44.0, 45.0, 43.0, 38.0, 23.0, 22.0, 17.0, 19.0, 12.0, 9.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.21875762939453, -88.52344512939453, -86.828125, -85.1328125, -83.43749237060547, -81.74217987060547, -80.04685974121094, -78.35154724121094, -76.65623474121094, -74.96092224121094, -73.2656021118164, -71.5702896118164, -69.87496948242188, -68.17965698242188, -66.48433685302734, -64.78902435302734, -63.09370422363281, -61.39838790893555, -59.70307159423828, -58.007755279541016, -56.31243896484375, -54.61712646484375, -52.921810150146484, -51.22649383544922, -49.53117752075195, -47.83586120605469, -46.14054489135742, -44.445228576660156, -42.749916076660156, -41.054595947265625, -39.359283447265625, -37.66396713256836, -35.96865463256836, -34.273338317871094, -32.57802200317383, -30.882707595825195, -29.18739128112793, -27.492074966430664, -25.79676055908203, -24.101444244384766, -22.4061279296875, -20.710811614990234, -19.01549530029297, -17.320180892944336, -15.62486457824707, -13.929548263549805, -12.234232902526855, -10.538917541503906, -8.84360122680664, -7.148285388946533, -5.452969551086426, -3.7576537132263184, -2.062337875366211, -0.3670215606689453, 1.328293800354004, 3.023609161376953, 4.718925476074219, 6.414241313934326, 8.109557151794434, 9.804872512817383, 11.500188827514648, 13.195505142211914, 14.890820503234863, 16.586135864257812, 18.281452178955078]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 6.0, 3.0, 2.0, 7.0, 7.0, 12.0, 14.0, 7.0, 15.0, 15.0, 26.0, 24.0, 24.0, 22.0, 35.0, 31.0, 23.0, 37.0, 38.0, 36.0, 32.0, 50.0, 48.0, 40.0, 41.0, 39.0, 35.0, 33.0, 49.0, 19.0, 29.0, 29.0, 18.0, 25.0, 19.0, 16.0, 24.0, 9.0, 14.0, 16.0, 9.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.85319900512695, -38.5408935546875, -37.22859191894531, -35.91628646850586, -34.60398483276367, -33.29167938232422, -31.9793758392334, -30.667072296142578, -29.354766845703125, -28.042463302612305, -26.730159759521484, -25.41785430908203, -24.10555076599121, -22.79324722290039, -21.48094367980957, -20.16864013671875, -18.85633659362793, -17.54403305053711, -16.23172950744629, -14.919425010681152, -13.607120513916016, -12.294816970825195, -10.982513427734375, -9.670208930969238, -8.357905387878418, -7.0456013679504395, -5.733297348022461, -4.420993804931641, -3.108689785003662, -1.7963857650756836, -0.4840822219848633, 0.8282222747802734, 2.1405258178710938, 3.4528298377990723, 4.765133857727051, 6.077437400817871, 7.38974142074585, 8.702045440673828, 10.014348983764648, 11.326653480529785, 12.638957023620605, 13.951260566711426, 15.263565063476562, 16.575868606567383, 17.888172149658203, 19.200477600097656, 20.512779235839844, 21.825084686279297, 23.137388229370117, 24.449691772460938, 25.761995315551758, 27.074298858642578, 28.38660430908203, 29.69890785217285, 31.011211395263672, 32.323516845703125, 33.63581848144531, 34.948123931884766, 36.26042556762695, 37.572731018066406, 38.885032653808594, 40.19733810424805, 41.5096435546875, 42.82194519042969, 44.13425064086914]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 10.0, 14.0, 25.0, 40.0, 47.0, 82.0, 141.0, 254.0, 401.0, 613.0, 991.0, 1579.0, 2531.0, 4057.0, 6334.0, 10190.0, 15867.0, 25238.0, 39251.0, 60422.0, 93260.0, 140151.0, 206561.0, 294505.0, 398751.0, 495048.0, 539183.0, 503644.0, 412134.0, 306321.0, 215690.0, 146820.0, 97775.0, 62907.0, 41042.0, 26517.0, 16954.0, 10778.0, 6679.0, 4275.0, 2650.0, 1652.0, 1122.0, 678.0, 415.0, 250.0, 173.0, 99.0, 64.0, 38.0, 33.0, 10.0, 9.0, 4.0, 6.0, 1.0, 2.0, 1.0], "bins": [-69.375, -67.244140625, -65.11328125, -62.982421875, -60.8515625, -58.720703125, -56.58984375, -54.458984375, -52.328125, -50.197265625, -48.06640625, -45.935546875, -43.8046875, -41.673828125, -39.54296875, -37.412109375, -35.28125, -33.150390625, -31.01953125, -28.888671875, -26.7578125, -24.626953125, -22.49609375, -20.365234375, -18.234375, -16.103515625, -13.97265625, -11.841796875, -9.7109375, -7.580078125, -5.44921875, -3.318359375, -1.1875, 0.943359375, 3.07421875, 5.205078125, 7.3359375, 9.466796875, 11.59765625, 13.728515625, 15.859375, 17.990234375, 20.12109375, 22.251953125, 24.3828125, 26.513671875, 28.64453125, 30.775390625, 32.90625, 35.037109375, 37.16796875, 39.298828125, 41.4296875, 43.560546875, 45.69140625, 47.822265625, 49.953125, 52.083984375, 54.21484375, 56.345703125, 58.4765625, 60.607421875, 62.73828125, 64.869140625, 67.0]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 8.0, 3.0, 8.0, 12.0, 9.0, 7.0, 7.0, 9.0, 20.0, 23.0, 17.0, 19.0, 19.0, 32.0, 23.0, 21.0, 29.0, 28.0, 30.0, 42.0, 37.0, 47.0, 35.0, 42.0, 34.0, 29.0, 32.0, 33.0, 40.0, 29.0, 17.0, 22.0, 24.0, 28.0, 23.0, 16.0, 8.0, 15.0, 16.0, 24.0, 10.0, 10.0, 10.0, 11.0, 8.0, 7.0, 4.0, 4.0, 5.0, 1.0, 4.0, 1.0, 6.0], "bins": [-44.59375, -43.29345703125, -41.9931640625, -40.69287109375, -39.392578125, -38.09228515625, -36.7919921875, -35.49169921875, -34.19140625, -32.89111328125, -31.5908203125, -30.29052734375, -28.990234375, -27.68994140625, -26.3896484375, -25.08935546875, -23.7890625, -22.48876953125, -21.1884765625, -19.88818359375, -18.587890625, -17.28759765625, -15.9873046875, -14.68701171875, -13.38671875, -12.08642578125, -10.7861328125, -9.48583984375, -8.185546875, -6.88525390625, -5.5849609375, -4.28466796875, -2.984375, -1.68408203125, -0.3837890625, 0.91650390625, 2.216796875, 3.51708984375, 4.8173828125, 6.11767578125, 7.41796875, 8.71826171875, 10.0185546875, 11.31884765625, 12.619140625, 13.91943359375, 15.2197265625, 16.52001953125, 17.8203125, 19.12060546875, 20.4208984375, 21.72119140625, 23.021484375, 24.32177734375, 25.6220703125, 26.92236328125, 28.22265625, 29.52294921875, 30.8232421875, 32.12353515625, 33.423828125, 34.72412109375, 36.0244140625, 37.32470703125, 38.625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 2.0, 11.0, 12.0, 27.0, 26.0, 44.0, 74.0, 134.0, 188.0, 283.0, 516.0, 890.0, 1421.0, 2352.0, 3865.0, 6632.0, 11175.0, 18153.0, 29958.0, 48549.0, 76983.0, 119442.0, 180406.0, 259012.0, 353465.0, 443011.0, 505307.0, 508941.0, 454892.0, 365317.0, 272535.0, 189286.0, 126771.0, 81705.0, 51802.0, 31955.0, 19354.0, 11873.0, 7158.0, 4307.0, 2539.0, 1601.0, 909.0, 554.0, 342.0, 180.0, 125.0, 80.0, 47.0, 28.0, 18.0, 12.0, 11.0, 3.0, 3.0, 3.0], "bins": [-63.9375, -62.1142578125, -60.291015625, -58.4677734375, -56.64453125, -54.8212890625, -52.998046875, -51.1748046875, -49.3515625, -47.5283203125, -45.705078125, -43.8818359375, -42.05859375, -40.2353515625, -38.412109375, -36.5888671875, -34.765625, -32.9423828125, -31.119140625, -29.2958984375, -27.47265625, -25.6494140625, -23.826171875, -22.0029296875, -20.1796875, -18.3564453125, -16.533203125, -14.7099609375, -12.88671875, -11.0634765625, -9.240234375, -7.4169921875, -5.59375, -3.7705078125, -1.947265625, -0.1240234375, 1.69921875, 3.5224609375, 5.345703125, 7.1689453125, 8.9921875, 10.8154296875, 12.638671875, 14.4619140625, 16.28515625, 18.1083984375, 19.931640625, 21.7548828125, 23.578125, 25.4013671875, 27.224609375, 29.0478515625, 30.87109375, 32.6943359375, 34.517578125, 36.3408203125, 38.1640625, 39.9873046875, 41.810546875, 43.6337890625, 45.45703125, 47.2802734375, 49.103515625, 50.9267578125, 52.75]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 8.0, 4.0, 6.0, 13.0, 10.0, 21.0, 16.0, 24.0, 26.0, 31.0, 30.0, 48.0, 58.0, 77.0, 75.0, 86.0, 118.0, 124.0, 114.0, 150.0, 153.0, 144.0, 208.0, 194.0, 204.0, 208.0, 216.0, 222.0, 181.0, 174.0, 173.0, 137.0, 132.0, 109.0, 109.0, 89.0, 70.0, 64.0, 50.0, 41.0, 39.0, 36.0, 20.0, 16.0, 10.0, 15.0, 5.0, 6.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.765625, -21.989013671875, -21.21240234375, -20.435791015625, -19.6591796875, -18.882568359375, -18.10595703125, -17.329345703125, -16.552734375, -15.776123046875, -14.99951171875, -14.222900390625, -13.4462890625, -12.669677734375, -11.89306640625, -11.116455078125, -10.33984375, -9.563232421875, -8.78662109375, -8.010009765625, -7.2333984375, -6.456787109375, -5.68017578125, -4.903564453125, -4.126953125, -3.350341796875, -2.57373046875, -1.797119140625, -1.0205078125, -0.243896484375, 0.53271484375, 1.309326171875, 2.0859375, 2.862548828125, 3.63916015625, 4.415771484375, 5.1923828125, 5.968994140625, 6.74560546875, 7.522216796875, 8.298828125, 9.075439453125, 9.85205078125, 10.628662109375, 11.4052734375, 12.181884765625, 12.95849609375, 13.735107421875, 14.51171875, 15.288330078125, 16.06494140625, 16.841552734375, 17.6181640625, 18.394775390625, 19.17138671875, 19.947998046875, 20.724609375, 21.501220703125, 22.27783203125, 23.054443359375, 23.8310546875, 24.607666015625, 25.38427734375, 26.160888671875, 26.9375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 9.0, 9.0, 13.0, 25.0, 20.0, 19.0, 29.0, 29.0, 32.0, 37.0, 40.0, 34.0, 62.0, 40.0, 40.0, 39.0, 40.0, 51.0, 46.0, 42.0, 44.0, 35.0, 44.0, 26.0, 29.0, 25.0, 25.0, 21.0, 17.0, 14.0, 16.0, 10.0, 12.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-78.66213989257812, -76.70450592041016, -74.74687957763672, -72.78924560546875, -70.83161163330078, -68.87398529052734, -66.91635131835938, -64.9587173461914, -63.00109100341797, -61.043460845947266, -59.0858268737793, -57.128196716308594, -55.17056655883789, -53.21293640136719, -51.25530242919922, -49.297672271728516, -47.34003829956055, -45.382408142089844, -43.424774169921875, -41.46714401245117, -39.50951385498047, -37.5518798828125, -35.5942497253418, -33.636619567871094, -31.678987503051758, -29.721355438232422, -27.76372528076172, -25.806093215942383, -23.848461151123047, -21.890830993652344, -19.933198928833008, -17.975566864013672, -16.01793670654297, -14.06030559539795, -12.10267448425293, -10.145042419433594, -8.187411308288574, -6.229780197143555, -4.272148132324219, -2.314517021179199, -0.3568859100341797, 1.600745439529419, 3.5583767890930176, 5.516008377075195, 7.473639488220215, 9.431270599365234, 11.38890266418457, 13.34653377532959, 15.30416488647461, 17.261796951293945, 19.21942710876465, 21.177059173583984, 23.134689331054688, 25.092321395874023, 27.04995346069336, 29.007583618164062, 30.9652156829834, 32.922847747802734, 34.88047790527344, 36.838111877441406, 38.79574203491211, 40.75337219238281, 42.71100616455078, 44.668636322021484, 46.62626647949219]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 10.0, 10.0, 15.0, 9.0, 19.0, 19.0, 17.0, 25.0, 30.0, 20.0, 25.0, 38.0, 39.0, 30.0, 35.0, 28.0, 41.0, 38.0, 50.0, 41.0, 42.0, 46.0, 35.0, 28.0, 31.0, 26.0, 42.0, 27.0, 34.0, 23.0, 19.0, 18.0, 13.0, 10.0, 10.0, 7.0, 12.0, 9.0, 8.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.91980743408203, -60.128684997558594, -58.33755874633789, -56.54643630981445, -54.75531005859375, -52.96418762207031, -51.173065185546875, -49.38194274902344, -47.590816497802734, -45.7996940612793, -44.008567810058594, -42.217445373535156, -40.42632293701172, -38.635196685791016, -36.84407424926758, -35.052947998046875, -33.26182556152344, -31.470701217651367, -29.679576873779297, -27.88845443725586, -26.09733009338379, -24.30620574951172, -22.51508331298828, -20.72395896911621, -18.93283462524414, -17.14171028137207, -15.350586891174316, -13.559463500976562, -11.768339157104492, -9.977214813232422, -8.186091423034668, -6.394968032836914, -4.603847503662109, -2.8127236366271973, -1.0215997695922852, 0.769524097442627, 2.560647964477539, 4.351772308349609, 6.142895698547363, 7.934019088745117, 9.725143432617188, 11.516267776489258, 13.307391166687012, 15.098514556884766, 16.889638900756836, 18.680763244628906, 20.471885681152344, 22.263010025024414, 24.054134368896484, 25.845258712768555, 27.636383056640625, 29.427505493164062, 31.218629837036133, 33.0097541809082, 34.80087661743164, 36.592002868652344, 38.38312530517578, 40.17424774169922, 41.96537399291992, 43.75649642944336, 45.54762268066406, 47.3387451171875, 49.12986755371094, 50.920989990234375, 52.71211624145508]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 9.0, 12.0, 13.0, 28.0, 43.0, 55.0, 60.0, 123.0, 208.0, 287.0, 476.0, 743.0, 1171.0, 1851.0, 3053.0, 4997.0, 8039.0, 13451.0, 22545.0, 37176.0, 60395.0, 93730.0, 133593.0, 161822.0, 156923.0, 124441.0, 85225.0, 54203.0, 32889.0, 20007.0, 11904.0, 7386.0, 4376.0, 2726.0, 1632.0, 1085.0, 678.0, 388.0, 297.0, 198.0, 110.0, 84.0, 41.0, 29.0, 19.0, 16.0, 6.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-27.84375, -26.970458984375, -26.09716796875, -25.223876953125, -24.3505859375, -23.477294921875, -22.60400390625, -21.730712890625, -20.857421875, -19.984130859375, -19.11083984375, -18.237548828125, -17.3642578125, -16.490966796875, -15.61767578125, -14.744384765625, -13.87109375, -12.997802734375, -12.12451171875, -11.251220703125, -10.3779296875, -9.504638671875, -8.63134765625, -7.758056640625, -6.884765625, -6.011474609375, -5.13818359375, -4.264892578125, -3.3916015625, -2.518310546875, -1.64501953125, -0.771728515625, 0.1015625, 0.974853515625, 1.84814453125, 2.721435546875, 3.5947265625, 4.468017578125, 5.34130859375, 6.214599609375, 7.087890625, 7.961181640625, 8.83447265625, 9.707763671875, 10.5810546875, 11.454345703125, 12.32763671875, 13.200927734375, 14.07421875, 14.947509765625, 15.82080078125, 16.694091796875, 17.5673828125, 18.440673828125, 19.31396484375, 20.187255859375, 21.060546875, 21.933837890625, 22.80712890625, 23.680419921875, 24.5537109375, 25.427001953125, 26.30029296875, 27.173583984375, 28.046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 7.0, 9.0, 8.0, 13.0, 16.0, 16.0, 17.0, 18.0, 24.0, 34.0, 16.0, 21.0, 36.0, 40.0, 31.0, 25.0, 36.0, 38.0, 41.0, 40.0, 41.0, 43.0, 41.0, 38.0, 33.0, 30.0, 24.0, 37.0, 34.0, 29.0, 27.0, 22.0, 16.0, 17.0, 15.0, 9.0, 7.0, 9.0, 8.0, 11.0, 8.0, 8.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-63.125, -61.3271484375, -59.529296875, -57.7314453125, -55.93359375, -54.1357421875, -52.337890625, -50.5400390625, -48.7421875, -46.9443359375, -45.146484375, -43.3486328125, -41.55078125, -39.7529296875, -37.955078125, -36.1572265625, -34.359375, -32.5615234375, -30.763671875, -28.9658203125, -27.16796875, -25.3701171875, -23.572265625, -21.7744140625, -19.9765625, -18.1787109375, -16.380859375, -14.5830078125, -12.78515625, -10.9873046875, -9.189453125, -7.3916015625, -5.59375, -3.7958984375, -1.998046875, -0.2001953125, 1.59765625, 3.3955078125, 5.193359375, 6.9912109375, 8.7890625, 10.5869140625, 12.384765625, 14.1826171875, 15.98046875, 17.7783203125, 19.576171875, 21.3740234375, 23.171875, 24.9697265625, 26.767578125, 28.5654296875, 30.36328125, 32.1611328125, 33.958984375, 35.7568359375, 37.5546875, 39.3525390625, 41.150390625, 42.9482421875, 44.74609375, 46.5439453125, 48.341796875, 50.1396484375, 51.9375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 9.0, 10.0, 19.0, 30.0, 36.0, 43.0, 67.0, 76.0, 119.0, 172.0, 235.0, 322.0, 479.0, 715.0, 1129.0, 1667.0, 2723.0, 4209.0, 7163.0, 12027.0, 22436.0, 56611.0, 843408.0, 44976.0, 20407.0, 11344.0, 6641.0, 4013.0, 2580.0, 1604.0, 1038.0, 692.0, 449.0, 321.0, 250.0, 138.0, 88.0, 87.0, 58.0, 37.0, 32.0, 31.0, 16.0, 11.0, 10.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-58.9375, -57.1201171875, -55.302734375, -53.4853515625, -51.66796875, -49.8505859375, -48.033203125, -46.2158203125, -44.3984375, -42.5810546875, -40.763671875, -38.9462890625, -37.12890625, -35.3115234375, -33.494140625, -31.6767578125, -29.859375, -28.0419921875, -26.224609375, -24.4072265625, -22.58984375, -20.7724609375, -18.955078125, -17.1376953125, -15.3203125, -13.5029296875, -11.685546875, -9.8681640625, -8.05078125, -6.2333984375, -4.416015625, -2.5986328125, -0.78125, 1.0361328125, 2.853515625, 4.6708984375, 6.48828125, 8.3056640625, 10.123046875, 11.9404296875, 13.7578125, 15.5751953125, 17.392578125, 19.2099609375, 21.02734375, 22.8447265625, 24.662109375, 26.4794921875, 28.296875, 30.1142578125, 31.931640625, 33.7490234375, 35.56640625, 37.3837890625, 39.201171875, 41.0185546875, 42.8359375, 44.6533203125, 46.470703125, 48.2880859375, 50.10546875, 51.9228515625, 53.740234375, 55.5576171875, 57.375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 9.0, 8.0, 6.0, 15.0, 10.0, 16.0, 14.0, 22.0, 14.0, 21.0, 20.0, 23.0, 38.0, 34.0, 42.0, 29.0, 44.0, 37.0, 40.0, 54.0, 45.0, 39.0, 27.0, 46.0, 40.0, 33.0, 40.0, 28.0, 40.0, 28.0, 28.0, 17.0, 13.0, 22.0, 14.0, 8.0, 8.0, 8.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.65625, -39.41064453125, -38.1650390625, -36.91943359375, -35.673828125, -34.42822265625, -33.1826171875, -31.93701171875, -30.69140625, -29.44580078125, -28.2001953125, -26.95458984375, -25.708984375, -24.46337890625, -23.2177734375, -21.97216796875, -20.7265625, -19.48095703125, -18.2353515625, -16.98974609375, -15.744140625, -14.49853515625, -13.2529296875, -12.00732421875, -10.76171875, -9.51611328125, -8.2705078125, -7.02490234375, -5.779296875, -4.53369140625, -3.2880859375, -2.04248046875, -0.796875, 0.44873046875, 1.6943359375, 2.93994140625, 4.185546875, 5.43115234375, 6.6767578125, 7.92236328125, 9.16796875, 10.41357421875, 11.6591796875, 12.90478515625, 14.150390625, 15.39599609375, 16.6416015625, 17.88720703125, 19.1328125, 20.37841796875, 21.6240234375, 22.86962890625, 24.115234375, 25.36083984375, 26.6064453125, 27.85205078125, 29.09765625, 30.34326171875, 31.5888671875, 32.83447265625, 34.080078125, 35.32568359375, 36.5712890625, 37.81689453125, 39.0625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 3.0, 7.0, 5.0, 13.0, 11.0, 19.0, 49.0, 39.0, 72.0, 85.0, 142.0, 213.0, 415.0, 938.0, 2470.0, 10350.0, 92506.0, 916821.0, 18308.0, 3572.0, 1174.0, 541.0, 275.0, 138.0, 118.0, 61.0, 46.0, 39.0, 20.0, 18.0, 23.0, 11.0, 11.0, 6.0, 4.0, 1.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.0859375, -11.721435546875, -11.35693359375, -10.992431640625, -10.6279296875, -10.263427734375, -9.89892578125, -9.534423828125, -9.169921875, -8.805419921875, -8.44091796875, -8.076416015625, -7.7119140625, -7.347412109375, -6.98291015625, -6.618408203125, -6.25390625, -5.889404296875, -5.52490234375, -5.160400390625, -4.7958984375, -4.431396484375, -4.06689453125, -3.702392578125, -3.337890625, -2.973388671875, -2.60888671875, -2.244384765625, -1.8798828125, -1.515380859375, -1.15087890625, -0.786376953125, -0.421875, -0.057373046875, 0.30712890625, 0.671630859375, 1.0361328125, 1.400634765625, 1.76513671875, 2.129638671875, 2.494140625, 2.858642578125, 3.22314453125, 3.587646484375, 3.9521484375, 4.316650390625, 4.68115234375, 5.045654296875, 5.41015625, 5.774658203125, 6.13916015625, 6.503662109375, 6.8681640625, 7.232666015625, 7.59716796875, 7.961669921875, 8.326171875, 8.690673828125, 9.05517578125, 9.419677734375, 9.7841796875, 10.148681640625, 10.51318359375, 10.877685546875, 11.2421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 23.0, 30.0, 33.0, 54.0, 77.0, 108.0, 137.0, 147.0, 102.0, 86.0, 60.0, 36.0, 18.0, 17.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005898475646972656, -0.0005728527903556824, -0.0005558580160140991, -0.0005388632416725159, -0.0005218684673309326, -0.0005048736929893494, -0.0004878789186477661, -0.00047088414430618286, -0.0004538893699645996, -0.00043689459562301636, -0.0004198998212814331, -0.00040290504693984985, -0.0003859102725982666, -0.00036891549825668335, -0.0003519207239151001, -0.00033492594957351685, -0.0003179311752319336, -0.00030093640089035034, -0.0002839416265487671, -0.00026694685220718384, -0.0002499520778656006, -0.00023295730352401733, -0.00021596252918243408, -0.00019896775484085083, -0.00018197298049926758, -0.00016497820615768433, -0.00014798343181610107, -0.00013098865747451782, -0.00011399388313293457, -9.699910879135132e-05, -8.000433444976807e-05, -6.300956010818481e-05, -4.601478576660156e-05, -2.902001142501831e-05, -1.2025237083435059e-05, 4.969537258148193e-06, 2.1964311599731445e-05, 3.89590859413147e-05, 5.595386028289795e-05, 7.29486346244812e-05, 8.994340896606445e-05, 0.0001069381833076477, 0.00012393295764923096, 0.0001409277319908142, 0.00015792250633239746, 0.0001749172806739807, 0.00019191205501556396, 0.00020890682935714722, 0.00022590160369873047, 0.00024289637804031372, 0.00025989115238189697, 0.0002768859267234802, 0.0002938807010650635, 0.00031087547540664673, 0.00032787024974823, 0.00034486502408981323, 0.0003618597984313965, 0.00037885457277297974, 0.000395849347114563, 0.00041284412145614624, 0.0004298388957977295, 0.00044683367013931274, 0.000463828444480896, 0.00048082321882247925, 0.0004978179931640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 12.0, 18.0, 26.0, 27.0, 44.0, 60.0, 74.0, 151.0, 212.0, 399.0, 745.0, 1475.0, 3388.0, 8242.0, 20828.0, 54635.0, 139127.0, 277642.0, 290147.0, 151537.0, 60375.0, 22905.0, 9126.0, 3815.0, 1639.0, 815.0, 402.0, 230.0, 156.0, 92.0, 59.0, 43.0, 22.0, 17.0, 21.0, 11.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -8.02288818359375, -7.7801513671875, -7.53741455078125, -7.294677734375, -7.05194091796875, -6.8092041015625, -6.56646728515625, -6.32373046875, -6.08099365234375, -5.8382568359375, -5.59552001953125, -5.352783203125, -5.11004638671875, -4.8673095703125, -4.62457275390625, -4.3818359375, -4.13909912109375, -3.8963623046875, -3.65362548828125, -3.410888671875, -3.16815185546875, -2.9254150390625, -2.68267822265625, -2.43994140625, -2.19720458984375, -1.9544677734375, -1.71173095703125, -1.468994140625, -1.22625732421875, -0.9835205078125, -0.74078369140625, -0.498046875, -0.25531005859375, -0.0125732421875, 0.23016357421875, 0.472900390625, 0.71563720703125, 0.9583740234375, 1.20111083984375, 1.44384765625, 1.68658447265625, 1.9293212890625, 2.17205810546875, 2.414794921875, 2.65753173828125, 2.9002685546875, 3.14300537109375, 3.3857421875, 3.62847900390625, 3.8712158203125, 4.11395263671875, 4.356689453125, 4.59942626953125, 4.8421630859375, 5.08489990234375, 5.32763671875, 5.57037353515625, 5.8131103515625, 6.05584716796875, 6.298583984375, 6.54132080078125, 6.7840576171875, 7.02679443359375, 7.26953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 9.0, 7.0, 8.0, 8.0, 15.0, 13.0, 17.0, 19.0, 17.0, 25.0, 38.0, 31.0, 42.0, 46.0, 71.0, 58.0, 50.0, 58.0, 52.0, 47.0, 55.0, 43.0, 30.0, 33.0, 31.0, 27.0, 27.0, 15.0, 13.0, 18.0, 16.0, 14.0, 10.0, 6.0, 6.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4169921875, -1.37042236328125, -1.3238525390625, -1.27728271484375, -1.230712890625, -1.18414306640625, -1.1375732421875, -1.09100341796875, -1.04443359375, -0.99786376953125, -0.9512939453125, -0.90472412109375, -0.858154296875, -0.81158447265625, -0.7650146484375, -0.71844482421875, -0.671875, -0.62530517578125, -0.5787353515625, -0.53216552734375, -0.485595703125, -0.43902587890625, -0.3924560546875, -0.34588623046875, -0.29931640625, -0.25274658203125, -0.2061767578125, -0.15960693359375, -0.113037109375, -0.06646728515625, -0.0198974609375, 0.02667236328125, 0.0732421875, 0.11981201171875, 0.1663818359375, 0.21295166015625, 0.259521484375, 0.30609130859375, 0.3526611328125, 0.39923095703125, 0.44580078125, 0.49237060546875, 0.5389404296875, 0.58551025390625, 0.632080078125, 0.67864990234375, 0.7252197265625, 0.77178955078125, 0.818359375, 0.86492919921875, 0.9114990234375, 0.95806884765625, 1.004638671875, 1.05120849609375, 1.0977783203125, 1.14434814453125, 1.19091796875, 1.23748779296875, 1.2840576171875, 1.33062744140625, 1.377197265625, 1.42376708984375, 1.4703369140625, 1.51690673828125, 1.5634765625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 12.0, 5.0, 6.0, 14.0, 18.0, 22.0, 26.0, 22.0, 29.0, 34.0, 46.0, 41.0, 53.0, 47.0, 45.0, 44.0, 46.0, 47.0, 47.0, 51.0, 54.0, 42.0, 46.0, 25.0, 28.0, 29.0, 18.0, 20.0, 20.0, 15.0, 9.0, 12.0, 10.0, 5.0, 7.0, 4.0, 2.0, 4.0], "bins": [-92.06939697265625, -89.90866088867188, -87.7479248046875, -85.5871810913086, -83.42644500732422, -81.26570892333984, -79.10497283935547, -76.9442367553711, -74.78349304199219, -72.62275695800781, -70.46202087402344, -68.30127716064453, -66.14054107666016, -63.97980499267578, -61.819068908691406, -59.65833282470703, -57.497596740722656, -55.33686065673828, -53.17612075805664, -51.015384674072266, -48.854644775390625, -46.69390869140625, -44.533172607421875, -42.3724365234375, -40.21169662475586, -38.050960540771484, -35.890220642089844, -33.72948455810547, -31.56874656677246, -29.408008575439453, -27.247272491455078, -25.08653450012207, -22.925800323486328, -20.76506233215332, -18.604324340820312, -16.443588256835938, -14.28285026550293, -12.122112274169922, -9.96137523651123, -7.800638198852539, -5.639900207519531, -3.4791626930236816, -1.318425178527832, 0.8423123359680176, 3.003049850463867, 5.163787841796875, 7.324524879455566, 9.485261917114258, 11.645999908447266, 13.806737899780273, 15.967474937438965, 18.128211975097656, 20.288949966430664, 22.449687957763672, 24.610424041748047, 26.771162033081055, 28.931900024414062, 31.09263801574707, 33.25337600708008, 35.41411209106445, 37.574851989746094, 39.73558807373047, 41.896324157714844, 44.05706024169922, 46.21780014038086]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 12.0, 8.0, 18.0, 7.0, 12.0, 22.0, 16.0, 24.0, 35.0, 20.0, 23.0, 29.0, 36.0, 37.0, 25.0, 31.0, 38.0, 38.0, 39.0, 46.0, 34.0, 45.0, 39.0, 37.0, 28.0, 22.0, 33.0, 40.0, 29.0, 27.0, 22.0, 19.0, 15.0, 14.0, 14.0, 9.0, 3.0, 12.0, 8.0, 11.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-62.82893371582031, -61.046478271484375, -59.2640266418457, -57.481571197509766, -55.69911575317383, -53.916664123535156, -52.13420867919922, -50.35175323486328, -48.569297790527344, -46.786842346191406, -45.004390716552734, -43.2219352722168, -41.43947982788086, -39.65702819824219, -37.87457275390625, -36.09211730957031, -34.30966567993164, -32.5272102355957, -30.7447566986084, -28.962303161621094, -27.179847717285156, -25.39739418029785, -23.614940643310547, -21.83248519897461, -20.050031661987305, -18.267578125, -16.485122680664062, -14.702669143676758, -12.920214653015137, -11.137760162353516, -9.355306625366211, -7.57285213470459, -5.790393829345703, -4.007939338684082, -2.225485324859619, -0.44303131103515625, 1.3394231796264648, 3.121877670288086, 4.904331207275391, 6.686785697937012, 8.469240188598633, 10.251694679260254, 12.034149169921875, 13.81660270690918, 15.5990571975708, 17.381511688232422, 19.163965225219727, 20.94641876220703, 22.72887420654297, 24.511327743530273, 26.29378318786621, 28.076236724853516, 29.858692169189453, 31.641145706176758, 33.42359924316406, 35.2060546875, 36.98851013183594, 38.770965576171875, 40.55341720581055, 42.335872650146484, 44.11832809448242, 45.900779724121094, 47.68323516845703, 49.46569061279297, 51.24814224243164]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 13.0, 22.0, 31.0, 34.0, 80.0, 111.0, 177.0, 265.0, 400.0, 644.0, 1055.0, 1798.0, 2974.0, 5285.0, 9544.0, 16776.0, 29014.0, 48286.0, 75929.0, 107305.0, 135026.0, 147042.0, 139357.0, 114342.0, 82199.0, 53526.0, 32988.0, 19083.0, 10638.0, 6040.0, 3380.0, 2016.0, 1126.0, 741.0, 468.0, 260.0, 184.0, 118.0, 97.0, 62.0, 49.0, 22.0, 13.0, 9.0, 7.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.9375, -68.693359375, -66.44921875, -64.205078125, -61.9609375, -59.716796875, -57.47265625, -55.228515625, -52.984375, -50.740234375, -48.49609375, -46.251953125, -44.0078125, -41.763671875, -39.51953125, -37.275390625, -35.03125, -32.787109375, -30.54296875, -28.298828125, -26.0546875, -23.810546875, -21.56640625, -19.322265625, -17.078125, -14.833984375, -12.58984375, -10.345703125, -8.1015625, -5.857421875, -3.61328125, -1.369140625, 0.875, 3.119140625, 5.36328125, 7.607421875, 9.8515625, 12.095703125, 14.33984375, 16.583984375, 18.828125, 21.072265625, 23.31640625, 25.560546875, 27.8046875, 30.048828125, 32.29296875, 34.537109375, 36.78125, 39.025390625, 41.26953125, 43.513671875, 45.7578125, 48.001953125, 50.24609375, 52.490234375, 54.734375, 56.978515625, 59.22265625, 61.466796875, 63.7109375, 65.955078125, 68.19921875, 70.443359375, 72.6875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 6.0, 11.0, 10.0, 13.0, 12.0, 13.0, 20.0, 20.0, 22.0, 34.0, 22.0, 20.0, 33.0, 39.0, 34.0, 25.0, 36.0, 39.0, 43.0, 37.0, 44.0, 35.0, 47.0, 43.0, 26.0, 31.0, 29.0, 37.0, 36.0, 29.0, 25.0, 18.0, 14.0, 17.0, 15.0, 12.0, 4.0, 10.0, 9.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-63.15625, -61.34814453125, -59.5400390625, -57.73193359375, -55.923828125, -54.11572265625, -52.3076171875, -50.49951171875, -48.69140625, -46.88330078125, -45.0751953125, -43.26708984375, -41.458984375, -39.65087890625, -37.8427734375, -36.03466796875, -34.2265625, -32.41845703125, -30.6103515625, -28.80224609375, -26.994140625, -25.18603515625, -23.3779296875, -21.56982421875, -19.76171875, -17.95361328125, -16.1455078125, -14.33740234375, -12.529296875, -10.72119140625, -8.9130859375, -7.10498046875, -5.296875, -3.48876953125, -1.6806640625, 0.12744140625, 1.935546875, 3.74365234375, 5.5517578125, 7.35986328125, 9.16796875, 10.97607421875, 12.7841796875, 14.59228515625, 16.400390625, 18.20849609375, 20.0166015625, 21.82470703125, 23.6328125, 25.44091796875, 27.2490234375, 29.05712890625, 30.865234375, 32.67333984375, 34.4814453125, 36.28955078125, 38.09765625, 39.90576171875, 41.7138671875, 43.52197265625, 45.330078125, 47.13818359375, 48.9462890625, 50.75439453125, 52.5625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 5.0, 5.0, 24.0, 25.0, 48.0, 56.0, 94.0, 140.0, 191.0, 276.0, 448.0, 636.0, 996.0, 1483.0, 2353.0, 3777.0, 6082.0, 10086.0, 17115.0, 28073.0, 45244.0, 69942.0, 98908.0, 126951.0, 142416.0, 138377.0, 115862.0, 85563.0, 58079.0, 37091.0, 22561.0, 13524.0, 8290.0, 5013.0, 3177.0, 1963.0, 1259.0, 763.0, 566.0, 363.0, 240.0, 158.0, 115.0, 68.0, 58.0, 28.0, 18.0, 12.0, 8.0, 6.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0], "bins": [-79.75, -77.3173828125, -74.884765625, -72.4521484375, -70.01953125, -67.5869140625, -65.154296875, -62.7216796875, -60.2890625, -57.8564453125, -55.423828125, -52.9912109375, -50.55859375, -48.1259765625, -45.693359375, -43.2607421875, -40.828125, -38.3955078125, -35.962890625, -33.5302734375, -31.09765625, -28.6650390625, -26.232421875, -23.7998046875, -21.3671875, -18.9345703125, -16.501953125, -14.0693359375, -11.63671875, -9.2041015625, -6.771484375, -4.3388671875, -1.90625, 0.5263671875, 2.958984375, 5.3916015625, 7.82421875, 10.2568359375, 12.689453125, 15.1220703125, 17.5546875, 19.9873046875, 22.419921875, 24.8525390625, 27.28515625, 29.7177734375, 32.150390625, 34.5830078125, 37.015625, 39.4482421875, 41.880859375, 44.3134765625, 46.74609375, 49.1787109375, 51.611328125, 54.0439453125, 56.4765625, 58.9091796875, 61.341796875, 63.7744140625, 66.20703125, 68.6396484375, 71.072265625, 73.5048828125, 75.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 10.0, 7.0, 14.0, 9.0, 17.0, 14.0, 14.0, 27.0, 32.0, 30.0, 33.0, 37.0, 34.0, 48.0, 46.0, 35.0, 39.0, 51.0, 42.0, 35.0, 46.0, 42.0, 33.0, 33.0, 36.0, 33.0, 21.0, 25.0, 16.0, 21.0, 20.0, 23.0, 10.0, 13.0, 7.0, 13.0, 4.0, 5.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.15625, -34.94482421875, -33.7333984375, -32.52197265625, -31.310546875, -30.09912109375, -28.8876953125, -27.67626953125, -26.46484375, -25.25341796875, -24.0419921875, -22.83056640625, -21.619140625, -20.40771484375, -19.1962890625, -17.98486328125, -16.7734375, -15.56201171875, -14.3505859375, -13.13916015625, -11.927734375, -10.71630859375, -9.5048828125, -8.29345703125, -7.08203125, -5.87060546875, -4.6591796875, -3.44775390625, -2.236328125, -1.02490234375, 0.1865234375, 1.39794921875, 2.609375, 3.82080078125, 5.0322265625, 6.24365234375, 7.455078125, 8.66650390625, 9.8779296875, 11.08935546875, 12.30078125, 13.51220703125, 14.7236328125, 15.93505859375, 17.146484375, 18.35791015625, 19.5693359375, 20.78076171875, 21.9921875, 23.20361328125, 24.4150390625, 25.62646484375, 26.837890625, 28.04931640625, 29.2607421875, 30.47216796875, 31.68359375, 32.89501953125, 34.1064453125, 35.31787109375, 36.529296875, 37.74072265625, 38.9521484375, 40.16357421875, 41.375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 5.0, 6.0, 14.0, 23.0, 24.0, 40.0, 68.0, 90.0, 123.0, 202.0, 323.0, 467.0, 684.0, 1080.0, 1618.0, 2529.0, 3866.0, 6005.0, 9517.0, 14857.0, 23139.0, 35281.0, 52759.0, 74891.0, 99049.0, 119334.0, 128011.0, 121432.0, 104619.0, 80654.0, 57572.0, 39025.0, 25472.0, 16312.0, 10361.0, 6739.0, 4398.0, 2716.0, 1773.0, 1172.0, 785.0, 504.0, 354.0, 219.0, 171.0, 86.0, 70.0, 42.0, 23.0, 27.0, 12.0, 10.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0625, -13.587646484375, -13.11279296875, -12.637939453125, -12.1630859375, -11.688232421875, -11.21337890625, -10.738525390625, -10.263671875, -9.788818359375, -9.31396484375, -8.839111328125, -8.3642578125, -7.889404296875, -7.41455078125, -6.939697265625, -6.46484375, -5.989990234375, -5.51513671875, -5.040283203125, -4.5654296875, -4.090576171875, -3.61572265625, -3.140869140625, -2.666015625, -2.191162109375, -1.71630859375, -1.241455078125, -0.7666015625, -0.291748046875, 0.18310546875, 0.657958984375, 1.1328125, 1.607666015625, 2.08251953125, 2.557373046875, 3.0322265625, 3.507080078125, 3.98193359375, 4.456787109375, 4.931640625, 5.406494140625, 5.88134765625, 6.356201171875, 6.8310546875, 7.305908203125, 7.78076171875, 8.255615234375, 8.73046875, 9.205322265625, 9.68017578125, 10.155029296875, 10.6298828125, 11.104736328125, 11.57958984375, 12.054443359375, 12.529296875, 13.004150390625, 13.47900390625, 13.953857421875, 14.4287109375, 14.903564453125, 15.37841796875, 15.853271484375, 16.328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 3.0, 13.0, 8.0, 14.0, 17.0, 23.0, 30.0, 35.0, 42.0, 53.0, 64.0, 63.0, 71.0, 73.0, 69.0, 69.0, 72.0, 53.0, 49.0, 44.0, 31.0, 23.0, 19.0, 11.0, 19.0, 8.0, 7.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028591156005859375, -0.0027809441089630127, -0.002702772617340088, -0.002624601125717163, -0.0025464296340942383, -0.0024682581424713135, -0.0023900866508483887, -0.002311915159225464, -0.002233743667602539, -0.0021555721759796143, -0.0020774006843566895, -0.0019992291927337646, -0.0019210577011108398, -0.001842886209487915, -0.0017647147178649902, -0.0016865432262420654, -0.0016083717346191406, -0.0015302002429962158, -0.001452028751373291, -0.0013738572597503662, -0.0012956857681274414, -0.0012175142765045166, -0.0011393427848815918, -0.001061171293258667, -0.0009829998016357422, -0.0009048283100128174, -0.0008266568183898926, -0.0007484853267669678, -0.000670313835144043, -0.0005921423435211182, -0.0005139708518981934, -0.00043579936027526855, -0.00035762786865234375, -0.00027945637702941895, -0.00020128488540649414, -0.00012311339378356934, -4.494190216064453e-05, 3.3229589462280273e-05, 0.00011140108108520508, 0.00018957257270812988, 0.0002677440643310547, 0.0003459155559539795, 0.0004240870475769043, 0.0005022585391998291, 0.0005804300308227539, 0.0006586015224456787, 0.0007367730140686035, 0.0008149445056915283, 0.0008931159973144531, 0.0009712874889373779, 0.0010494589805603027, 0.0011276304721832275, 0.0012058019638061523, 0.0012839734554290771, 0.001362144947052002, 0.0014403164386749268, 0.0015184879302978516, 0.0015966594219207764, 0.0016748309135437012, 0.001753002405166626, 0.0018311738967895508, 0.0019093453884124756, 0.0019875168800354004, 0.002065688371658325, 0.00214385986328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 8.0, 9.0, 11.0, 32.0, 32.0, 61.0, 74.0, 99.0, 155.0, 256.0, 351.0, 579.0, 893.0, 1343.0, 2156.0, 3288.0, 5144.0, 8244.0, 12763.0, 19728.0, 29843.0, 44074.0, 61781.0, 82483.0, 102674.0, 116517.0, 119695.0, 110736.0, 93304.0, 73067.0, 53043.0, 36491.0, 24690.0, 16037.0, 10327.0, 6573.0, 4262.0, 2800.0, 1752.0, 1113.0, 721.0, 430.0, 313.0, 214.0, 122.0, 82.0, 65.0, 33.0, 32.0, 26.0, 15.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.828125, -13.3712158203125, -12.914306640625, -12.4573974609375, -12.00048828125, -11.5435791015625, -11.086669921875, -10.6297607421875, -10.1728515625, -9.7159423828125, -9.259033203125, -8.8021240234375, -8.34521484375, -7.8883056640625, -7.431396484375, -6.9744873046875, -6.517578125, -6.0606689453125, -5.603759765625, -5.1468505859375, -4.68994140625, -4.2330322265625, -3.776123046875, -3.3192138671875, -2.8623046875, -2.4053955078125, -1.948486328125, -1.4915771484375, -1.03466796875, -0.5777587890625, -0.120849609375, 0.3360595703125, 0.79296875, 1.2498779296875, 1.706787109375, 2.1636962890625, 2.62060546875, 3.0775146484375, 3.534423828125, 3.9913330078125, 4.4482421875, 4.9051513671875, 5.362060546875, 5.8189697265625, 6.27587890625, 6.7327880859375, 7.189697265625, 7.6466064453125, 8.103515625, 8.5604248046875, 9.017333984375, 9.4742431640625, 9.93115234375, 10.3880615234375, 10.844970703125, 11.3018798828125, 11.7587890625, 12.2156982421875, 12.672607421875, 13.1295166015625, 13.58642578125, 14.0433349609375, 14.500244140625, 14.9571533203125, 15.4140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 0.0, 3.0, 11.0, 11.0, 7.0, 7.0, 15.0, 10.0, 16.0, 27.0, 16.0, 33.0, 33.0, 44.0, 45.0, 28.0, 49.0, 54.0, 56.0, 41.0, 48.0, 55.0, 50.0, 45.0, 44.0, 41.0, 39.0, 30.0, 17.0, 26.0, 22.0, 14.0, 9.0, 11.0, 13.0, 8.0, 10.0, 1.0, 5.0, 2.0, 0.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.34375, -8.1080322265625, -7.872314453125, -7.6365966796875, -7.40087890625, -7.1651611328125, -6.929443359375, -6.6937255859375, -6.4580078125, -6.2222900390625, -5.986572265625, -5.7508544921875, -5.51513671875, -5.2794189453125, -5.043701171875, -4.8079833984375, -4.572265625, -4.3365478515625, -4.100830078125, -3.8651123046875, -3.62939453125, -3.3936767578125, -3.157958984375, -2.9222412109375, -2.6865234375, -2.4508056640625, -2.215087890625, -1.9793701171875, -1.74365234375, -1.5079345703125, -1.272216796875, -1.0364990234375, -0.80078125, -0.5650634765625, -0.329345703125, -0.0936279296875, 0.14208984375, 0.3778076171875, 0.613525390625, 0.8492431640625, 1.0849609375, 1.3206787109375, 1.556396484375, 1.7921142578125, 2.02783203125, 2.2635498046875, 2.499267578125, 2.7349853515625, 2.970703125, 3.2064208984375, 3.442138671875, 3.6778564453125, 3.91357421875, 4.1492919921875, 4.385009765625, 4.6207275390625, 4.8564453125, 5.0921630859375, 5.327880859375, 5.5635986328125, 5.79931640625, 6.0350341796875, 6.270751953125, 6.5064697265625, 6.7421875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 7.0, 7.0, 6.0, 10.0, 12.0, 13.0, 15.0, 14.0, 19.0, 25.0, 26.0, 29.0, 27.0, 35.0, 35.0, 34.0, 45.0, 44.0, 59.0, 38.0, 37.0, 48.0, 39.0, 39.0, 41.0, 33.0, 28.0, 37.0, 34.0, 27.0, 15.0, 20.0, 19.0, 13.0, 15.0, 12.0, 14.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.18128967285156, -63.26628494262695, -61.351280212402344, -59.436275482177734, -57.521270751953125, -55.606266021728516, -53.691261291503906, -51.7762565612793, -49.86125183105469, -47.94624710083008, -46.03124237060547, -44.11623764038086, -42.20123291015625, -40.28622817993164, -38.37122344970703, -36.45621871948242, -34.54121398925781, -32.6262092590332, -30.711204528808594, -28.796199798583984, -26.881195068359375, -24.966190338134766, -23.051185607910156, -21.136180877685547, -19.221176147460938, -17.306171417236328, -15.391166687011719, -13.47616195678711, -11.5611572265625, -9.64615249633789, -7.731147766113281, -5.816143035888672, -3.9011383056640625, -1.9861335754394531, -0.07112884521484375, 1.8438758850097656, 3.758880615234375, 5.673885345458984, 7.588890075683594, 9.503894805908203, 11.418899536132812, 13.333904266357422, 15.248908996582031, 17.16391372680664, 19.07891845703125, 20.99392318725586, 22.90892791748047, 24.823932647705078, 26.738937377929688, 28.653942108154297, 30.568946838378906, 32.483951568603516, 34.398956298828125, 36.313961029052734, 38.228965759277344, 40.14397048950195, 42.05897521972656, 43.97397994995117, 45.88898468017578, 47.80398941040039, 49.718994140625, 51.63399887084961, 53.54900360107422, 55.46400833129883, 57.37901306152344]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 8.0, 5.0, 13.0, 13.0, 14.0, 14.0, 15.0, 18.0, 18.0, 24.0, 24.0, 15.0, 28.0, 25.0, 27.0, 43.0, 40.0, 26.0, 43.0, 38.0, 35.0, 33.0, 44.0, 37.0, 33.0, 30.0, 36.0, 37.0, 27.0, 28.0, 33.0, 20.0, 28.0, 18.0, 16.0, 14.0, 13.0, 11.0, 8.0, 10.0, 7.0, 11.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.16705322265625, -54.35741424560547, -52.54777908325195, -50.73814010620117, -48.92850112915039, -47.118865966796875, -45.309226989746094, -43.49958801269531, -41.68994903564453, -39.88031005859375, -38.070674896240234, -36.26103591918945, -34.45139694213867, -32.641761779785156, -30.832122802734375, -29.022483825683594, -27.212848663330078, -25.40321159362793, -23.59357261657715, -21.783935546875, -19.97429656982422, -18.16465950012207, -16.355022430419922, -14.545384407043457, -12.735746383666992, -10.926108360290527, -9.116470336914062, -7.306833267211914, -5.497195243835449, -3.6875572204589844, -1.877920150756836, -0.0682821273803711, 1.7413597106933594, 3.550997495651245, 5.360635280609131, 7.1702728271484375, 8.979910850524902, 10.789548873901367, 12.599185943603516, 14.40882396697998, 16.218461990356445, 18.028099060058594, 19.837738037109375, 21.647375106811523, 23.457012176513672, 25.266651153564453, 27.0762882232666, 28.88592529296875, 30.69556427001953, 32.50520324707031, 34.31483840942383, 36.12447738647461, 37.93411636352539, 39.743751525878906, 41.55339050292969, 43.36302947998047, 45.17266845703125, 46.98230743408203, 48.79194259643555, 50.60158157348633, 52.41122055053711, 54.220855712890625, 56.030494689941406, 57.84013366699219, 59.6497688293457]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 5.0, 5.0, 8.0, 17.0, 24.0, 38.0, 61.0, 70.0, 136.0, 198.0, 348.0, 498.0, 784.0, 1193.0, 1968.0, 3114.0, 4883.0, 7999.0, 12563.0, 19346.0, 30379.0, 47212.0, 73457.0, 111603.0, 166203.0, 239627.0, 329306.0, 422832.0, 494039.0, 510119.0, 465316.0, 379643.0, 282874.0, 200389.0, 135679.0, 89448.0, 58529.0, 37780.0, 23956.0, 15367.0, 9803.0, 6309.0, 3970.0, 2620.0, 1659.0, 1086.0, 631.0, 419.0, 276.0, 182.0, 121.0, 71.0, 35.0, 31.0, 21.0, 19.0, 12.0, 6.0, 5.0, 4.0, 1.0], "bins": [-56.96875, -55.2021484375, -53.435546875, -51.6689453125, -49.90234375, -48.1357421875, -46.369140625, -44.6025390625, -42.8359375, -41.0693359375, -39.302734375, -37.5361328125, -35.76953125, -34.0029296875, -32.236328125, -30.4697265625, -28.703125, -26.9365234375, -25.169921875, -23.4033203125, -21.63671875, -19.8701171875, -18.103515625, -16.3369140625, -14.5703125, -12.8037109375, -11.037109375, -9.2705078125, -7.50390625, -5.7373046875, -3.970703125, -2.2041015625, -0.4375, 1.3291015625, 3.095703125, 4.8623046875, 6.62890625, 8.3955078125, 10.162109375, 11.9287109375, 13.6953125, 15.4619140625, 17.228515625, 18.9951171875, 20.76171875, 22.5283203125, 24.294921875, 26.0615234375, 27.828125, 29.5947265625, 31.361328125, 33.1279296875, 34.89453125, 36.6611328125, 38.427734375, 40.1943359375, 41.9609375, 43.7275390625, 45.494140625, 47.2607421875, 49.02734375, 50.7939453125, 52.560546875, 54.3271484375, 56.09375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 6.0, 4.0, 10.0, 7.0, 10.0, 12.0, 15.0, 15.0, 17.0, 16.0, 13.0, 31.0, 17.0, 26.0, 23.0, 20.0, 30.0, 40.0, 40.0, 28.0, 38.0, 44.0, 25.0, 36.0, 43.0, 35.0, 35.0, 30.0, 37.0, 35.0, 27.0, 27.0, 29.0, 27.0, 25.0, 21.0, 18.0, 12.0, 12.0, 12.0, 7.0, 10.0, 11.0, 10.0, 6.0, 6.0, 3.0, 6.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-49.03125, -47.46875, -45.90625, -44.34375, -42.78125, -41.21875, -39.65625, -38.09375, -36.53125, -34.96875, -33.40625, -31.84375, -30.28125, -28.71875, -27.15625, -25.59375, -24.03125, -22.46875, -20.90625, -19.34375, -17.78125, -16.21875, -14.65625, -13.09375, -11.53125, -9.96875, -8.40625, -6.84375, -5.28125, -3.71875, -2.15625, -0.59375, 0.96875, 2.53125, 4.09375, 5.65625, 7.21875, 8.78125, 10.34375, 11.90625, 13.46875, 15.03125, 16.59375, 18.15625, 19.71875, 21.28125, 22.84375, 24.40625, 25.96875, 27.53125, 29.09375, 30.65625, 32.21875, 33.78125, 35.34375, 36.90625, 38.46875, 40.03125, 41.59375, 43.15625, 44.71875, 46.28125, 47.84375, 49.40625, 50.96875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 10.0, 9.0, 14.0, 21.0, 30.0, 42.0, 69.0, 120.0, 155.0, 246.0, 378.0, 726.0, 1250.0, 2134.0, 3834.0, 6950.0, 12806.0, 23908.0, 43825.0, 80598.0, 143223.0, 241744.0, 380137.0, 535252.0, 646465.0, 640993.0, 524491.0, 367146.0, 231874.0, 136760.0, 76565.0, 42223.0, 22903.0, 12034.0, 6843.0, 3637.0, 2009.0, 1158.0, 621.0, 378.0, 268.0, 152.0, 87.0, 56.0, 44.0, 31.0, 22.0, 17.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0], "bins": [-74.125, -71.8056640625, -69.486328125, -67.1669921875, -64.84765625, -62.5283203125, -60.208984375, -57.8896484375, -55.5703125, -53.2509765625, -50.931640625, -48.6123046875, -46.29296875, -43.9736328125, -41.654296875, -39.3349609375, -37.015625, -34.6962890625, -32.376953125, -30.0576171875, -27.73828125, -25.4189453125, -23.099609375, -20.7802734375, -18.4609375, -16.1416015625, -13.822265625, -11.5029296875, -9.18359375, -6.8642578125, -4.544921875, -2.2255859375, 0.09375, 2.4130859375, 4.732421875, 7.0517578125, 9.37109375, 11.6904296875, 14.009765625, 16.3291015625, 18.6484375, 20.9677734375, 23.287109375, 25.6064453125, 27.92578125, 30.2451171875, 32.564453125, 34.8837890625, 37.203125, 39.5224609375, 41.841796875, 44.1611328125, 46.48046875, 48.7998046875, 51.119140625, 53.4384765625, 55.7578125, 58.0771484375, 60.396484375, 62.7158203125, 65.03515625, 67.3544921875, 69.673828125, 71.9931640625, 74.3125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 9.0, 8.0, 17.0, 13.0, 32.0, 34.0, 30.0, 48.0, 48.0, 69.0, 83.0, 83.0, 102.0, 106.0, 141.0, 160.0, 180.0, 184.0, 201.0, 223.0, 196.0, 224.0, 235.0, 209.0, 191.0, 180.0, 146.0, 154.0, 130.0, 107.0, 84.0, 81.0, 72.0, 68.0, 51.0, 42.0, 32.0, 23.0, 21.0, 18.0, 9.0, 3.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.265625, -26.41650390625, -25.5673828125, -24.71826171875, -23.869140625, -23.02001953125, -22.1708984375, -21.32177734375, -20.47265625, -19.62353515625, -18.7744140625, -17.92529296875, -17.076171875, -16.22705078125, -15.3779296875, -14.52880859375, -13.6796875, -12.83056640625, -11.9814453125, -11.13232421875, -10.283203125, -9.43408203125, -8.5849609375, -7.73583984375, -6.88671875, -6.03759765625, -5.1884765625, -4.33935546875, -3.490234375, -2.64111328125, -1.7919921875, -0.94287109375, -0.09375, 0.75537109375, 1.6044921875, 2.45361328125, 3.302734375, 4.15185546875, 5.0009765625, 5.85009765625, 6.69921875, 7.54833984375, 8.3974609375, 9.24658203125, 10.095703125, 10.94482421875, 11.7939453125, 12.64306640625, 13.4921875, 14.34130859375, 15.1904296875, 16.03955078125, 16.888671875, 17.73779296875, 18.5869140625, 19.43603515625, 20.28515625, 21.13427734375, 21.9833984375, 22.83251953125, 23.681640625, 24.53076171875, 25.3798828125, 26.22900390625, 27.078125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 5.0, 5.0, 6.0, 8.0, 9.0, 14.0, 13.0, 22.0, 18.0, 23.0, 32.0, 27.0, 35.0, 30.0, 42.0, 47.0, 44.0, 38.0, 49.0, 43.0, 48.0, 37.0, 33.0, 32.0, 46.0, 43.0, 30.0, 44.0, 34.0, 18.0, 20.0, 18.0, 13.0, 17.0, 9.0, 9.0, 5.0, 12.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-66.95327758789062, -64.97203826904297, -62.99079132080078, -61.00954818725586, -59.02830505371094, -57.04706573486328, -55.06582260131836, -53.08457946777344, -51.103336334228516, -49.122093200683594, -47.14085006713867, -45.15960693359375, -43.178367614746094, -41.197120666503906, -39.21588134765625, -37.23463821411133, -35.253395080566406, -33.272151947021484, -31.290908813476562, -29.309667587280273, -27.32842445373535, -25.34718132019043, -23.36594009399414, -21.38469696044922, -19.403453826904297, -17.422210693359375, -15.44096851348877, -13.459726333618164, -11.478483200073242, -9.49724006652832, -7.515997886657715, -5.534755706787109, -3.5535125732421875, -1.5722699165344238, 0.40897274017333984, 2.3902153968811035, 4.371458053588867, 6.352701187133789, 8.333943367004395, 10.315185546875, 12.296428680419922, 14.277671813964844, 16.258914947509766, 18.240156173706055, 20.221399307250977, 22.2026424407959, 24.183883666992188, 26.16512680053711, 28.14636993408203, 30.127613067626953, 32.108856201171875, 34.0900993347168, 36.07134246826172, 38.052581787109375, 40.0338249206543, 42.01506805419922, 43.99631118774414, 45.97755432128906, 47.958797454833984, 49.940040588378906, 51.92127990722656, 53.90252685546875, 55.883766174316406, 57.86500930786133, 59.84625244140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 4.0, 7.0, 6.0, 10.0, 14.0, 12.0, 13.0, 15.0, 17.0, 11.0, 22.0, 29.0, 30.0, 28.0, 35.0, 36.0, 34.0, 43.0, 29.0, 42.0, 45.0, 40.0, 49.0, 46.0, 30.0, 37.0, 36.0, 25.0, 38.0, 31.0, 31.0, 19.0, 22.0, 22.0, 14.0, 17.0, 12.0, 6.0, 9.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.89384078979492, -53.91671371459961, -51.9395866394043, -49.96245574951172, -47.985328674316406, -46.008201599121094, -44.03107452392578, -42.05394744873047, -40.076820373535156, -38.099693298339844, -36.12256622314453, -34.14543914794922, -32.16830825805664, -30.191181182861328, -28.214054107666016, -26.236927032470703, -24.259796142578125, -22.282669067382812, -20.305540084838867, -18.328413009643555, -16.35128402709961, -14.374156951904297, -12.397029876708984, -10.419901847839355, -8.442773818969727, -6.465645790100098, -4.488518238067627, -2.5113906860351562, -0.5342626571655273, 1.4428653717041016, 3.419992446899414, 5.397120475769043, 7.3742523193359375, 9.351380348205566, 11.328508377075195, 13.305635452270508, 15.282763481140137, 17.259891510009766, 19.237018585205078, 21.21414566040039, 23.191274642944336, 25.16840171813965, 27.145530700683594, 29.122657775878906, 31.09978485107422, 33.07691192626953, 35.054039001464844, 37.03116989135742, 39.008296966552734, 40.98542404174805, 42.96255111694336, 44.93968200683594, 46.91680908203125, 48.89393615722656, 50.871063232421875, 52.84819030761719, 54.8253173828125, 56.80244445800781, 58.779571533203125, 60.75669860839844, 62.733829498291016, 64.71095275878906, 66.68807983398438, 68.66521453857422, 70.64234161376953]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 4.0, 2.0, 20.0, 28.0, 31.0, 60.0, 80.0, 117.0, 189.0, 346.0, 494.0, 725.0, 1171.0, 1862.0, 2890.0, 4407.0, 7115.0, 11148.0, 17391.0, 26691.0, 39669.0, 57090.0, 77675.0, 99170.0, 115209.0, 121406.0, 115026.0, 99080.0, 78407.0, 57105.0, 39580.0, 26534.0, 17482.0, 11035.0, 7010.0, 4471.0, 2827.0, 1746.0, 1219.0, 720.0, 460.0, 304.0, 196.0, 116.0, 85.0, 50.0, 41.0, 22.0, 15.0, 8.0, 14.0, 10.0, 8.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.71875, -26.74609375, -25.7734375, -24.80078125, -23.828125, -22.85546875, -21.8828125, -20.91015625, -19.9375, -18.96484375, -17.9921875, -17.01953125, -16.046875, -15.07421875, -14.1015625, -13.12890625, -12.15625, -11.18359375, -10.2109375, -9.23828125, -8.265625, -7.29296875, -6.3203125, -5.34765625, -4.375, -3.40234375, -2.4296875, -1.45703125, -0.484375, 0.48828125, 1.4609375, 2.43359375, 3.40625, 4.37890625, 5.3515625, 6.32421875, 7.296875, 8.26953125, 9.2421875, 10.21484375, 11.1875, 12.16015625, 13.1328125, 14.10546875, 15.078125, 16.05078125, 17.0234375, 17.99609375, 18.96875, 19.94140625, 20.9140625, 21.88671875, 22.859375, 23.83203125, 24.8046875, 25.77734375, 26.75, 27.72265625, 28.6953125, 29.66796875, 30.640625, 31.61328125, 32.5859375, 33.55859375, 34.53125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 8.0, 3.0, 12.0, 13.0, 13.0, 9.0, 17.0, 13.0, 20.0, 19.0, 21.0, 30.0, 34.0, 29.0, 34.0, 42.0, 39.0, 29.0, 40.0, 49.0, 32.0, 44.0, 41.0, 47.0, 36.0, 29.0, 35.0, 32.0, 33.0, 29.0, 24.0, 24.0, 17.0, 18.0, 13.0, 15.0, 10.0, 6.0, 7.0, 13.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.03125, -53.98583984375, -51.9404296875, -49.89501953125, -47.849609375, -45.80419921875, -43.7587890625, -41.71337890625, -39.66796875, -37.62255859375, -35.5771484375, -33.53173828125, -31.486328125, -29.44091796875, -27.3955078125, -25.35009765625, -23.3046875, -21.25927734375, -19.2138671875, -17.16845703125, -15.123046875, -13.07763671875, -11.0322265625, -8.98681640625, -6.94140625, -4.89599609375, -2.8505859375, -0.80517578125, 1.240234375, 3.28564453125, 5.3310546875, 7.37646484375, 9.421875, 11.46728515625, 13.5126953125, 15.55810546875, 17.603515625, 19.64892578125, 21.6943359375, 23.73974609375, 25.78515625, 27.83056640625, 29.8759765625, 31.92138671875, 33.966796875, 36.01220703125, 38.0576171875, 40.10302734375, 42.1484375, 44.19384765625, 46.2392578125, 48.28466796875, 50.330078125, 52.37548828125, 54.4208984375, 56.46630859375, 58.51171875, 60.55712890625, 62.6025390625, 64.64794921875, 66.693359375, 68.73876953125, 70.7841796875, 72.82958984375, 74.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 9.0, 4.0, 3.0, 17.0, 16.0, 27.0, 42.0, 41.0, 55.0, 82.0, 117.0, 139.0, 230.0, 351.0, 422.0, 685.0, 1009.0, 1491.0, 2145.0, 3177.0, 4888.0, 7677.0, 11506.0, 17810.0, 29831.0, 287047.0, 587386.0, 34705.0, 19876.0, 12723.0, 8289.0, 5356.0, 3622.0, 2416.0, 1625.0, 1155.0, 782.0, 561.0, 351.0, 248.0, 172.0, 139.0, 100.0, 67.0, 63.0, 31.0, 28.0, 12.0, 9.0, 8.0, 4.0, 6.0, 4.0, 0.0, 2.0, 3.0], "bins": [-66.5, -64.55029296875, -62.6005859375, -60.65087890625, -58.701171875, -56.75146484375, -54.8017578125, -52.85205078125, -50.90234375, -48.95263671875, -47.0029296875, -45.05322265625, -43.103515625, -41.15380859375, -39.2041015625, -37.25439453125, -35.3046875, -33.35498046875, -31.4052734375, -29.45556640625, -27.505859375, -25.55615234375, -23.6064453125, -21.65673828125, -19.70703125, -17.75732421875, -15.8076171875, -13.85791015625, -11.908203125, -9.95849609375, -8.0087890625, -6.05908203125, -4.109375, -2.15966796875, -0.2099609375, 1.73974609375, 3.689453125, 5.63916015625, 7.5888671875, 9.53857421875, 11.48828125, 13.43798828125, 15.3876953125, 17.33740234375, 19.287109375, 21.23681640625, 23.1865234375, 25.13623046875, 27.0859375, 29.03564453125, 30.9853515625, 32.93505859375, 34.884765625, 36.83447265625, 38.7841796875, 40.73388671875, 42.68359375, 44.63330078125, 46.5830078125, 48.53271484375, 50.482421875, 52.43212890625, 54.3818359375, 56.33154296875, 58.28125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 8.0, 8.0, 6.0, 16.0, 12.0, 12.0, 8.0, 34.0, 29.0, 28.0, 30.0, 35.0, 32.0, 34.0, 45.0, 32.0, 46.0, 48.0, 34.0, 42.0, 43.0, 44.0, 43.0, 44.0, 46.0, 38.0, 33.0, 24.0, 16.0, 20.0, 14.0, 8.0, 15.0, 13.0, 10.0, 13.0, 6.0, 7.0, 9.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.6875, -51.0751953125, -49.462890625, -47.8505859375, -46.23828125, -44.6259765625, -43.013671875, -41.4013671875, -39.7890625, -38.1767578125, -36.564453125, -34.9521484375, -33.33984375, -31.7275390625, -30.115234375, -28.5029296875, -26.890625, -25.2783203125, -23.666015625, -22.0537109375, -20.44140625, -18.8291015625, -17.216796875, -15.6044921875, -13.9921875, -12.3798828125, -10.767578125, -9.1552734375, -7.54296875, -5.9306640625, -4.318359375, -2.7060546875, -1.09375, 0.5185546875, 2.130859375, 3.7431640625, 5.35546875, 6.9677734375, 8.580078125, 10.1923828125, 11.8046875, 13.4169921875, 15.029296875, 16.6416015625, 18.25390625, 19.8662109375, 21.478515625, 23.0908203125, 24.703125, 26.3154296875, 27.927734375, 29.5400390625, 31.15234375, 32.7646484375, 34.376953125, 35.9892578125, 37.6015625, 39.2138671875, 40.826171875, 42.4384765625, 44.05078125, 45.6630859375, 47.275390625, 48.8876953125, 50.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 10.0, 4.0, 6.0, 21.0, 22.0, 29.0, 41.0, 59.0, 82.0, 132.0, 185.0, 287.0, 467.0, 708.0, 1050.0, 1867.0, 3127.0, 5640.0, 10474.0, 20405.0, 51378.0, 804085.0, 94663.0, 24992.0, 12572.0, 6808.0, 3780.0, 2033.0, 1248.0, 847.0, 497.0, 328.0, 217.0, 132.0, 95.0, 82.0, 54.0, 29.0, 29.0, 18.0, 9.0, 10.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.08984375, -5.877197265625, -5.66455078125, -5.451904296875, -5.2392578125, -5.026611328125, -4.81396484375, -4.601318359375, -4.388671875, -4.176025390625, -3.96337890625, -3.750732421875, -3.5380859375, -3.325439453125, -3.11279296875, -2.900146484375, -2.6875, -2.474853515625, -2.26220703125, -2.049560546875, -1.8369140625, -1.624267578125, -1.41162109375, -1.198974609375, -0.986328125, -0.773681640625, -0.56103515625, -0.348388671875, -0.1357421875, 0.076904296875, 0.28955078125, 0.502197265625, 0.71484375, 0.927490234375, 1.14013671875, 1.352783203125, 1.5654296875, 1.778076171875, 1.99072265625, 2.203369140625, 2.416015625, 2.628662109375, 2.84130859375, 3.053955078125, 3.2666015625, 3.479248046875, 3.69189453125, 3.904541015625, 4.1171875, 4.329833984375, 4.54248046875, 4.755126953125, 4.9677734375, 5.180419921875, 5.39306640625, 5.605712890625, 5.818359375, 6.031005859375, 6.24365234375, 6.456298828125, 6.6689453125, 6.881591796875, 7.09423828125, 7.306884765625, 7.51953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 4.0, 12.0, 8.0, 10.0, 16.0, 4.0, 16.0, 22.0, 22.0, 31.0, 31.0, 33.0, 41.0, 55.0, 66.0, 53.0, 54.0, 52.0, 55.0, 61.0, 54.0, 43.0, 34.0, 42.0, 28.0, 30.0, 25.0, 19.0, 15.0, 4.0, 12.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0009131431579589844, -0.0008829161524772644, -0.0008526891469955444, -0.0008224621415138245, -0.0007922351360321045, -0.0007620081305503845, -0.0007317811250686646, -0.0007015541195869446, -0.0006713271141052246, -0.0006411001086235046, -0.0006108731031417847, -0.0005806460976600647, -0.0005504190921783447, -0.0005201920866966248, -0.0004899650812149048, -0.0004597380757331848, -0.00042951107025146484, -0.0003992840647697449, -0.0003690570592880249, -0.00033883005380630493, -0.00030860304832458496, -0.000278376042842865, -0.000248149037361145, -0.00021792203187942505, -0.00018769502639770508, -0.0001574680209159851, -0.00012724101543426514, -9.701400995254517e-05, -6.67870044708252e-05, -3.6559998989105225e-05, -6.332993507385254e-06, 2.3894011974334717e-05, 5.412101745605469e-05, 8.434802293777466e-05, 0.00011457502841949463, 0.0001448020339012146, 0.00017502903938293457, 0.00020525604486465454, 0.0002354830503463745, 0.0002657100558280945, 0.00029593706130981445, 0.0003261640667915344, 0.0003563910722732544, 0.00038661807775497437, 0.00041684508323669434, 0.0004470720887184143, 0.0004772990942001343, 0.0005075260996818542, 0.0005377531051635742, 0.0005679801106452942, 0.0005982071161270142, 0.0006284341216087341, 0.0006586611270904541, 0.0006888881325721741, 0.000719115138053894, 0.000749342143535614, 0.000779569149017334, 0.000809796154499054, 0.0008400231599807739, 0.0008702501654624939, 0.0009004771709442139, 0.0009307041764259338, 0.0009609311819076538, 0.0009911581873893738, 0.0010213851928710938]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 9.0, 9.0, 20.0, 24.0, 36.0, 40.0, 66.0, 108.0, 154.0, 211.0, 303.0, 480.0, 743.0, 1007.0, 1552.0, 2364.0, 3465.0, 5076.0, 7742.0, 11775.0, 17454.0, 26043.0, 37878.0, 52949.0, 71034.0, 90389.0, 105971.0, 114173.0, 111468.0, 99676.0, 81631.0, 62521.0, 45205.0, 31775.0, 21804.0, 14410.0, 9751.0, 6430.0, 4269.0, 2806.0, 1830.0, 1235.0, 880.0, 577.0, 396.0, 265.0, 198.0, 111.0, 96.0, 61.0, 41.0, 27.0, 10.0, 6.0, 9.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.09375, -2.023406982421875, -1.95306396484375, -1.882720947265625, -1.8123779296875, -1.742034912109375, -1.67169189453125, -1.601348876953125, -1.531005859375, -1.460662841796875, -1.39031982421875, -1.319976806640625, -1.2496337890625, -1.179290771484375, -1.10894775390625, -1.038604736328125, -0.96826171875, -0.897918701171875, -0.82757568359375, -0.757232666015625, -0.6868896484375, -0.616546630859375, -0.54620361328125, -0.475860595703125, -0.405517578125, -0.335174560546875, -0.26483154296875, -0.194488525390625, -0.1241455078125, -0.053802490234375, 0.01654052734375, 0.086883544921875, 0.1572265625, 0.227569580078125, 0.29791259765625, 0.368255615234375, 0.4385986328125, 0.508941650390625, 0.57928466796875, 0.649627685546875, 0.719970703125, 0.790313720703125, 0.86065673828125, 0.930999755859375, 1.0013427734375, 1.071685791015625, 1.14202880859375, 1.212371826171875, 1.28271484375, 1.353057861328125, 1.42340087890625, 1.493743896484375, 1.5640869140625, 1.634429931640625, 1.70477294921875, 1.775115966796875, 1.845458984375, 1.915802001953125, 1.98614501953125, 2.056488037109375, 2.1268310546875, 2.197174072265625, 2.26751708984375, 2.337860107421875, 2.408203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 3.0, 5.0, 3.0, 11.0, 12.0, 22.0, 21.0, 11.0, 35.0, 39.0, 44.0, 36.0, 43.0, 52.0, 48.0, 56.0, 66.0, 47.0, 52.0, 62.0, 43.0, 39.0, 44.0, 34.0, 35.0, 21.0, 27.0, 16.0, 11.0, 14.0, 6.0, 9.0, 6.0, 5.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.353515625, -1.3142852783203125, -1.275054931640625, -1.2358245849609375, -1.19659423828125, -1.1573638916015625, -1.118133544921875, -1.0789031982421875, -1.0396728515625, -1.0004425048828125, -0.961212158203125, -0.9219818115234375, -0.88275146484375, -0.8435211181640625, -0.804290771484375, -0.7650604248046875, -0.725830078125, -0.6865997314453125, -0.647369384765625, -0.6081390380859375, -0.56890869140625, -0.5296783447265625, -0.490447998046875, -0.4512176513671875, -0.4119873046875, -0.3727569580078125, -0.333526611328125, -0.2942962646484375, -0.25506591796875, -0.2158355712890625, -0.176605224609375, -0.1373748779296875, -0.09814453125, -0.0589141845703125, -0.019683837890625, 0.0195465087890625, 0.05877685546875, 0.0980072021484375, 0.137237548828125, 0.1764678955078125, 0.2156982421875, 0.2549285888671875, 0.294158935546875, 0.3333892822265625, 0.37261962890625, 0.4118499755859375, 0.451080322265625, 0.4903106689453125, 0.529541015625, 0.5687713623046875, 0.608001708984375, 0.6472320556640625, 0.68646240234375, 0.7256927490234375, 0.764923095703125, 0.8041534423828125, 0.8433837890625, 0.8826141357421875, 0.921844482421875, 0.9610748291015625, 1.00030517578125, 1.0395355224609375, 1.078765869140625, 1.1179962158203125, 1.1572265625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 10.0, 11.0, 11.0, 12.0, 17.0, 18.0, 24.0, 35.0, 32.0, 32.0, 41.0, 44.0, 48.0, 48.0, 51.0, 44.0, 46.0, 50.0, 33.0, 36.0, 38.0, 42.0, 38.0, 39.0, 31.0, 23.0, 22.0, 26.0, 11.0, 10.0, 11.0, 10.0, 10.0, 8.0, 5.0, 4.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-75.80357360839844, -73.64806365966797, -71.4925537109375, -69.33704376220703, -67.18153381347656, -65.0260238647461, -62.87051773071289, -60.71500778198242, -58.55949783325195, -56.403987884521484, -54.248477935791016, -52.09296798706055, -49.937461853027344, -47.781951904296875, -45.626441955566406, -43.47093200683594, -41.31542205810547, -39.159912109375, -37.00440216064453, -34.84889221191406, -32.693382263183594, -30.537874221801758, -28.382366180419922, -26.226856231689453, -24.071346282958984, -21.915836334228516, -19.760326385498047, -17.60481834411621, -15.449308395385742, -13.293798446655273, -11.138289451599121, -8.982780456542969, -6.827274322509766, -4.671764850616455, -2.5162553787231445, -0.360745906829834, 1.7947635650634766, 3.9502735137939453, 6.105782508850098, 8.26129150390625, 10.416801452636719, 12.572311401367188, 14.72782039642334, 16.883329391479492, 19.03883934020996, 21.19434928894043, 23.349857330322266, 25.505367279052734, 27.660877227783203, 29.816387176513672, 31.97189712524414, 34.12740707397461, 36.28291320800781, 38.43842315673828, 40.59393310546875, 42.74944305419922, 44.90495300292969, 47.060462951660156, 49.215972900390625, 51.371482849121094, 53.52699279785156, 55.68250274658203, 57.838008880615234, 59.9935188293457, 62.14902877807617]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 7.0, 6.0, 7.0, 13.0, 14.0, 10.0, 13.0, 16.0, 19.0, 20.0, 22.0, 26.0, 32.0, 31.0, 38.0, 37.0, 39.0, 37.0, 30.0, 49.0, 40.0, 45.0, 41.0, 43.0, 36.0, 33.0, 36.0, 27.0, 37.0, 30.0, 24.0, 20.0, 18.0, 22.0, 11.0, 16.0, 15.0, 2.0, 9.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.99536895751953, -54.92876434326172, -52.862159729003906, -50.795555114746094, -48.72895050048828, -46.66234588623047, -44.595741271972656, -42.529136657714844, -40.46253204345703, -38.39592742919922, -36.329322814941406, -34.262718200683594, -32.19611358642578, -30.12950897216797, -28.062902450561523, -25.99629783630371, -23.929691314697266, -21.863086700439453, -19.79648208618164, -17.729877471923828, -15.6632719039917, -13.596667289733887, -11.530061721801758, -9.463457107543945, -7.396852493286133, -5.33024787902832, -3.2636427879333496, -1.197037696838379, 0.8695669174194336, 2.936171531677246, 5.002777099609375, 7.0693817138671875, 9.135986328125, 11.202590942382812, 13.269195556640625, 15.335801124572754, 17.40240478515625, 19.469009399414062, 21.535615921020508, 23.60222053527832, 25.668825149536133, 27.735429763793945, 29.802034378051758, 31.868640899658203, 33.935245513916016, 36.00185012817383, 38.06845474243164, 40.13505935668945, 42.201663970947266, 44.26826858520508, 46.33487319946289, 48.4014778137207, 50.468082427978516, 52.53468704223633, 54.601295471191406, 56.66790008544922, 58.73450469970703, 60.801109313964844, 62.867713928222656, 64.93431854248047, 67.00092315673828, 69.0675277709961, 71.1341323852539, 73.20073699951172, 75.26734161376953]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 9.0, 14.0, 21.0, 14.0, 30.0, 44.0, 57.0, 98.0, 128.0, 182.0, 293.0, 411.0, 679.0, 972.0, 1577.0, 2398.0, 3848.0, 6403.0, 10704.0, 17835.0, 29680.0, 47745.0, 73195.0, 102486.0, 129782.0, 142976.0, 136751.0, 113332.0, 82471.0, 55658.0, 34748.0, 21023.0, 12751.0, 7532.0, 4548.0, 2908.0, 1751.0, 1160.0, 759.0, 483.0, 350.0, 241.0, 148.0, 108.0, 77.0, 60.0, 37.0, 26.0, 18.0, 12.0, 10.0, 4.0, 8.0, 4.0, 3.0, 0.0, 1.0], "bins": [-68.6875, -66.5849609375, -64.482421875, -62.3798828125, -60.27734375, -58.1748046875, -56.072265625, -53.9697265625, -51.8671875, -49.7646484375, -47.662109375, -45.5595703125, -43.45703125, -41.3544921875, -39.251953125, -37.1494140625, -35.046875, -32.9443359375, -30.841796875, -28.7392578125, -26.63671875, -24.5341796875, -22.431640625, -20.3291015625, -18.2265625, -16.1240234375, -14.021484375, -11.9189453125, -9.81640625, -7.7138671875, -5.611328125, -3.5087890625, -1.40625, 0.6962890625, 2.798828125, 4.9013671875, 7.00390625, 9.1064453125, 11.208984375, 13.3115234375, 15.4140625, 17.5166015625, 19.619140625, 21.7216796875, 23.82421875, 25.9267578125, 28.029296875, 30.1318359375, 32.234375, 34.3369140625, 36.439453125, 38.5419921875, 40.64453125, 42.7470703125, 44.849609375, 46.9521484375, 49.0546875, 51.1572265625, 53.259765625, 55.3623046875, 57.46484375, 59.5673828125, 61.669921875, 63.7724609375, 65.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 7.0, 0.0, 5.0, 5.0, 4.0, 8.0, 5.0, 8.0, 14.0, 16.0, 15.0, 14.0, 11.0, 22.0, 23.0, 23.0, 24.0, 31.0, 37.0, 38.0, 37.0, 34.0, 42.0, 35.0, 52.0, 35.0, 47.0, 43.0, 35.0, 38.0, 30.0, 34.0, 31.0, 34.0, 27.0, 18.0, 25.0, 18.0, 19.0, 12.0, 8.0, 12.0, 7.0, 8.0, 12.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.625, -52.7490234375, -50.873046875, -48.9970703125, -47.12109375, -45.2451171875, -43.369140625, -41.4931640625, -39.6171875, -37.7412109375, -35.865234375, -33.9892578125, -32.11328125, -30.2373046875, -28.361328125, -26.4853515625, -24.609375, -22.7333984375, -20.857421875, -18.9814453125, -17.10546875, -15.2294921875, -13.353515625, -11.4775390625, -9.6015625, -7.7255859375, -5.849609375, -3.9736328125, -2.09765625, -0.2216796875, 1.654296875, 3.5302734375, 5.40625, 7.2822265625, 9.158203125, 11.0341796875, 12.91015625, 14.7861328125, 16.662109375, 18.5380859375, 20.4140625, 22.2900390625, 24.166015625, 26.0419921875, 27.91796875, 29.7939453125, 31.669921875, 33.5458984375, 35.421875, 37.2978515625, 39.173828125, 41.0498046875, 42.92578125, 44.8017578125, 46.677734375, 48.5537109375, 50.4296875, 52.3056640625, 54.181640625, 56.0576171875, 57.93359375, 59.8095703125, 61.685546875, 63.5615234375, 65.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 12.0, 19.0, 24.0, 56.0, 81.0, 115.0, 156.0, 259.0, 389.0, 579.0, 859.0, 1403.0, 2429.0, 3838.0, 6484.0, 11297.0, 20446.0, 35294.0, 60573.0, 95516.0, 135745.0, 163314.0, 160509.0, 129149.0, 88265.0, 55305.0, 32340.0, 18194.0, 10479.0, 6011.0, 3540.0, 2165.0, 1318.0, 820.0, 558.0, 322.0, 214.0, 150.0, 109.0, 67.0, 44.0, 30.0, 27.0, 17.0, 7.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-82.625, -79.9521484375, -77.279296875, -74.6064453125, -71.93359375, -69.2607421875, -66.587890625, -63.9150390625, -61.2421875, -58.5693359375, -55.896484375, -53.2236328125, -50.55078125, -47.8779296875, -45.205078125, -42.5322265625, -39.859375, -37.1865234375, -34.513671875, -31.8408203125, -29.16796875, -26.4951171875, -23.822265625, -21.1494140625, -18.4765625, -15.8037109375, -13.130859375, -10.4580078125, -7.78515625, -5.1123046875, -2.439453125, 0.2333984375, 2.90625, 5.5791015625, 8.251953125, 10.9248046875, 13.59765625, 16.2705078125, 18.943359375, 21.6162109375, 24.2890625, 26.9619140625, 29.634765625, 32.3076171875, 34.98046875, 37.6533203125, 40.326171875, 42.9990234375, 45.671875, 48.3447265625, 51.017578125, 53.6904296875, 56.36328125, 59.0361328125, 61.708984375, 64.3818359375, 67.0546875, 69.7275390625, 72.400390625, 75.0732421875, 77.74609375, 80.4189453125, 83.091796875, 85.7646484375, 88.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 9.0, 6.0, 12.0, 15.0, 17.0, 18.0, 14.0, 21.0, 37.0, 27.0, 36.0, 32.0, 41.0, 49.0, 53.0, 45.0, 42.0, 45.0, 40.0, 46.0, 52.0, 44.0, 36.0, 44.0, 31.0, 32.0, 23.0, 17.0, 24.0, 18.0, 8.0, 12.0, 14.0, 16.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-43.5625, -42.216796875, -40.87109375, -39.525390625, -38.1796875, -36.833984375, -35.48828125, -34.142578125, -32.796875, -31.451171875, -30.10546875, -28.759765625, -27.4140625, -26.068359375, -24.72265625, -23.376953125, -22.03125, -20.685546875, -19.33984375, -17.994140625, -16.6484375, -15.302734375, -13.95703125, -12.611328125, -11.265625, -9.919921875, -8.57421875, -7.228515625, -5.8828125, -4.537109375, -3.19140625, -1.845703125, -0.5, 0.845703125, 2.19140625, 3.537109375, 4.8828125, 6.228515625, 7.57421875, 8.919921875, 10.265625, 11.611328125, 12.95703125, 14.302734375, 15.6484375, 16.994140625, 18.33984375, 19.685546875, 21.03125, 22.376953125, 23.72265625, 25.068359375, 26.4140625, 27.759765625, 29.10546875, 30.451171875, 31.796875, 33.142578125, 34.48828125, 35.833984375, 37.1796875, 38.525390625, 39.87109375, 41.216796875, 42.5625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 10.0, 15.0, 20.0, 25.0, 35.0, 60.0, 90.0, 155.0, 266.0, 440.0, 766.0, 1254.0, 2036.0, 3736.0, 6529.0, 11717.0, 20416.0, 34799.0, 57247.0, 87455.0, 120736.0, 146029.0, 150679.0, 132084.0, 101420.0, 68222.0, 42752.0, 25298.0, 14590.0, 8432.0, 4807.0, 2667.0, 1525.0, 890.0, 541.0, 312.0, 169.0, 124.0, 69.0, 54.0, 32.0, 21.0, 12.0, 10.0, 5.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.90625, -18.30029296875, -17.6943359375, -17.08837890625, -16.482421875, -15.87646484375, -15.2705078125, -14.66455078125, -14.05859375, -13.45263671875, -12.8466796875, -12.24072265625, -11.634765625, -11.02880859375, -10.4228515625, -9.81689453125, -9.2109375, -8.60498046875, -7.9990234375, -7.39306640625, -6.787109375, -6.18115234375, -5.5751953125, -4.96923828125, -4.36328125, -3.75732421875, -3.1513671875, -2.54541015625, -1.939453125, -1.33349609375, -0.7275390625, -0.12158203125, 0.484375, 1.09033203125, 1.6962890625, 2.30224609375, 2.908203125, 3.51416015625, 4.1201171875, 4.72607421875, 5.33203125, 5.93798828125, 6.5439453125, 7.14990234375, 7.755859375, 8.36181640625, 8.9677734375, 9.57373046875, 10.1796875, 10.78564453125, 11.3916015625, 11.99755859375, 12.603515625, 13.20947265625, 13.8154296875, 14.42138671875, 15.02734375, 15.63330078125, 16.2392578125, 16.84521484375, 17.451171875, 18.05712890625, 18.6630859375, 19.26904296875, 19.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 7.0, 7.0, 10.0, 11.0, 28.0, 20.0, 25.0, 32.0, 34.0, 37.0, 42.0, 49.0, 51.0, 51.0, 42.0, 63.0, 51.0, 45.0, 55.0, 41.0, 35.0, 35.0, 34.0, 34.0, 26.0, 29.0, 11.0, 21.0, 12.0, 14.0, 8.0, 11.0, 4.0, 4.0, 5.0, 2.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019254684448242188, -0.0018616467714309692, -0.0017978250980377197, -0.0017340034246444702, -0.0016701817512512207, -0.0016063600778579712, -0.0015425384044647217, -0.0014787167310714722, -0.0014148950576782227, -0.0013510733842849731, -0.0012872517108917236, -0.0012234300374984741, -0.0011596083641052246, -0.001095786690711975, -0.0010319650173187256, -0.0009681433439254761, -0.0009043216705322266, -0.000840499997138977, -0.0007766783237457275, -0.000712856650352478, -0.0006490349769592285, -0.000585213303565979, -0.0005213916301727295, -0.00045756995677948, -0.00039374828338623047, -0.00032992660999298096, -0.00026610493659973145, -0.00020228326320648193, -0.00013846158981323242, -7.463991641998291e-05, -1.0818243026733398e-05, 5.300343036651611e-05, 0.00011682510375976562, 0.00018064677715301514, 0.00024446845054626465, 0.00030829012393951416, 0.00037211179733276367, 0.0004359334707260132, 0.0004997551441192627, 0.0005635768175125122, 0.0006273984909057617, 0.0006912201642990112, 0.0007550418376922607, 0.0008188635110855103, 0.0008826851844787598, 0.0009465068578720093, 0.0010103285312652588, 0.0010741502046585083, 0.0011379718780517578, 0.0012017935514450073, 0.0012656152248382568, 0.0013294368982315063, 0.0013932585716247559, 0.0014570802450180054, 0.0015209019184112549, 0.0015847235918045044, 0.001648545265197754, 0.0017123669385910034, 0.001776188611984253, 0.0018400102853775024, 0.001903831958770752, 0.0019676536321640015, 0.002031475305557251, 0.0020952969789505005, 0.00215911865234375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 18.0, 34.0, 37.0, 41.0, 90.0, 118.0, 176.0, 264.0, 391.0, 599.0, 844.0, 1382.0, 1991.0, 3005.0, 4867.0, 7403.0, 11499.0, 17803.0, 27030.0, 40146.0, 57317.0, 79016.0, 100157.0, 116513.0, 122690.0, 114808.0, 97569.0, 76024.0, 54754.0, 37952.0, 25858.0, 16797.0, 11065.0, 7125.0, 4483.0, 2996.0, 1931.0, 1288.0, 836.0, 507.0, 380.0, 224.0, 165.0, 105.0, 76.0, 49.0, 39.0, 25.0, 17.0, 13.0, 9.0, 6.0, 3.0, 9.0, 3.0, 1.0], "bins": [-16.25, -15.7490234375, -15.248046875, -14.7470703125, -14.24609375, -13.7451171875, -13.244140625, -12.7431640625, -12.2421875, -11.7412109375, -11.240234375, -10.7392578125, -10.23828125, -9.7373046875, -9.236328125, -8.7353515625, -8.234375, -7.7333984375, -7.232421875, -6.7314453125, -6.23046875, -5.7294921875, -5.228515625, -4.7275390625, -4.2265625, -3.7255859375, -3.224609375, -2.7236328125, -2.22265625, -1.7216796875, -1.220703125, -0.7197265625, -0.21875, 0.2822265625, 0.783203125, 1.2841796875, 1.78515625, 2.2861328125, 2.787109375, 3.2880859375, 3.7890625, 4.2900390625, 4.791015625, 5.2919921875, 5.79296875, 6.2939453125, 6.794921875, 7.2958984375, 7.796875, 8.2978515625, 8.798828125, 9.2998046875, 9.80078125, 10.3017578125, 10.802734375, 11.3037109375, 11.8046875, 12.3056640625, 12.806640625, 13.3076171875, 13.80859375, 14.3095703125, 14.810546875, 15.3115234375, 15.8125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 3.0, 10.0, 16.0, 15.0, 24.0, 16.0, 25.0, 20.0, 39.0, 42.0, 41.0, 41.0, 45.0, 60.0, 58.0, 48.0, 66.0, 53.0, 46.0, 36.0, 31.0, 38.0, 38.0, 38.0, 22.0, 24.0, 13.0, 16.0, 16.0, 6.0, 6.0, 9.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.24609375, -7.018798828125, -6.79150390625, -6.564208984375, -6.3369140625, -6.109619140625, -5.88232421875, -5.655029296875, -5.427734375, -5.200439453125, -4.97314453125, -4.745849609375, -4.5185546875, -4.291259765625, -4.06396484375, -3.836669921875, -3.609375, -3.382080078125, -3.15478515625, -2.927490234375, -2.7001953125, -2.472900390625, -2.24560546875, -2.018310546875, -1.791015625, -1.563720703125, -1.33642578125, -1.109130859375, -0.8818359375, -0.654541015625, -0.42724609375, -0.199951171875, 0.02734375, 0.254638671875, 0.48193359375, 0.709228515625, 0.9365234375, 1.163818359375, 1.39111328125, 1.618408203125, 1.845703125, 2.072998046875, 2.30029296875, 2.527587890625, 2.7548828125, 2.982177734375, 3.20947265625, 3.436767578125, 3.6640625, 3.891357421875, 4.11865234375, 4.345947265625, 4.5732421875, 4.800537109375, 5.02783203125, 5.255126953125, 5.482421875, 5.709716796875, 5.93701171875, 6.164306640625, 6.3916015625, 6.618896484375, 6.84619140625, 7.073486328125, 7.30078125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 5.0, 13.0, 9.0, 9.0, 12.0, 12.0, 18.0, 20.0, 29.0, 33.0, 32.0, 41.0, 37.0, 45.0, 36.0, 39.0, 42.0, 33.0, 48.0, 44.0, 35.0, 45.0, 39.0, 42.0, 30.0, 36.0, 26.0, 31.0, 16.0, 22.0, 20.0, 18.0, 12.0, 12.0, 6.0, 14.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-62.189083099365234, -60.27553939819336, -58.361995697021484, -56.44845199584961, -54.534908294677734, -52.621360778808594, -50.70781707763672, -48.794273376464844, -46.88072967529297, -44.967185974121094, -43.05364227294922, -41.140098571777344, -39.22655487060547, -37.313011169433594, -35.39946746826172, -33.48591995239258, -31.572378158569336, -29.65883445739746, -27.745290756225586, -25.831745147705078, -23.918201446533203, -22.004657745361328, -20.091114044189453, -18.177570343017578, -16.264026641845703, -14.350482940673828, -12.436938285827637, -10.523394584655762, -8.60984992980957, -6.696306228637695, -4.78276252746582, -2.869217872619629, -0.9556732177734375, 0.9578708410263062, 2.87141489982605, 4.784958839416504, 6.698503017425537, 8.61204719543457, 10.525590896606445, 12.439135551452637, 14.352679252624512, 16.266223907470703, 18.179767608642578, 20.093311309814453, 22.006855010986328, 23.920398712158203, 25.833942413330078, 27.747488021850586, 29.66103172302246, 31.574575424194336, 33.488121032714844, 35.40166473388672, 37.315208435058594, 39.22875213623047, 41.142295837402344, 43.05583953857422, 44.969383239746094, 46.88292694091797, 48.796470642089844, 50.71001434326172, 52.623558044433594, 54.53710174560547, 56.450645446777344, 58.364192962646484, 60.27773666381836]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 6.0, 5.0, 9.0, 12.0, 14.0, 12.0, 28.0, 14.0, 15.0, 17.0, 21.0, 32.0, 37.0, 31.0, 25.0, 33.0, 27.0, 35.0, 42.0, 37.0, 33.0, 38.0, 43.0, 35.0, 47.0, 33.0, 27.0, 25.0, 30.0, 26.0, 33.0, 33.0, 23.0, 12.0, 18.0, 16.0, 7.0, 13.0, 8.0, 12.0, 7.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.026329040527344, -50.16587829589844, -48.30542755126953, -46.444976806640625, -44.584529876708984, -42.72407913208008, -40.86362838745117, -39.003177642822266, -37.142730712890625, -35.28227996826172, -33.42182922363281, -31.56138038635254, -29.700931549072266, -27.84048080444336, -25.980030059814453, -24.119579315185547, -22.25912857055664, -20.398677825927734, -18.53822898864746, -16.677778244018555, -14.817328453063965, -12.956878662109375, -11.096427917480469, -9.235978126525879, -7.375528335571289, -5.515078544616699, -3.654628276824951, -1.7941780090332031, 0.06627178192138672, 1.9267215728759766, 3.787172317504883, 5.647622108459473, 7.5080718994140625, 9.368521690368652, 11.228971481323242, 13.089422225952148, 14.949872016906738, 16.810321807861328, 18.670772552490234, 20.53122329711914, 22.391672134399414, 24.25212287902832, 26.112571716308594, 27.9730224609375, 29.833473205566406, 31.69392204284668, 33.55437469482422, 35.41482162475586, 37.275272369384766, 39.13572311401367, 40.99617385864258, 42.85662078857422, 44.717071533203125, 46.57752227783203, 48.43797302246094, 50.298423767089844, 52.15887451171875, 54.019325256347656, 55.87977600097656, 57.74022674560547, 59.60067367553711, 61.461124420166016, 63.32157516479492, 65.18202209472656, 67.04247283935547]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 5.0, 11.0, 18.0, 28.0, 42.0, 76.0, 121.0, 200.0, 316.0, 589.0, 952.0, 1492.0, 2526.0, 4350.0, 7005.0, 11884.0, 19751.0, 32830.0, 53605.0, 87683.0, 139074.0, 214626.0, 316454.0, 430625.0, 526383.0, 562820.0, 518340.0, 417305.0, 301483.0, 203956.0, 130892.0, 81386.0, 49896.0, 30420.0, 18512.0, 11151.0, 6719.0, 4072.0, 2501.0, 1595.0, 911.0, 659.0, 373.0, 229.0, 146.0, 86.0, 72.0, 44.0, 24.0, 14.0, 12.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0], "bins": [-58.125, -56.3330078125, -54.541015625, -52.7490234375, -50.95703125, -49.1650390625, -47.373046875, -45.5810546875, -43.7890625, -41.9970703125, -40.205078125, -38.4130859375, -36.62109375, -34.8291015625, -33.037109375, -31.2451171875, -29.453125, -27.6611328125, -25.869140625, -24.0771484375, -22.28515625, -20.4931640625, -18.701171875, -16.9091796875, -15.1171875, -13.3251953125, -11.533203125, -9.7412109375, -7.94921875, -6.1572265625, -4.365234375, -2.5732421875, -0.78125, 1.0107421875, 2.802734375, 4.5947265625, 6.38671875, 8.1787109375, 9.970703125, 11.7626953125, 13.5546875, 15.3466796875, 17.138671875, 18.9306640625, 20.72265625, 22.5146484375, 24.306640625, 26.0986328125, 27.890625, 29.6826171875, 31.474609375, 33.2666015625, 35.05859375, 36.8505859375, 38.642578125, 40.4345703125, 42.2265625, 44.0185546875, 45.810546875, 47.6025390625, 49.39453125, 51.1865234375, 52.978515625, 54.7705078125, 56.5625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 7.0, 7.0, 7.0, 11.0, 15.0, 13.0, 18.0, 19.0, 16.0, 21.0, 30.0, 24.0, 34.0, 34.0, 34.0, 26.0, 30.0, 31.0, 46.0, 47.0, 45.0, 35.0, 45.0, 31.0, 36.0, 35.0, 23.0, 25.0, 38.0, 36.0, 23.0, 23.0, 22.0, 15.0, 12.0, 16.0, 12.0, 9.0, 7.0, 11.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.78125, -43.15576171875, -41.5302734375, -39.90478515625, -38.279296875, -36.65380859375, -35.0283203125, -33.40283203125, -31.77734375, -30.15185546875, -28.5263671875, -26.90087890625, -25.275390625, -23.64990234375, -22.0244140625, -20.39892578125, -18.7734375, -17.14794921875, -15.5224609375, -13.89697265625, -12.271484375, -10.64599609375, -9.0205078125, -7.39501953125, -5.76953125, -4.14404296875, -2.5185546875, -0.89306640625, 0.732421875, 2.35791015625, 3.9833984375, 5.60888671875, 7.234375, 8.85986328125, 10.4853515625, 12.11083984375, 13.736328125, 15.36181640625, 16.9873046875, 18.61279296875, 20.23828125, 21.86376953125, 23.4892578125, 25.11474609375, 26.740234375, 28.36572265625, 29.9912109375, 31.61669921875, 33.2421875, 34.86767578125, 36.4931640625, 38.11865234375, 39.744140625, 41.36962890625, 42.9951171875, 44.62060546875, 46.24609375, 47.87158203125, 49.4970703125, 51.12255859375, 52.748046875, 54.37353515625, 55.9990234375, 57.62451171875, 59.25]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 11.0, 33.0, 44.0, 100.0, 147.0, 256.0, 409.0, 626.0, 1168.0, 1943.0, 3359.0, 5957.0, 10396.0, 17840.0, 31373.0, 53585.0, 89492.0, 143184.0, 221088.0, 322262.0, 431006.0, 518071.0, 550668.0, 510450.0, 418899.0, 309558.0, 212385.0, 136791.0, 83564.0, 50257.0, 29121.0, 16935.0, 9979.0, 5594.0, 3229.0, 1856.0, 1100.0, 592.0, 392.0, 238.0, 120.0, 72.0, 44.0, 22.0, 13.0, 13.0, 8.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-63.75, -61.84375, -59.9375, -58.03125, -56.125, -54.21875, -52.3125, -50.40625, -48.5, -46.59375, -44.6875, -42.78125, -40.875, -38.96875, -37.0625, -35.15625, -33.25, -31.34375, -29.4375, -27.53125, -25.625, -23.71875, -21.8125, -19.90625, -18.0, -16.09375, -14.1875, -12.28125, -10.375, -8.46875, -6.5625, -4.65625, -2.75, -0.84375, 1.0625, 2.96875, 4.875, 6.78125, 8.6875, 10.59375, 12.5, 14.40625, 16.3125, 18.21875, 20.125, 22.03125, 23.9375, 25.84375, 27.75, 29.65625, 31.5625, 33.46875, 35.375, 37.28125, 39.1875, 41.09375, 43.0, 44.90625, 46.8125, 48.71875, 50.625, 52.53125, 54.4375, 56.34375, 58.25]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 3.0, 5.0, 7.0, 7.0, 10.0, 10.0, 24.0, 27.0, 23.0, 42.0, 56.0, 82.0, 86.0, 119.0, 119.0, 140.0, 180.0, 174.0, 202.0, 220.0, 207.0, 214.0, 250.0, 230.0, 255.0, 214.0, 206.0, 167.0, 140.0, 129.0, 106.0, 94.0, 61.0, 64.0, 53.0, 41.0, 32.0, 21.0, 12.0, 19.0, 9.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.640625, -26.752197265625, -25.86376953125, -24.975341796875, -24.0869140625, -23.198486328125, -22.31005859375, -21.421630859375, -20.533203125, -19.644775390625, -18.75634765625, -17.867919921875, -16.9794921875, -16.091064453125, -15.20263671875, -14.314208984375, -13.42578125, -12.537353515625, -11.64892578125, -10.760498046875, -9.8720703125, -8.983642578125, -8.09521484375, -7.206787109375, -6.318359375, -5.429931640625, -4.54150390625, -3.653076171875, -2.7646484375, -1.876220703125, -0.98779296875, -0.099365234375, 0.7890625, 1.677490234375, 2.56591796875, 3.454345703125, 4.3427734375, 5.231201171875, 6.11962890625, 7.008056640625, 7.896484375, 8.784912109375, 9.67333984375, 10.561767578125, 11.4501953125, 12.338623046875, 13.22705078125, 14.115478515625, 15.00390625, 15.892333984375, 16.78076171875, 17.669189453125, 18.5576171875, 19.446044921875, 20.33447265625, 21.222900390625, 22.111328125, 22.999755859375, 23.88818359375, 24.776611328125, 25.6650390625, 26.553466796875, 27.44189453125, 28.330322265625, 29.21875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 6.0, 6.0, 13.0, 7.0, 8.0, 14.0, 9.0, 17.0, 25.0, 24.0, 29.0, 32.0, 38.0, 41.0, 44.0, 45.0, 47.0, 34.0, 47.0, 38.0, 34.0, 48.0, 40.0, 50.0, 34.0, 34.0, 38.0, 26.0, 24.0, 29.0, 19.0, 14.0, 18.0, 11.0, 9.0, 12.0, 5.0, 3.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-64.0414810180664, -62.051815032958984, -60.06214904785156, -58.072479248046875, -56.08281326293945, -54.09314727783203, -52.10348129272461, -50.11381530761719, -48.1241455078125, -46.13447952270508, -44.144813537597656, -42.15514373779297, -40.16547775268555, -38.175811767578125, -36.1861457824707, -34.19647979736328, -32.20681381225586, -30.217147827148438, -28.227479934692383, -26.23781394958496, -24.248146057128906, -22.258480072021484, -20.268814086914062, -18.27914810180664, -16.289480209350586, -14.299813270568848, -12.31014633178711, -10.320480346679688, -8.33081340789795, -6.341146469116211, -4.351480484008789, -2.361813545227051, -0.3721427917480469, 1.6175239086151123, 3.6071906089782715, 5.596857070922852, 7.58652400970459, 9.576190948486328, 11.56585693359375, 13.555523872375488, 15.545190811157227, 17.53485679626465, 19.524524688720703, 21.514190673828125, 23.503856658935547, 25.4935245513916, 27.483190536499023, 29.472858428955078, 31.4625244140625, 33.45219039916992, 35.441856384277344, 37.43152618408203, 39.42119216918945, 41.410858154296875, 43.4005241394043, 45.39019012451172, 47.379859924316406, 49.36952590942383, 51.35919189453125, 53.34886169433594, 55.33852767944336, 57.32819366455078, 59.3178596496582, 61.307525634765625, 63.29719161987305]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 9.0, 12.0, 17.0, 13.0, 13.0, 21.0, 21.0, 20.0, 30.0, 29.0, 30.0, 43.0, 33.0, 43.0, 34.0, 37.0, 35.0, 47.0, 42.0, 44.0, 56.0, 39.0, 28.0, 33.0, 35.0, 31.0, 32.0, 21.0, 18.0, 27.0, 17.0, 18.0, 12.0, 16.0, 8.0, 5.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.1981086730957, -50.17898178100586, -48.159854888916016, -46.14072799682617, -44.12159729003906, -42.10247039794922, -40.083343505859375, -38.06421661376953, -36.04508972167969, -34.025962829589844, -32.0068359375, -29.987707138061523, -27.96858024597168, -25.949453353881836, -23.93032455444336, -21.911197662353516, -19.892070770263672, -17.872943878173828, -15.853816032409668, -13.834688186645508, -11.815561294555664, -9.79643440246582, -7.77730655670166, -5.7581787109375, -3.7390518188476562, -1.7199244499206543, 0.29920291900634766, 2.3183302879333496, 4.337457656860352, 6.356584548950195, 8.375712394714355, 10.394840240478516, 12.413963317871094, 14.433090209960938, 16.45221710205078, 18.471345901489258, 20.4904727935791, 22.509599685668945, 24.528728485107422, 26.547855377197266, 28.56698226928711, 30.586109161376953, 32.6052360534668, 34.62436294555664, 36.64349365234375, 38.662620544433594, 40.68174743652344, 42.70087432861328, 44.720001220703125, 46.73912811279297, 48.75825500488281, 50.777381896972656, 52.7965087890625, 54.815635681152344, 56.83476638793945, 58.8538932800293, 60.87302017211914, 62.892147064208984, 64.9112777709961, 66.93040466308594, 68.94953155517578, 70.96865844726562, 72.98778533935547, 75.00691223144531, 77.02603912353516]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 10.0, 18.0, 26.0, 32.0, 62.0, 99.0, 123.0, 190.0, 332.0, 512.0, 805.0, 1310.0, 1936.0, 2922.0, 4618.0, 6983.0, 10573.0, 15849.0, 23310.0, 33445.0, 46418.0, 61905.0, 77733.0, 92309.0, 101624.0, 104860.0, 100458.0, 89157.0, 74347.0, 58061.0, 43335.0, 31382.0, 21663.0, 14597.0, 9589.0, 6322.0, 4161.0, 2599.0, 1713.0, 1105.0, 701.0, 478.0, 330.0, 185.0, 125.0, 98.0, 55.0, 38.0, 19.0, 14.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-28.078125, -27.18359375, -26.2890625, -25.39453125, -24.5, -23.60546875, -22.7109375, -21.81640625, -20.921875, -20.02734375, -19.1328125, -18.23828125, -17.34375, -16.44921875, -15.5546875, -14.66015625, -13.765625, -12.87109375, -11.9765625, -11.08203125, -10.1875, -9.29296875, -8.3984375, -7.50390625, -6.609375, -5.71484375, -4.8203125, -3.92578125, -3.03125, -2.13671875, -1.2421875, -0.34765625, 0.546875, 1.44140625, 2.3359375, 3.23046875, 4.125, 5.01953125, 5.9140625, 6.80859375, 7.703125, 8.59765625, 9.4921875, 10.38671875, 11.28125, 12.17578125, 13.0703125, 13.96484375, 14.859375, 15.75390625, 16.6484375, 17.54296875, 18.4375, 19.33203125, 20.2265625, 21.12109375, 22.015625, 22.91015625, 23.8046875, 24.69921875, 25.59375, 26.48828125, 27.3828125, 28.27734375, 29.171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 9.0, 16.0, 15.0, 15.0, 22.0, 21.0, 18.0, 30.0, 31.0, 30.0, 43.0, 35.0, 39.0, 33.0, 41.0, 33.0, 43.0, 42.0, 47.0, 54.0, 41.0, 27.0, 31.0, 34.0, 32.0, 34.0, 23.0, 19.0, 23.0, 19.0, 14.0, 15.0, 14.0, 11.0, 7.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.75, -50.712890625, -48.67578125, -46.638671875, -44.6015625, -42.564453125, -40.52734375, -38.490234375, -36.453125, -34.416015625, -32.37890625, -30.341796875, -28.3046875, -26.267578125, -24.23046875, -22.193359375, -20.15625, -18.119140625, -16.08203125, -14.044921875, -12.0078125, -9.970703125, -7.93359375, -5.896484375, -3.859375, -1.822265625, 0.21484375, 2.251953125, 4.2890625, 6.326171875, 8.36328125, 10.400390625, 12.4375, 14.474609375, 16.51171875, 18.548828125, 20.5859375, 22.623046875, 24.66015625, 26.697265625, 28.734375, 30.771484375, 32.80859375, 34.845703125, 36.8828125, 38.919921875, 40.95703125, 42.994140625, 45.03125, 47.068359375, 49.10546875, 51.142578125, 53.1796875, 55.216796875, 57.25390625, 59.291015625, 61.328125, 63.365234375, 65.40234375, 67.439453125, 69.4765625, 71.513671875, 73.55078125, 75.587890625, 77.625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 13.0, 8.0, 11.0, 23.0, 42.0, 40.0, 66.0, 96.0, 123.0, 178.0, 230.0, 337.0, 462.0, 608.0, 912.0, 1204.0, 1691.0, 2282.0, 3206.0, 4328.0, 5954.0, 8307.0, 11384.0, 15689.0, 22526.0, 64395.0, 673006.0, 142752.0, 25810.0, 17002.0, 12508.0, 9026.0, 6700.0, 4899.0, 3575.0, 2543.0, 1775.0, 1353.0, 950.0, 754.0, 491.0, 381.0, 250.0, 199.0, 146.0, 99.0, 81.0, 47.0, 37.0, 15.0, 13.0, 12.0, 5.0, 4.0, 4.0, 2.0, 1.0, 5.0], "bins": [-47.9375, -46.46875, -45.0, -43.53125, -42.0625, -40.59375, -39.125, -37.65625, -36.1875, -34.71875, -33.25, -31.78125, -30.3125, -28.84375, -27.375, -25.90625, -24.4375, -22.96875, -21.5, -20.03125, -18.5625, -17.09375, -15.625, -14.15625, -12.6875, -11.21875, -9.75, -8.28125, -6.8125, -5.34375, -3.875, -2.40625, -0.9375, 0.53125, 2.0, 3.46875, 4.9375, 6.40625, 7.875, 9.34375, 10.8125, 12.28125, 13.75, 15.21875, 16.6875, 18.15625, 19.625, 21.09375, 22.5625, 24.03125, 25.5, 26.96875, 28.4375, 29.90625, 31.375, 32.84375, 34.3125, 35.78125, 37.25, 38.71875, 40.1875, 41.65625, 43.125, 44.59375, 46.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 10.0, 3.0, 11.0, 7.0, 7.0, 18.0, 13.0, 20.0, 16.0, 16.0, 18.0, 31.0, 39.0, 37.0, 42.0, 43.0, 43.0, 49.0, 43.0, 63.0, 36.0, 46.0, 41.0, 48.0, 37.0, 27.0, 31.0, 38.0, 31.0, 24.0, 22.0, 17.0, 19.0, 18.0, 10.0, 9.0, 3.0, 6.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.78125, -42.1962890625, -40.611328125, -39.0263671875, -37.44140625, -35.8564453125, -34.271484375, -32.6865234375, -31.1015625, -29.5166015625, -27.931640625, -26.3466796875, -24.76171875, -23.1767578125, -21.591796875, -20.0068359375, -18.421875, -16.8369140625, -15.251953125, -13.6669921875, -12.08203125, -10.4970703125, -8.912109375, -7.3271484375, -5.7421875, -4.1572265625, -2.572265625, -0.9873046875, 0.59765625, 2.1826171875, 3.767578125, 5.3525390625, 6.9375, 8.5224609375, 10.107421875, 11.6923828125, 13.27734375, 14.8623046875, 16.447265625, 18.0322265625, 19.6171875, 21.2021484375, 22.787109375, 24.3720703125, 25.95703125, 27.5419921875, 29.126953125, 30.7119140625, 32.296875, 33.8818359375, 35.466796875, 37.0517578125, 38.63671875, 40.2216796875, 41.806640625, 43.3916015625, 44.9765625, 46.5615234375, 48.146484375, 49.7314453125, 51.31640625, 52.9013671875, 54.486328125, 56.0712890625, 57.65625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 20.0, 16.0, 22.0, 27.0, 45.0, 47.0, 65.0, 80.0, 110.0, 145.0, 194.0, 284.0, 369.0, 591.0, 705.0, 1040.0, 1513.0, 2240.0, 3047.0, 4776.0, 6969.0, 10614.0, 16690.0, 30278.0, 148299.0, 679154.0, 72873.0, 24596.0, 14626.0, 9452.0, 6087.0, 4114.0, 2833.0, 1871.0, 1361.0, 913.0, 658.0, 480.0, 338.0, 256.0, 193.0, 132.0, 124.0, 83.0, 52.0, 44.0, 31.0, 24.0, 12.0, 22.0, 5.0, 14.0, 6.0, 3.0, 4.0, 1.0, 3.0], "bins": [-4.98046875, -4.8265380859375, -4.672607421875, -4.5186767578125, -4.36474609375, -4.2108154296875, -4.056884765625, -3.9029541015625, -3.7490234375, -3.5950927734375, -3.441162109375, -3.2872314453125, -3.13330078125, -2.9793701171875, -2.825439453125, -2.6715087890625, -2.517578125, -2.3636474609375, -2.209716796875, -2.0557861328125, -1.90185546875, -1.7479248046875, -1.593994140625, -1.4400634765625, -1.2861328125, -1.1322021484375, -0.978271484375, -0.8243408203125, -0.67041015625, -0.5164794921875, -0.362548828125, -0.2086181640625, -0.0546875, 0.0992431640625, 0.253173828125, 0.4071044921875, 0.56103515625, 0.7149658203125, 0.868896484375, 1.0228271484375, 1.1767578125, 1.3306884765625, 1.484619140625, 1.6385498046875, 1.79248046875, 1.9464111328125, 2.100341796875, 2.2542724609375, 2.408203125, 2.5621337890625, 2.716064453125, 2.8699951171875, 3.02392578125, 3.1778564453125, 3.331787109375, 3.4857177734375, 3.6396484375, 3.7935791015625, 3.947509765625, 4.1014404296875, 4.25537109375, 4.4093017578125, 4.563232421875, 4.7171630859375, 4.87109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 6.0, 6.0, 4.0, 9.0, 7.0, 12.0, 14.0, 7.0, 15.0, 16.0, 27.0, 29.0, 19.0, 29.0, 28.0, 38.0, 40.0, 42.0, 47.0, 44.0, 42.0, 43.0, 52.0, 46.0, 53.0, 41.0, 40.0, 41.0, 25.0, 26.0, 21.0, 24.0, 22.0, 17.0, 9.0, 11.0, 11.0, 4.0, 6.0, 10.0, 6.0, 1.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0011510848999023438, -0.0011145174503326416, -0.0010779500007629395, -0.0010413825511932373, -0.0010048151016235352, -0.000968247652053833, -0.0009316802024841309, -0.0008951127529144287, -0.0008585453033447266, -0.0008219778537750244, -0.0007854104042053223, -0.0007488429546356201, -0.000712275505065918, -0.0006757080554962158, -0.0006391406059265137, -0.0006025731563568115, -0.0005660057067871094, -0.0005294382572174072, -0.0004928708076477051, -0.00045630335807800293, -0.0004197359085083008, -0.00038316845893859863, -0.0003466010093688965, -0.00031003355979919434, -0.0002734661102294922, -0.00023689866065979004, -0.0002003312110900879, -0.00016376376152038574, -0.0001271963119506836, -9.062886238098145e-05, -5.40614128112793e-05, -1.749396324157715e-05, 1.9073486328125e-05, 5.564093589782715e-05, 9.22083854675293e-05, 0.00012877583503723145, 0.0001653432846069336, 0.00020191073417663574, 0.0002384781837463379, 0.00027504563331604004, 0.0003116130828857422, 0.00034818053245544434, 0.0003847479820251465, 0.00042131543159484863, 0.0004578828811645508, 0.0004944503307342529, 0.0005310177803039551, 0.0005675852298736572, 0.0006041526794433594, 0.0006407201290130615, 0.0006772875785827637, 0.0007138550281524658, 0.000750422477722168, 0.0007869899272918701, 0.0008235573768615723, 0.0008601248264312744, 0.0008966922760009766, 0.0009332597255706787, 0.0009698271751403809, 0.001006394624710083, 0.0010429620742797852, 0.0010795295238494873, 0.0011160969734191895, 0.0011526644229888916, 0.0011892318725585938]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 4.0, 9.0, 6.0, 12.0, 17.0, 31.0, 42.0, 61.0, 82.0, 158.0, 176.0, 338.0, 453.0, 696.0, 993.0, 1501.0, 2310.0, 3416.0, 5375.0, 8284.0, 12780.0, 19713.0, 30933.0, 46364.0, 68397.0, 93987.0, 119371.0, 134051.0, 129967.0, 111039.0, 83812.0, 59623.0, 40182.0, 26158.0, 16721.0, 10956.0, 7068.0, 4629.0, 2926.0, 1983.0, 1275.0, 918.0, 592.0, 380.0, 268.0, 178.0, 111.0, 65.0, 62.0, 35.0, 16.0, 15.0, 11.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0], "bins": [-2.68359375, -2.5992431640625, -2.514892578125, -2.4305419921875, -2.34619140625, -2.2618408203125, -2.177490234375, -2.0931396484375, -2.0087890625, -1.9244384765625, -1.840087890625, -1.7557373046875, -1.67138671875, -1.5870361328125, -1.502685546875, -1.4183349609375, -1.333984375, -1.2496337890625, -1.165283203125, -1.0809326171875, -0.99658203125, -0.9122314453125, -0.827880859375, -0.7435302734375, -0.6591796875, -0.5748291015625, -0.490478515625, -0.4061279296875, -0.32177734375, -0.2374267578125, -0.153076171875, -0.0687255859375, 0.015625, 0.0999755859375, 0.184326171875, 0.2686767578125, 0.35302734375, 0.4373779296875, 0.521728515625, 0.6060791015625, 0.6904296875, 0.7747802734375, 0.859130859375, 0.9434814453125, 1.02783203125, 1.1121826171875, 1.196533203125, 1.2808837890625, 1.365234375, 1.4495849609375, 1.533935546875, 1.6182861328125, 1.70263671875, 1.7869873046875, 1.871337890625, 1.9556884765625, 2.0400390625, 2.1243896484375, 2.208740234375, 2.2930908203125, 2.37744140625, 2.4617919921875, 2.546142578125, 2.6304931640625, 2.71484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 5.0, 2.0, 7.0, 3.0, 21.0, 13.0, 12.0, 23.0, 19.0, 30.0, 29.0, 36.0, 43.0, 41.0, 49.0, 43.0, 49.0, 56.0, 49.0, 54.0, 59.0, 44.0, 54.0, 42.0, 35.0, 38.0, 20.0, 14.0, 21.0, 15.0, 16.0, 5.0, 13.0, 11.0, 4.0, 10.0, 6.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.078125, -1.0448760986328125, -1.011627197265625, -0.9783782958984375, -0.94512939453125, -0.9118804931640625, -0.878631591796875, -0.8453826904296875, -0.8121337890625, -0.7788848876953125, -0.745635986328125, -0.7123870849609375, -0.67913818359375, -0.6458892822265625, -0.612640380859375, -0.5793914794921875, -0.546142578125, -0.5128936767578125, -0.479644775390625, -0.4463958740234375, -0.41314697265625, -0.3798980712890625, -0.346649169921875, -0.3134002685546875, -0.2801513671875, -0.2469024658203125, -0.213653564453125, -0.1804046630859375, -0.14715576171875, -0.1139068603515625, -0.080657958984375, -0.0474090576171875, -0.01416015625, 0.0190887451171875, 0.052337646484375, 0.0855865478515625, 0.11883544921875, 0.1520843505859375, 0.185333251953125, 0.2185821533203125, 0.2518310546875, 0.2850799560546875, 0.318328857421875, 0.3515777587890625, 0.38482666015625, 0.4180755615234375, 0.451324462890625, 0.4845733642578125, 0.517822265625, 0.5510711669921875, 0.584320068359375, 0.6175689697265625, 0.65081787109375, 0.6840667724609375, 0.717315673828125, 0.7505645751953125, 0.7838134765625, 0.8170623779296875, 0.850311279296875, 0.8835601806640625, 0.91680908203125, 0.9500579833984375, 0.983306884765625, 1.0165557861328125, 1.0498046875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 5.0, 9.0, 7.0, 14.0, 13.0, 22.0, 16.0, 27.0, 34.0, 44.0, 25.0, 27.0, 46.0, 45.0, 53.0, 58.0, 55.0, 48.0, 45.0, 46.0, 37.0, 39.0, 51.0, 36.0, 39.0, 31.0, 18.0, 12.0, 24.0, 17.0, 13.0, 12.0, 2.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-76.9545669555664, -74.69002532958984, -72.42549133300781, -70.16094970703125, -67.89641571044922, -65.63187408447266, -63.36733627319336, -61.10279846191406, -58.838260650634766, -56.57372283935547, -54.30918502807617, -52.044647216796875, -49.78010559082031, -47.51557159423828, -45.25102996826172, -42.98649215698242, -40.721954345703125, -38.45741653442383, -36.19287872314453, -33.928340911865234, -31.663801193237305, -29.399263381958008, -27.134723663330078, -24.87018585205078, -22.605648040771484, -20.341110229492188, -18.07657241821289, -15.812032699584961, -13.547494888305664, -11.282957077026367, -9.018418312072754, -6.753879547119141, -4.4893341064453125, -2.2247958183288574, 0.039742469787597656, 2.3042807579040527, 4.568819046020508, 6.833356857299805, 9.097895622253418, 11.362434387207031, 13.626972198486328, 15.891510009765625, 18.156047821044922, 20.42058753967285, 22.68512535095215, 24.949663162231445, 27.214202880859375, 29.478740692138672, 31.74327850341797, 34.007816314697266, 36.27235412597656, 38.53689193725586, 40.801429748535156, 43.06597137451172, 45.330509185791016, 47.59504699707031, 49.85958480834961, 52.124122619628906, 54.3886604309082, 56.6531982421875, 58.91773986816406, 61.182273864746094, 63.446815490722656, 65.71134948730469, 67.97589111328125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 7.0, 6.0, 7.0, 10.0, 11.0, 13.0, 20.0, 12.0, 27.0, 18.0, 29.0, 23.0, 34.0, 39.0, 39.0, 33.0, 43.0, 34.0, 31.0, 44.0, 45.0, 44.0, 53.0, 47.0, 34.0, 28.0, 35.0, 37.0, 27.0, 26.0, 22.0, 20.0, 25.0, 15.0, 14.0, 14.0, 9.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.366737365722656, -52.296630859375, -50.22652816772461, -48.15642166137695, -46.08631896972656, -44.016212463378906, -41.94610595703125, -39.875999450683594, -37.8058967590332, -35.73579025268555, -33.665687561035156, -31.5955810546875, -29.525476455688477, -27.455371856689453, -25.385265350341797, -23.315160751342773, -21.24505615234375, -19.174951553344727, -17.104846954345703, -15.034740447998047, -12.964635848999023, -10.89453125, -8.82442569732666, -6.75432014465332, -4.684215545654297, -2.6141104698181152, -0.5440053939819336, 1.526099681854248, 3.5962047576904297, 5.666309356689453, 7.736414909362793, 9.806520462036133, 11.876617431640625, 13.946722030639648, 16.016826629638672, 18.086933135986328, 20.15703773498535, 22.227142333984375, 24.29724884033203, 26.367353439331055, 28.437458038330078, 30.5075626373291, 32.577667236328125, 34.64777374267578, 36.71788024902344, 38.78798294067383, 40.858089447021484, 42.928192138671875, 44.99829864501953, 47.06840515136719, 49.13850784301758, 51.208614349365234, 53.278717041015625, 55.34882354736328, 57.41893005371094, 59.489036560058594, 61.559139251708984, 63.62924575805664, 65.69934844970703, 67.76945495605469, 69.83956146240234, 71.90966796875, 73.97976684570312, 76.04987335205078, 78.11997985839844]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 12.0, 30.0, 54.0, 54.0, 92.0, 157.0, 224.0, 417.0, 633.0, 1040.0, 1811.0, 3028.0, 4995.0, 8713.0, 14132.0, 23245.0, 36536.0, 54820.0, 78354.0, 100563.0, 119748.0, 127566.0, 122210.0, 104890.0, 82340.0, 58774.0, 39752.0, 25528.0, 15418.0, 9606.0, 5499.0, 3240.0, 1958.0, 1195.0, 739.0, 464.0, 268.0, 164.0, 106.0, 66.0, 39.0, 21.0, 16.0, 12.0, 8.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.21875, -51.42041015625, -49.6220703125, -47.82373046875, -46.025390625, -44.22705078125, -42.4287109375, -40.63037109375, -38.83203125, -37.03369140625, -35.2353515625, -33.43701171875, -31.638671875, -29.84033203125, -28.0419921875, -26.24365234375, -24.4453125, -22.64697265625, -20.8486328125, -19.05029296875, -17.251953125, -15.45361328125, -13.6552734375, -11.85693359375, -10.05859375, -8.26025390625, -6.4619140625, -4.66357421875, -2.865234375, -1.06689453125, 0.7314453125, 2.52978515625, 4.328125, 6.12646484375, 7.9248046875, 9.72314453125, 11.521484375, 13.31982421875, 15.1181640625, 16.91650390625, 18.71484375, 20.51318359375, 22.3115234375, 24.10986328125, 25.908203125, 27.70654296875, 29.5048828125, 31.30322265625, 33.1015625, 34.89990234375, 36.6982421875, 38.49658203125, 40.294921875, 42.09326171875, 43.8916015625, 45.68994140625, 47.48828125, 49.28662109375, 51.0849609375, 52.88330078125, 54.681640625, 56.47998046875, 58.2783203125, 60.07666015625, 61.875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 6.0, 7.0, 10.0, 12.0, 17.0, 12.0, 20.0, 20.0, 28.0, 28.0, 24.0, 39.0, 40.0, 43.0, 37.0, 39.0, 42.0, 41.0, 45.0, 38.0, 53.0, 48.0, 42.0, 35.0, 26.0, 32.0, 42.0, 22.0, 19.0, 27.0, 23.0, 17.0, 14.0, 9.0, 17.0, 3.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.59375, -51.58349609375, -49.5732421875, -47.56298828125, -45.552734375, -43.54248046875, -41.5322265625, -39.52197265625, -37.51171875, -35.50146484375, -33.4912109375, -31.48095703125, -29.470703125, -27.46044921875, -25.4501953125, -23.43994140625, -21.4296875, -19.41943359375, -17.4091796875, -15.39892578125, -13.388671875, -11.37841796875, -9.3681640625, -7.35791015625, -5.34765625, -3.33740234375, -1.3271484375, 0.68310546875, 2.693359375, 4.70361328125, 6.7138671875, 8.72412109375, 10.734375, 12.74462890625, 14.7548828125, 16.76513671875, 18.775390625, 20.78564453125, 22.7958984375, 24.80615234375, 26.81640625, 28.82666015625, 30.8369140625, 32.84716796875, 34.857421875, 36.86767578125, 38.8779296875, 40.88818359375, 42.8984375, 44.90869140625, 46.9189453125, 48.92919921875, 50.939453125, 52.94970703125, 54.9599609375, 56.97021484375, 58.98046875, 60.99072265625, 63.0009765625, 65.01123046875, 67.021484375, 69.03173828125, 71.0419921875, 73.05224609375, 75.0625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 9.0, 20.0, 15.0, 28.0, 50.0, 58.0, 95.0, 175.0, 232.0, 394.0, 696.0, 1147.0, 1897.0, 3335.0, 5858.0, 10277.0, 17876.0, 30313.0, 49846.0, 76312.0, 106124.0, 132568.0, 144737.0, 136808.0, 112506.0, 82177.0, 54129.0, 33830.0, 19925.0, 11495.0, 6673.0, 3649.0, 2164.0, 1221.0, 720.0, 430.0, 254.0, 165.0, 137.0, 72.0, 46.0, 30.0, 15.0, 15.0, 11.0, 7.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0, 3.0], "bins": [-70.5625, -68.46240234375, -66.3623046875, -64.26220703125, -62.162109375, -60.06201171875, -57.9619140625, -55.86181640625, -53.76171875, -51.66162109375, -49.5615234375, -47.46142578125, -45.361328125, -43.26123046875, -41.1611328125, -39.06103515625, -36.9609375, -34.86083984375, -32.7607421875, -30.66064453125, -28.560546875, -26.46044921875, -24.3603515625, -22.26025390625, -20.16015625, -18.06005859375, -15.9599609375, -13.85986328125, -11.759765625, -9.65966796875, -7.5595703125, -5.45947265625, -3.359375, -1.25927734375, 0.8408203125, 2.94091796875, 5.041015625, 7.14111328125, 9.2412109375, 11.34130859375, 13.44140625, 15.54150390625, 17.6416015625, 19.74169921875, 21.841796875, 23.94189453125, 26.0419921875, 28.14208984375, 30.2421875, 32.34228515625, 34.4423828125, 36.54248046875, 38.642578125, 40.74267578125, 42.8427734375, 44.94287109375, 47.04296875, 49.14306640625, 51.2431640625, 53.34326171875, 55.443359375, 57.54345703125, 59.6435546875, 61.74365234375, 63.84375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 4.0, 10.0, 16.0, 17.0, 15.0, 22.0, 17.0, 24.0, 33.0, 29.0, 29.0, 35.0, 25.0, 44.0, 52.0, 46.0, 48.0, 48.0, 63.0, 37.0, 40.0, 34.0, 33.0, 36.0, 37.0, 29.0, 17.0, 21.0, 25.0, 24.0, 11.0, 18.0, 8.0, 9.0, 5.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-44.625, -43.2900390625, -41.955078125, -40.6201171875, -39.28515625, -37.9501953125, -36.615234375, -35.2802734375, -33.9453125, -32.6103515625, -31.275390625, -29.9404296875, -28.60546875, -27.2705078125, -25.935546875, -24.6005859375, -23.265625, -21.9306640625, -20.595703125, -19.2607421875, -17.92578125, -16.5908203125, -15.255859375, -13.9208984375, -12.5859375, -11.2509765625, -9.916015625, -8.5810546875, -7.24609375, -5.9111328125, -4.576171875, -3.2412109375, -1.90625, -0.5712890625, 0.763671875, 2.0986328125, 3.43359375, 4.7685546875, 6.103515625, 7.4384765625, 8.7734375, 10.1083984375, 11.443359375, 12.7783203125, 14.11328125, 15.4482421875, 16.783203125, 18.1181640625, 19.453125, 20.7880859375, 22.123046875, 23.4580078125, 24.79296875, 26.1279296875, 27.462890625, 28.7978515625, 30.1328125, 31.4677734375, 32.802734375, 34.1376953125, 35.47265625, 36.8076171875, 38.142578125, 39.4775390625, 40.8125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 9.0, 21.0, 21.0, 33.0, 69.0, 89.0, 150.0, 244.0, 399.0, 649.0, 997.0, 1658.0, 3078.0, 5311.0, 9758.0, 18873.0, 36113.0, 66712.0, 116137.0, 167339.0, 191749.0, 168234.0, 115608.0, 67664.0, 36050.0, 18911.0, 9883.0, 5299.0, 3039.0, 1727.0, 1047.0, 603.0, 379.0, 233.0, 164.0, 90.0, 75.0, 45.0, 26.0, 21.0, 21.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.578125, -24.711181640625, -23.84423828125, -22.977294921875, -22.1103515625, -21.243408203125, -20.37646484375, -19.509521484375, -18.642578125, -17.775634765625, -16.90869140625, -16.041748046875, -15.1748046875, -14.307861328125, -13.44091796875, -12.573974609375, -11.70703125, -10.840087890625, -9.97314453125, -9.106201171875, -8.2392578125, -7.372314453125, -6.50537109375, -5.638427734375, -4.771484375, -3.904541015625, -3.03759765625, -2.170654296875, -1.3037109375, -0.436767578125, 0.43017578125, 1.297119140625, 2.1640625, 3.031005859375, 3.89794921875, 4.764892578125, 5.6318359375, 6.498779296875, 7.36572265625, 8.232666015625, 9.099609375, 9.966552734375, 10.83349609375, 11.700439453125, 12.5673828125, 13.434326171875, 14.30126953125, 15.168212890625, 16.03515625, 16.902099609375, 17.76904296875, 18.635986328125, 19.5029296875, 20.369873046875, 21.23681640625, 22.103759765625, 22.970703125, 23.837646484375, 24.70458984375, 25.571533203125, 26.4384765625, 27.305419921875, 28.17236328125, 29.039306640625, 29.90625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 6.0, 6.0, 9.0, 5.0, 22.0, 17.0, 14.0, 22.0, 29.0, 27.0, 34.0, 34.0, 50.0, 35.0, 54.0, 51.0, 64.0, 55.0, 52.0, 50.0, 56.0, 43.0, 39.0, 33.0, 26.0, 24.0, 32.0, 21.0, 17.0, 12.0, 10.0, 8.0, 10.0, 6.0, 5.0, 10.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0024166107177734375, -0.0023413002490997314, -0.0022659897804260254, -0.0021906793117523193, -0.0021153688430786133, -0.0020400583744049072, -0.001964747905731201, -0.0018894374370574951, -0.001814126968383789, -0.001738816499710083, -0.001663506031036377, -0.001588195562362671, -0.0015128850936889648, -0.0014375746250152588, -0.0013622641563415527, -0.0012869536876678467, -0.0012116432189941406, -0.0011363327503204346, -0.0010610222816467285, -0.0009857118129730225, -0.0009104013442993164, -0.0008350908756256104, -0.0007597804069519043, -0.0006844699382781982, -0.0006091594696044922, -0.0005338490009307861, -0.0004585385322570801, -0.000383228063583374, -0.00030791759490966797, -0.00023260712623596191, -0.00015729665756225586, -8.19861888885498e-05, -6.67572021484375e-06, 6.86347484588623e-05, 0.00014394521713256836, 0.00021925568580627441, 0.00029456615447998047, 0.0003698766231536865, 0.0004451870918273926, 0.0005204975605010986, 0.0005958080291748047, 0.0006711184978485107, 0.0007464289665222168, 0.0008217394351959229, 0.0008970499038696289, 0.000972360372543335, 0.001047670841217041, 0.001122981309890747, 0.0011982917785644531, 0.0012736022472381592, 0.0013489127159118652, 0.0014242231845855713, 0.0014995336532592773, 0.0015748441219329834, 0.0016501545906066895, 0.0017254650592803955, 0.0018007755279541016, 0.0018760859966278076, 0.0019513964653015137, 0.0020267069339752197, 0.0021020174026489258, 0.002177327871322632, 0.002252638339996338, 0.002327948808670044, 0.00240325927734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 9.0, 8.0, 13.0, 21.0, 33.0, 44.0, 88.0, 134.0, 213.0, 312.0, 465.0, 740.0, 1141.0, 1815.0, 2802.0, 4334.0, 6985.0, 10980.0, 17648.0, 27088.0, 41986.0, 61827.0, 85937.0, 110041.0, 127232.0, 129828.0, 117323.0, 95160.0, 69609.0, 47287.0, 31578.0, 20409.0, 12921.0, 8158.0, 5285.0, 3249.0, 2050.0, 1320.0, 874.0, 577.0, 377.0, 220.0, 138.0, 102.0, 70.0, 51.0, 24.0, 20.0, 14.0, 10.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.234375, -16.6435546875, -16.052734375, -15.4619140625, -14.87109375, -14.2802734375, -13.689453125, -13.0986328125, -12.5078125, -11.9169921875, -11.326171875, -10.7353515625, -10.14453125, -9.5537109375, -8.962890625, -8.3720703125, -7.78125, -7.1904296875, -6.599609375, -6.0087890625, -5.41796875, -4.8271484375, -4.236328125, -3.6455078125, -3.0546875, -2.4638671875, -1.873046875, -1.2822265625, -0.69140625, -0.1005859375, 0.490234375, 1.0810546875, 1.671875, 2.2626953125, 2.853515625, 3.4443359375, 4.03515625, 4.6259765625, 5.216796875, 5.8076171875, 6.3984375, 6.9892578125, 7.580078125, 8.1708984375, 8.76171875, 9.3525390625, 9.943359375, 10.5341796875, 11.125, 11.7158203125, 12.306640625, 12.8974609375, 13.48828125, 14.0791015625, 14.669921875, 15.2607421875, 15.8515625, 16.4423828125, 17.033203125, 17.6240234375, 18.21484375, 18.8056640625, 19.396484375, 19.9873046875, 20.578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 8.0, 8.0, 12.0, 10.0, 9.0, 14.0, 16.0, 23.0, 31.0, 26.0, 28.0, 47.0, 38.0, 36.0, 53.0, 57.0, 41.0, 45.0, 43.0, 47.0, 51.0, 41.0, 41.0, 39.0, 34.0, 39.0, 23.0, 24.0, 20.0, 15.0, 11.0, 12.0, 8.0, 6.0, 9.0, 5.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.96875, -7.7108154296875, -7.452880859375, -7.1949462890625, -6.93701171875, -6.6790771484375, -6.421142578125, -6.1632080078125, -5.9052734375, -5.6473388671875, -5.389404296875, -5.1314697265625, -4.87353515625, -4.6156005859375, -4.357666015625, -4.0997314453125, -3.841796875, -3.5838623046875, -3.325927734375, -3.0679931640625, -2.81005859375, -2.5521240234375, -2.294189453125, -2.0362548828125, -1.7783203125, -1.5203857421875, -1.262451171875, -1.0045166015625, -0.74658203125, -0.4886474609375, -0.230712890625, 0.0272216796875, 0.28515625, 0.5430908203125, 0.801025390625, 1.0589599609375, 1.31689453125, 1.5748291015625, 1.832763671875, 2.0906982421875, 2.3486328125, 2.6065673828125, 2.864501953125, 3.1224365234375, 3.38037109375, 3.6383056640625, 3.896240234375, 4.1541748046875, 4.412109375, 4.6700439453125, 4.927978515625, 5.1859130859375, 5.44384765625, 5.7017822265625, 5.959716796875, 6.2176513671875, 6.4755859375, 6.7335205078125, 6.991455078125, 7.2493896484375, 7.50732421875, 7.7652587890625, 8.023193359375, 8.2811279296875, 8.5390625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 13.0, 6.0, 3.0, 7.0, 20.0, 25.0, 27.0, 26.0, 29.0, 51.0, 37.0, 53.0, 43.0, 51.0, 48.0, 46.0, 64.0, 52.0, 40.0, 43.0, 41.0, 43.0, 38.0, 30.0, 35.0, 21.0, 22.0, 18.0, 15.0, 8.0, 9.0, 9.0, 5.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-80.9693832397461, -78.72274780273438, -76.47611999511719, -74.22948455810547, -71.98284912109375, -69.73622131347656, -67.48958587646484, -65.24295043945312, -62.99632263183594, -60.749691009521484, -58.503055572509766, -56.25642395019531, -54.00979232788086, -51.763160705566406, -49.51652526855469, -47.269893646240234, -45.023258209228516, -42.77662658691406, -40.529991149902344, -38.28335952758789, -36.03672790527344, -33.79009246826172, -31.543460845947266, -29.296829223632812, -27.050195693969727, -24.80356216430664, -22.556930541992188, -20.3102970123291, -18.063663482666016, -15.817031860351562, -13.570398330688477, -11.323765754699707, -9.077136993408203, -6.830504417419434, -4.583871364593506, -2.337238311767578, -0.0906057357788086, 2.156026840209961, 4.402660369873047, 6.649292945861816, 8.895925521850586, 11.142558097839355, 13.389190673828125, 15.635824203491211, 17.882457733154297, 20.12908935546875, 22.375722885131836, 24.622356414794922, 26.868988037109375, 29.11562156677246, 31.362253189086914, 33.60888671875, 35.85551834106445, 38.102149963378906, 40.348785400390625, 42.59541702270508, 44.84204864501953, 47.088680267333984, 49.3353157043457, 51.581947326660156, 53.82857894897461, 56.07521057128906, 58.32184600830078, 60.568477630615234, 62.81511306762695]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 0.0, 7.0, 5.0, 6.0, 11.0, 10.0, 14.0, 14.0, 19.0, 20.0, 16.0, 24.0, 19.0, 29.0, 25.0, 28.0, 41.0, 28.0, 32.0, 34.0, 38.0, 34.0, 35.0, 50.0, 42.0, 32.0, 40.0, 52.0, 38.0, 32.0, 20.0, 30.0, 22.0, 21.0, 20.0, 17.0, 11.0, 20.0, 7.0, 14.0, 8.0, 6.0, 9.0, 14.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.210289001464844, -47.3166389465332, -45.42298889160156, -43.52933883666992, -41.63568878173828, -39.74203872680664, -37.848388671875, -35.95473861694336, -34.06108856201172, -32.16743850708008, -30.273788452148438, -28.380138397216797, -26.486488342285156, -24.592838287353516, -22.699188232421875, -20.805538177490234, -18.911888122558594, -17.018238067626953, -15.124588012695312, -13.230937957763672, -11.337287902832031, -9.44363784790039, -7.54998779296875, -5.656337738037109, -3.7626876831054688, -1.8690376281738281, 0.0246124267578125, 1.9182624816894531, 3.8119125366210938, 5.705562591552734, 7.599212646484375, 9.492862701416016, 11.386512756347656, 13.280162811279297, 15.173812866210938, 17.067462921142578, 18.96111297607422, 20.85476303100586, 22.7484130859375, 24.64206314086914, 26.53571319580078, 28.429363250732422, 30.323013305664062, 32.2166633605957, 34.110313415527344, 36.003963470458984, 37.897613525390625, 39.791263580322266, 41.684913635253906, 43.57856369018555, 45.47221374511719, 47.36586380004883, 49.25951385498047, 51.15316390991211, 53.04681396484375, 54.94046401977539, 56.83411407470703, 58.72776412963867, 60.62141418457031, 62.51506423950195, 64.4087142944336, 66.3023681640625, 68.19601440429688, 70.08966064453125, 71.98331451416016]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 4.0, 8.0, 14.0, 37.0, 78.0, 105.0, 185.0, 367.0, 622.0, 1072.0, 1786.0, 3272.0, 5462.0, 9482.0, 16255.0, 27320.0, 46254.0, 76401.0, 123816.0, 192599.0, 287775.0, 396848.0, 494906.0, 548059.0, 528717.0, 449178.0, 342064.0, 238779.0, 156122.0, 97683.0, 60333.0, 36029.0, 21283.0, 12538.0, 7570.0, 4350.0, 2751.0, 1596.0, 989.0, 585.0, 392.0, 231.0, 124.0, 77.0, 65.0, 42.0, 21.0, 13.0, 13.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-49.21875, -47.56494140625, -45.9111328125, -44.25732421875, -42.603515625, -40.94970703125, -39.2958984375, -37.64208984375, -35.98828125, -34.33447265625, -32.6806640625, -31.02685546875, -29.373046875, -27.71923828125, -26.0654296875, -24.41162109375, -22.7578125, -21.10400390625, -19.4501953125, -17.79638671875, -16.142578125, -14.48876953125, -12.8349609375, -11.18115234375, -9.52734375, -7.87353515625, -6.2197265625, -4.56591796875, -2.912109375, -1.25830078125, 0.3955078125, 2.04931640625, 3.703125, 5.35693359375, 7.0107421875, 8.66455078125, 10.318359375, 11.97216796875, 13.6259765625, 15.27978515625, 16.93359375, 18.58740234375, 20.2412109375, 21.89501953125, 23.548828125, 25.20263671875, 26.8564453125, 28.51025390625, 30.1640625, 31.81787109375, 33.4716796875, 35.12548828125, 36.779296875, 38.43310546875, 40.0869140625, 41.74072265625, 43.39453125, 45.04833984375, 46.7021484375, 48.35595703125, 50.009765625, 51.66357421875, 53.3173828125, 54.97119140625, 56.625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 2.0, 9.0, 12.0, 18.0, 12.0, 15.0, 18.0, 26.0, 22.0, 19.0, 28.0, 32.0, 31.0, 33.0, 34.0, 41.0, 39.0, 37.0, 34.0, 50.0, 42.0, 40.0, 33.0, 58.0, 36.0, 32.0, 37.0, 24.0, 25.0, 27.0, 15.0, 16.0, 16.0, 14.0, 16.0, 11.0, 4.0, 11.0, 8.0, 9.0, 7.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0, -45.2353515625, -43.470703125, -41.7060546875, -39.94140625, -38.1767578125, -36.412109375, -34.6474609375, -32.8828125, -31.1181640625, -29.353515625, -27.5888671875, -25.82421875, -24.0595703125, -22.294921875, -20.5302734375, -18.765625, -17.0009765625, -15.236328125, -13.4716796875, -11.70703125, -9.9423828125, -8.177734375, -6.4130859375, -4.6484375, -2.8837890625, -1.119140625, 0.6455078125, 2.41015625, 4.1748046875, 5.939453125, 7.7041015625, 9.46875, 11.2333984375, 12.998046875, 14.7626953125, 16.52734375, 18.2919921875, 20.056640625, 21.8212890625, 23.5859375, 25.3505859375, 27.115234375, 28.8798828125, 30.64453125, 32.4091796875, 34.173828125, 35.9384765625, 37.703125, 39.4677734375, 41.232421875, 42.9970703125, 44.76171875, 46.5263671875, 48.291015625, 50.0556640625, 51.8203125, 53.5849609375, 55.349609375, 57.1142578125, 58.87890625, 60.6435546875, 62.408203125, 64.1728515625, 65.9375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 18.0, 20.0, 38.0, 61.0, 70.0, 127.0, 217.0, 347.0, 554.0, 850.0, 1461.0, 2496.0, 4118.0, 6591.0, 10900.0, 17607.0, 28185.0, 45196.0, 70206.0, 106360.0, 158942.0, 222483.0, 298108.0, 376806.0, 437719.0, 467376.0, 452248.0, 398707.0, 324433.0, 246083.0, 176631.0, 121236.0, 80127.0, 51918.0, 33282.0, 20410.0, 12422.0, 7885.0, 4689.0, 2832.0, 1783.0, 1063.0, 658.0, 394.0, 230.0, 159.0, 94.0, 50.0, 29.0, 26.0, 14.0, 11.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-50.625, -49.02587890625, -47.4267578125, -45.82763671875, -44.228515625, -42.62939453125, -41.0302734375, -39.43115234375, -37.83203125, -36.23291015625, -34.6337890625, -33.03466796875, -31.435546875, -29.83642578125, -28.2373046875, -26.63818359375, -25.0390625, -23.43994140625, -21.8408203125, -20.24169921875, -18.642578125, -17.04345703125, -15.4443359375, -13.84521484375, -12.24609375, -10.64697265625, -9.0478515625, -7.44873046875, -5.849609375, -4.25048828125, -2.6513671875, -1.05224609375, 0.546875, 2.14599609375, 3.7451171875, 5.34423828125, 6.943359375, 8.54248046875, 10.1416015625, 11.74072265625, 13.33984375, 14.93896484375, 16.5380859375, 18.13720703125, 19.736328125, 21.33544921875, 22.9345703125, 24.53369140625, 26.1328125, 27.73193359375, 29.3310546875, 30.93017578125, 32.529296875, 34.12841796875, 35.7275390625, 37.32666015625, 38.92578125, 40.52490234375, 42.1240234375, 43.72314453125, 45.322265625, 46.92138671875, 48.5205078125, 50.11962890625, 51.71875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 4.0, 12.0, 20.0, 21.0, 23.0, 23.0, 43.0, 38.0, 53.0, 57.0, 57.0, 84.0, 103.0, 105.0, 154.0, 161.0, 150.0, 206.0, 198.0, 199.0, 214.0, 258.0, 215.0, 197.0, 197.0, 190.0, 143.0, 144.0, 143.0, 114.0, 108.0, 83.0, 76.0, 55.0, 43.0, 41.0, 38.0, 27.0, 18.0, 16.0, 7.0, 13.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0], "bins": [-27.703125, -26.891357421875, -26.07958984375, -25.267822265625, -24.4560546875, -23.644287109375, -22.83251953125, -22.020751953125, -21.208984375, -20.397216796875, -19.58544921875, -18.773681640625, -17.9619140625, -17.150146484375, -16.33837890625, -15.526611328125, -14.71484375, -13.903076171875, -13.09130859375, -12.279541015625, -11.4677734375, -10.656005859375, -9.84423828125, -9.032470703125, -8.220703125, -7.408935546875, -6.59716796875, -5.785400390625, -4.9736328125, -4.161865234375, -3.35009765625, -2.538330078125, -1.7265625, -0.914794921875, -0.10302734375, 0.708740234375, 1.5205078125, 2.332275390625, 3.14404296875, 3.955810546875, 4.767578125, 5.579345703125, 6.39111328125, 7.202880859375, 8.0146484375, 8.826416015625, 9.63818359375, 10.449951171875, 11.26171875, 12.073486328125, 12.88525390625, 13.697021484375, 14.5087890625, 15.320556640625, 16.13232421875, 16.944091796875, 17.755859375, 18.567626953125, 19.37939453125, 20.191162109375, 21.0029296875, 21.814697265625, 22.62646484375, 23.438232421875, 24.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 9.0, 13.0, 9.0, 11.0, 19.0, 14.0, 15.0, 13.0, 30.0, 26.0, 25.0, 28.0, 22.0, 35.0, 43.0, 53.0, 29.0, 38.0, 38.0, 41.0, 26.0, 43.0, 24.0, 32.0, 35.0, 33.0, 22.0, 26.0, 26.0, 25.0, 32.0, 18.0, 19.0, 20.0, 19.0, 12.0, 16.0, 14.0, 10.0, 3.0, 8.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-59.39789962768555, -57.643192291259766, -55.888484954833984, -54.1337776184082, -52.37907028198242, -50.62436294555664, -48.869659423828125, -47.114952087402344, -45.36024475097656, -43.60553741455078, -41.850830078125, -40.09612274169922, -38.34141540527344, -36.586708068847656, -34.832000732421875, -33.077293395996094, -31.322586059570312, -29.56787872314453, -27.81317138671875, -26.05846405029297, -24.303756713867188, -22.549049377441406, -20.794343948364258, -19.039636611938477, -17.284929275512695, -15.530221939086914, -13.775514602661133, -12.020808219909668, -10.266100883483887, -8.511393547058105, -6.756687164306641, -5.001979827880859, -3.2472763061523438, -1.4925692081451416, 0.26213788986206055, 2.0168447494506836, 3.771552085876465, 5.526259422302246, 7.280965805053711, 9.035673141479492, 10.790380477905273, 12.545087814331055, 14.299795150756836, 16.054500579833984, 17.809207916259766, 19.563915252685547, 21.318622589111328, 23.07332992553711, 24.82803726196289, 26.582744598388672, 28.337451934814453, 30.092159271240234, 31.846866607666016, 33.6015739440918, 35.35627746582031, 37.110984802246094, 38.865692138671875, 40.620399475097656, 42.37510681152344, 44.12981414794922, 45.884521484375, 47.63922882080078, 49.39393615722656, 51.148643493652344, 52.903350830078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 7.0, 3.0, 8.0, 5.0, 12.0, 9.0, 9.0, 16.0, 15.0, 22.0, 14.0, 24.0, 24.0, 30.0, 27.0, 35.0, 46.0, 46.0, 34.0, 31.0, 33.0, 41.0, 52.0, 33.0, 43.0, 44.0, 38.0, 25.0, 29.0, 34.0, 32.0, 27.0, 21.0, 17.0, 14.0, 17.0, 21.0, 8.0, 8.0, 12.0, 4.0, 12.0, 4.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.15023422241211, -52.22712326049805, -50.30400848388672, -48.380897521972656, -46.457786560058594, -44.53467559814453, -42.61156463623047, -40.68844985961914, -38.76533889770508, -36.842227935791016, -34.91911315917969, -32.996002197265625, -31.072891235351562, -29.1497802734375, -27.226667404174805, -25.30355453491211, -23.380443572998047, -21.457332611083984, -19.53421974182129, -17.611106872558594, -15.687995910644531, -13.764883995056152, -11.841772079467773, -9.918660163879395, -7.995548248291016, -6.072436332702637, -4.149324417114258, -2.226212501525879, -0.3031005859375, 1.620011329650879, 3.543123245239258, 5.466235160827637, 7.389350891113281, 9.31246280670166, 11.235574722290039, 13.158686637878418, 15.081798553466797, 17.00490951538086, 18.928022384643555, 20.85113525390625, 22.774246215820312, 24.697357177734375, 26.62047004699707, 28.543582916259766, 30.466693878173828, 32.38980484008789, 34.31291961669922, 36.23603057861328, 38.159141540527344, 40.082252502441406, 42.00536346435547, 43.9284782409668, 45.85158920288086, 47.77470016479492, 49.69781494140625, 51.62092590332031, 53.544036865234375, 55.46714782714844, 57.3902587890625, 59.31337356567383, 61.23648452758789, 63.15959548950195, 65.08271026611328, 67.00582122802734, 68.9289321899414]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 13.0, 14.0, 33.0, 43.0, 96.0, 114.0, 161.0, 321.0, 391.0, 664.0, 1039.0, 1594.0, 2375.0, 3608.0, 5380.0, 8190.0, 12297.0, 17823.0, 25515.0, 36011.0, 47812.0, 62428.0, 77262.0, 89817.0, 97215.0, 99835.0, 95552.0, 85812.0, 72442.0, 57470.0, 43955.0, 32337.0, 22960.0, 15866.0, 10802.0, 7350.0, 4857.0, 3199.0, 2036.0, 1370.0, 865.0, 593.0, 372.0, 228.0, 152.0, 105.0, 62.0, 47.0, 28.0, 15.0, 12.0, 4.0, 9.0, 2.0, 0.0, 1.0, 2.0], "bins": [-25.859375, -25.059814453125, -24.26025390625, -23.460693359375, -22.6611328125, -21.861572265625, -21.06201171875, -20.262451171875, -19.462890625, -18.663330078125, -17.86376953125, -17.064208984375, -16.2646484375, -15.465087890625, -14.66552734375, -13.865966796875, -13.06640625, -12.266845703125, -11.46728515625, -10.667724609375, -9.8681640625, -9.068603515625, -8.26904296875, -7.469482421875, -6.669921875, -5.870361328125, -5.07080078125, -4.271240234375, -3.4716796875, -2.672119140625, -1.87255859375, -1.072998046875, -0.2734375, 0.526123046875, 1.32568359375, 2.125244140625, 2.9248046875, 3.724365234375, 4.52392578125, 5.323486328125, 6.123046875, 6.922607421875, 7.72216796875, 8.521728515625, 9.3212890625, 10.120849609375, 10.92041015625, 11.719970703125, 12.51953125, 13.319091796875, 14.11865234375, 14.918212890625, 15.7177734375, 16.517333984375, 17.31689453125, 18.116455078125, 18.916015625, 19.715576171875, 20.51513671875, 21.314697265625, 22.1142578125, 22.913818359375, 23.71337890625, 24.512939453125, 25.3125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 7.0, 5.0, 5.0, 5.0, 12.0, 11.0, 11.0, 16.0, 14.0, 20.0, 19.0, 24.0, 19.0, 34.0, 28.0, 39.0, 44.0, 42.0, 34.0, 29.0, 35.0, 43.0, 54.0, 30.0, 44.0, 43.0, 34.0, 24.0, 34.0, 30.0, 37.0, 26.0, 17.0, 15.0, 16.0, 18.0, 17.0, 9.0, 10.0, 9.0, 5.0, 12.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.53125, -52.58544921875, -50.6396484375, -48.69384765625, -46.748046875, -44.80224609375, -42.8564453125, -40.91064453125, -38.96484375, -37.01904296875, -35.0732421875, -33.12744140625, -31.181640625, -29.23583984375, -27.2900390625, -25.34423828125, -23.3984375, -21.45263671875, -19.5068359375, -17.56103515625, -15.615234375, -13.66943359375, -11.7236328125, -9.77783203125, -7.83203125, -5.88623046875, -3.9404296875, -1.99462890625, -0.048828125, 1.89697265625, 3.8427734375, 5.78857421875, 7.734375, 9.68017578125, 11.6259765625, 13.57177734375, 15.517578125, 17.46337890625, 19.4091796875, 21.35498046875, 23.30078125, 25.24658203125, 27.1923828125, 29.13818359375, 31.083984375, 33.02978515625, 34.9755859375, 36.92138671875, 38.8671875, 40.81298828125, 42.7587890625, 44.70458984375, 46.650390625, 48.59619140625, 50.5419921875, 52.48779296875, 54.43359375, 56.37939453125, 58.3251953125, 60.27099609375, 62.216796875, 64.16259765625, 66.1083984375, 68.05419921875, 70.0]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 14.0, 25.0, 28.0, 59.0, 104.0, 153.0, 255.0, 385.0, 690.0, 1088.0, 1680.0, 2699.0, 4448.0, 7208.0, 11488.0, 18255.0, 30632.0, 290415.0, 589939.0, 35324.0, 20022.0, 12766.0, 7962.0, 4826.0, 3078.0, 1957.0, 1142.0, 705.0, 476.0, 281.0, 173.0, 102.0, 68.0, 34.0, 32.0, 7.0, 10.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-65.5, -63.4599609375, -61.419921875, -59.3798828125, -57.33984375, -55.2998046875, -53.259765625, -51.2197265625, -49.1796875, -47.1396484375, -45.099609375, -43.0595703125, -41.01953125, -38.9794921875, -36.939453125, -34.8994140625, -32.859375, -30.8193359375, -28.779296875, -26.7392578125, -24.69921875, -22.6591796875, -20.619140625, -18.5791015625, -16.5390625, -14.4990234375, -12.458984375, -10.4189453125, -8.37890625, -6.3388671875, -4.298828125, -2.2587890625, -0.21875, 1.8212890625, 3.861328125, 5.9013671875, 7.94140625, 9.9814453125, 12.021484375, 14.0615234375, 16.1015625, 18.1416015625, 20.181640625, 22.2216796875, 24.26171875, 26.3017578125, 28.341796875, 30.3818359375, 32.421875, 34.4619140625, 36.501953125, 38.5419921875, 40.58203125, 42.6220703125, 44.662109375, 46.7021484375, 48.7421875, 50.7822265625, 52.822265625, 54.8623046875, 56.90234375, 58.9423828125, 60.982421875, 63.0224609375, 65.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 8.0, 5.0, 9.0, 8.0, 11.0, 13.0, 26.0, 22.0, 19.0, 23.0, 21.0, 19.0, 33.0, 30.0, 29.0, 25.0, 36.0, 40.0, 27.0, 19.0, 37.0, 43.0, 35.0, 44.0, 39.0, 39.0, 49.0, 33.0, 33.0, 32.0, 26.0, 18.0, 15.0, 29.0, 20.0, 16.0, 18.0, 7.0, 12.0, 7.0, 6.0, 6.0, 3.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.65625, -43.236328125, -41.81640625, -40.396484375, -38.9765625, -37.556640625, -36.13671875, -34.716796875, -33.296875, -31.876953125, -30.45703125, -29.037109375, -27.6171875, -26.197265625, -24.77734375, -23.357421875, -21.9375, -20.517578125, -19.09765625, -17.677734375, -16.2578125, -14.837890625, -13.41796875, -11.998046875, -10.578125, -9.158203125, -7.73828125, -6.318359375, -4.8984375, -3.478515625, -2.05859375, -0.638671875, 0.78125, 2.201171875, 3.62109375, 5.041015625, 6.4609375, 7.880859375, 9.30078125, 10.720703125, 12.140625, 13.560546875, 14.98046875, 16.400390625, 17.8203125, 19.240234375, 20.66015625, 22.080078125, 23.5, 24.919921875, 26.33984375, 27.759765625, 29.1796875, 30.599609375, 32.01953125, 33.439453125, 34.859375, 36.279296875, 37.69921875, 39.119140625, 40.5390625, 41.958984375, 43.37890625, 44.798828125, 46.21875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 11.0, 17.0, 16.0, 20.0, 34.0, 30.0, 55.0, 73.0, 93.0, 128.0, 201.0, 288.0, 414.0, 567.0, 832.0, 1202.0, 1978.0, 2967.0, 4580.0, 7203.0, 12228.0, 21373.0, 49879.0, 712994.0, 161159.0, 28935.0, 15589.0, 9273.0, 5800.0, 3625.0, 2216.0, 1541.0, 1018.0, 695.0, 436.0, 308.0, 208.0, 150.0, 138.0, 78.0, 55.0, 46.0, 27.0, 21.0, 12.0, 11.0, 12.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.15234375, -4.0126953125, -3.873046875, -3.7333984375, -3.59375, -3.4541015625, -3.314453125, -3.1748046875, -3.03515625, -2.8955078125, -2.755859375, -2.6162109375, -2.4765625, -2.3369140625, -2.197265625, -2.0576171875, -1.91796875, -1.7783203125, -1.638671875, -1.4990234375, -1.359375, -1.2197265625, -1.080078125, -0.9404296875, -0.80078125, -0.6611328125, -0.521484375, -0.3818359375, -0.2421875, -0.1025390625, 0.037109375, 0.1767578125, 0.31640625, 0.4560546875, 0.595703125, 0.7353515625, 0.875, 1.0146484375, 1.154296875, 1.2939453125, 1.43359375, 1.5732421875, 1.712890625, 1.8525390625, 1.9921875, 2.1318359375, 2.271484375, 2.4111328125, 2.55078125, 2.6904296875, 2.830078125, 2.9697265625, 3.109375, 3.2490234375, 3.388671875, 3.5283203125, 3.66796875, 3.8076171875, 3.947265625, 4.0869140625, 4.2265625, 4.3662109375, 4.505859375, 4.6455078125, 4.78515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 5.0, 8.0, 13.0, 12.0, 11.0, 15.0, 14.0, 31.0, 29.0, 27.0, 37.0, 40.0, 30.0, 56.0, 51.0, 72.0, 52.0, 56.0, 54.0, 43.0, 42.0, 50.0, 34.0, 33.0, 35.0, 29.0, 22.0, 21.0, 17.0, 14.0, 12.0, 8.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007371902465820312, -0.0007062405347824097, -0.0006752908229827881, -0.0006443411111831665, -0.0006133913993835449, -0.0005824416875839233, -0.0005514919757843018, -0.0005205422639846802, -0.0004895925521850586, -0.000458642840385437, -0.00042769312858581543, -0.00039674341678619385, -0.00036579370498657227, -0.0003348439931869507, -0.0003038942813873291, -0.0002729445695877075, -0.00024199485778808594, -0.00021104514598846436, -0.00018009543418884277, -0.0001491457223892212, -0.00011819601058959961, -8.724629878997803e-05, -5.6296586990356445e-05, -2.5346875190734863e-05, 5.602836608886719e-06, 3.65525484085083e-05, 6.750226020812988e-05, 9.845197200775146e-05, 0.00012940168380737305, 0.00016035139560699463, 0.0001913011074066162, 0.0002222508192062378, 0.0002532005310058594, 0.00028415024280548096, 0.00031509995460510254, 0.0003460496664047241, 0.0003769993782043457, 0.0004079490900039673, 0.00043889880180358887, 0.00046984851360321045, 0.000500798225402832, 0.0005317479372024536, 0.0005626976490020752, 0.0005936473608016968, 0.0006245970726013184, 0.0006555467844009399, 0.0006864964962005615, 0.0007174462080001831, 0.0007483959197998047, 0.0007793456315994263, 0.0008102953433990479, 0.0008412450551986694, 0.000872194766998291, 0.0009031444787979126, 0.0009340941905975342, 0.0009650439023971558, 0.0009959936141967773, 0.001026943325996399, 0.0010578930377960205, 0.001088842749595642, 0.0011197924613952637, 0.0011507421731948853, 0.0011816918849945068, 0.0012126415967941284, 0.00124359130859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 7.0, 11.0, 18.0, 36.0, 47.0, 44.0, 72.0, 129.0, 169.0, 329.0, 462.0, 918.0, 1639.0, 2957.0, 5474.0, 9860.0, 18464.0, 33899.0, 60495.0, 99951.0, 144459.0, 173684.0, 167542.0, 130692.0, 84932.0, 50667.0, 27940.0, 15214.0, 8239.0, 4471.0, 2399.0, 1373.0, 727.0, 415.0, 285.0, 172.0, 115.0, 80.0, 59.0, 30.0, 19.0, 19.0, 6.0, 11.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.1640625, -3.070556640625, -2.97705078125, -2.883544921875, -2.7900390625, -2.696533203125, -2.60302734375, -2.509521484375, -2.416015625, -2.322509765625, -2.22900390625, -2.135498046875, -2.0419921875, -1.948486328125, -1.85498046875, -1.761474609375, -1.66796875, -1.574462890625, -1.48095703125, -1.387451171875, -1.2939453125, -1.200439453125, -1.10693359375, -1.013427734375, -0.919921875, -0.826416015625, -0.73291015625, -0.639404296875, -0.5458984375, -0.452392578125, -0.35888671875, -0.265380859375, -0.171875, -0.078369140625, 0.01513671875, 0.108642578125, 0.2021484375, 0.295654296875, 0.38916015625, 0.482666015625, 0.576171875, 0.669677734375, 0.76318359375, 0.856689453125, 0.9501953125, 1.043701171875, 1.13720703125, 1.230712890625, 1.32421875, 1.417724609375, 1.51123046875, 1.604736328125, 1.6982421875, 1.791748046875, 1.88525390625, 1.978759765625, 2.072265625, 2.165771484375, 2.25927734375, 2.352783203125, 2.4462890625, 2.539794921875, 2.63330078125, 2.726806640625, 2.8203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 11.0, 14.0, 13.0, 13.0, 27.0, 13.0, 30.0, 27.0, 18.0, 29.0, 37.0, 24.0, 39.0, 31.0, 33.0, 37.0, 40.0, 48.0, 44.0, 45.0, 45.0, 44.0, 31.0, 22.0, 43.0, 32.0, 22.0, 28.0, 24.0, 9.0, 16.0, 13.0, 11.0, 14.0, 20.0, 5.0, 4.0, 8.0, 8.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.88916015625, -0.8568801879882812, -0.8246002197265625, -0.7923202514648438, -0.760040283203125, -0.7277603149414062, -0.6954803466796875, -0.6632003784179688, -0.63092041015625, -0.5986404418945312, -0.5663604736328125, -0.5340805053710938, -0.501800537109375, -0.46952056884765625, -0.4372406005859375, -0.40496063232421875, -0.3726806640625, -0.34040069580078125, -0.3081207275390625, -0.27584075927734375, -0.243560791015625, -0.21128082275390625, -0.1790008544921875, -0.14672088623046875, -0.11444091796875, -0.08216094970703125, -0.0498809814453125, -0.01760101318359375, 0.014678955078125, 0.04695892333984375, 0.0792388916015625, 0.11151885986328125, 0.143798828125, 0.17607879638671875, 0.2083587646484375, 0.24063873291015625, 0.272918701171875, 0.30519866943359375, 0.3374786376953125, 0.36975860595703125, 0.40203857421875, 0.43431854248046875, 0.4665985107421875, 0.49887847900390625, 0.531158447265625, 0.5634384155273438, 0.5957183837890625, 0.6279983520507812, 0.6602783203125, 0.6925582885742188, 0.7248382568359375, 0.7571182250976562, 0.789398193359375, 0.8216781616210938, 0.8539581298828125, 0.8862380981445312, 0.91851806640625, 0.9507980346679688, 0.9830780029296875, 1.0153579711914062, 1.047637939453125, 1.0799179077148438, 1.1121978759765625, 1.1444778442382812, 1.1767578125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 3.0, 4.0, 5.0, 14.0, 12.0, 5.0, 14.0, 16.0, 22.0, 16.0, 13.0, 29.0, 25.0, 29.0, 24.0, 32.0, 30.0, 40.0, 45.0, 36.0, 35.0, 31.0, 54.0, 45.0, 37.0, 25.0, 17.0, 34.0, 29.0, 27.0, 34.0, 23.0, 24.0, 23.0, 29.0, 15.0, 18.0, 12.0, 15.0, 10.0, 7.0, 15.0, 7.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-61.922672271728516, -60.123634338378906, -58.32460021972656, -56.52556228637695, -54.726524353027344, -52.927486419677734, -51.128448486328125, -49.32941436767578, -47.53037643432617, -45.73133850097656, -43.93230438232422, -42.13326644897461, -40.334228515625, -38.53519058227539, -36.73615264892578, -34.93711853027344, -33.13808059692383, -31.33904266357422, -29.540006637573242, -27.740970611572266, -25.941932678222656, -24.142894744873047, -22.34385871887207, -20.544822692871094, -18.745784759521484, -16.946746826171875, -15.147710800170898, -13.348673820495605, -11.549636840820312, -9.75059986114502, -7.951562881469727, -6.152525901794434, -4.353485107421875, -2.554448127746582, -0.7554111480712891, 1.043625831604004, 2.842662811279297, 4.64169979095459, 6.440736770629883, 8.239773750305176, 10.038810729980469, 11.837847709655762, 13.636884689331055, 15.435921669006348, 17.23495864868164, 19.03399658203125, 20.833032608032227, 22.632068634033203, 24.431106567382812, 26.230144500732422, 28.0291805267334, 29.828216552734375, 31.627254486083984, 33.426292419433594, 35.22532653808594, 37.02436447143555, 38.823402404785156, 40.622440338134766, 42.421478271484375, 44.22051239013672, 46.01955032348633, 47.81858825683594, 49.61762237548828, 51.41666030883789, 53.2156982421875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 5.0, 6.0, 9.0, 6.0, 12.0, 12.0, 21.0, 16.0, 12.0, 19.0, 24.0, 24.0, 30.0, 31.0, 35.0, 46.0, 41.0, 38.0, 27.0, 30.0, 41.0, 52.0, 36.0, 48.0, 31.0, 41.0, 28.0, 30.0, 39.0, 24.0, 24.0, 21.0, 16.0, 12.0, 23.0, 11.0, 14.0, 6.0, 15.0, 8.0, 7.0, 5.0, 5.0, 7.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.10070037841797, -52.170501708984375, -50.24030303955078, -48.31010818481445, -46.37990951538086, -44.449710845947266, -42.51951599121094, -40.589317321777344, -38.65911865234375, -36.728919982910156, -34.79872131347656, -32.868526458740234, -30.93832778930664, -29.008129119873047, -27.077932357788086, -25.147735595703125, -23.21753692626953, -21.287338256835938, -19.357141494750977, -17.426944732666016, -15.496746063232422, -13.566548347473145, -11.636350631713867, -9.70615291595459, -7.7759552001953125, -5.845757484436035, -3.915559768676758, -1.9853620529174805, -0.055164337158203125, 1.8750333786010742, 3.8052310943603516, 5.735428810119629, 7.665626525878906, 9.595824241638184, 11.526021957397461, 13.456219673156738, 15.386417388916016, 17.31661605834961, 19.24681282043457, 21.17700958251953, 23.107208251953125, 25.03740692138672, 26.96760368347168, 28.89780044555664, 30.827999114990234, 32.75819778442383, 34.688392639160156, 36.61859130859375, 38.548789978027344, 40.47898864746094, 42.40918731689453, 44.33938217163086, 46.26958084106445, 48.19977951049805, 50.129974365234375, 52.06017303466797, 53.99037170410156, 55.920570373535156, 57.85076904296875, 59.78096389770508, 61.71116256713867, 63.641361236572266, 65.5715560913086, 67.50175476074219, 69.43195343017578]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 11.0, 23.0, 32.0, 45.0, 93.0, 154.0, 263.0, 482.0, 836.0, 1606.0, 2889.0, 5478.0, 10367.0, 18643.0, 32824.0, 54837.0, 85412.0, 118716.0, 145552.0, 151630.0, 136410.0, 105598.0, 72402.0, 45511.0, 26568.0, 14945.0, 7973.0, 4194.0, 2243.0, 1265.0, 652.0, 363.0, 209.0, 127.0, 76.0, 51.0, 33.0, 19.0, 10.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0, -67.8330078125, -65.666015625, -63.4990234375, -61.33203125, -59.1650390625, -56.998046875, -54.8310546875, -52.6640625, -50.4970703125, -48.330078125, -46.1630859375, -43.99609375, -41.8291015625, -39.662109375, -37.4951171875, -35.328125, -33.1611328125, -30.994140625, -28.8271484375, -26.66015625, -24.4931640625, -22.326171875, -20.1591796875, -17.9921875, -15.8251953125, -13.658203125, -11.4912109375, -9.32421875, -7.1572265625, -4.990234375, -2.8232421875, -0.65625, 1.5107421875, 3.677734375, 5.8447265625, 8.01171875, 10.1787109375, 12.345703125, 14.5126953125, 16.6796875, 18.8466796875, 21.013671875, 23.1806640625, 25.34765625, 27.5146484375, 29.681640625, 31.8486328125, 34.015625, 36.1826171875, 38.349609375, 40.5166015625, 42.68359375, 44.8505859375, 47.017578125, 49.1845703125, 51.3515625, 53.5185546875, 55.685546875, 57.8525390625, 60.01953125, 62.1865234375, 64.353515625, 66.5205078125, 68.6875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 6.0, 9.0, 5.0, 10.0, 14.0, 19.0, 17.0, 13.0, 22.0, 19.0, 28.0, 26.0, 32.0, 32.0, 47.0, 36.0, 43.0, 28.0, 35.0, 39.0, 44.0, 45.0, 36.0, 42.0, 40.0, 29.0, 34.0, 30.0, 34.0, 24.0, 16.0, 17.0, 12.0, 20.0, 14.0, 12.0, 9.0, 14.0, 8.0, 7.0, 4.0, 7.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.65625, -49.81591796875, -47.9755859375, -46.13525390625, -44.294921875, -42.45458984375, -40.6142578125, -38.77392578125, -36.93359375, -35.09326171875, -33.2529296875, -31.41259765625, -29.572265625, -27.73193359375, -25.8916015625, -24.05126953125, -22.2109375, -20.37060546875, -18.5302734375, -16.68994140625, -14.849609375, -13.00927734375, -11.1689453125, -9.32861328125, -7.48828125, -5.64794921875, -3.8076171875, -1.96728515625, -0.126953125, 1.71337890625, 3.5537109375, 5.39404296875, 7.234375, 9.07470703125, 10.9150390625, 12.75537109375, 14.595703125, 16.43603515625, 18.2763671875, 20.11669921875, 21.95703125, 23.79736328125, 25.6376953125, 27.47802734375, 29.318359375, 31.15869140625, 32.9990234375, 34.83935546875, 36.6796875, 38.52001953125, 40.3603515625, 42.20068359375, 44.041015625, 45.88134765625, 47.7216796875, 49.56201171875, 51.40234375, 53.24267578125, 55.0830078125, 56.92333984375, 58.763671875, 60.60400390625, 62.4443359375, 64.28466796875, 66.125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 5.0, 10.0, 6.0, 10.0, 10.0, 21.0, 43.0, 56.0, 84.0, 132.0, 191.0, 305.0, 509.0, 760.0, 1236.0, 1933.0, 3208.0, 5043.0, 7806.0, 12221.0, 18696.0, 28069.0, 40598.0, 56324.0, 75794.0, 93522.0, 107699.0, 114245.0, 109883.0, 97445.0, 79486.0, 61035.0, 43802.0, 30917.0, 20492.0, 13426.0, 8664.0, 5431.0, 3533.0, 2221.0, 1369.0, 841.0, 512.0, 332.0, 221.0, 141.0, 89.0, 62.0, 47.0, 21.0, 20.0, 13.0, 10.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-49.96875, -48.33642578125, -46.7041015625, -45.07177734375, -43.439453125, -41.80712890625, -40.1748046875, -38.54248046875, -36.91015625, -35.27783203125, -33.6455078125, -32.01318359375, -30.380859375, -28.74853515625, -27.1162109375, -25.48388671875, -23.8515625, -22.21923828125, -20.5869140625, -18.95458984375, -17.322265625, -15.68994140625, -14.0576171875, -12.42529296875, -10.79296875, -9.16064453125, -7.5283203125, -5.89599609375, -4.263671875, -2.63134765625, -0.9990234375, 0.63330078125, 2.265625, 3.89794921875, 5.5302734375, 7.16259765625, 8.794921875, 10.42724609375, 12.0595703125, 13.69189453125, 15.32421875, 16.95654296875, 18.5888671875, 20.22119140625, 21.853515625, 23.48583984375, 25.1181640625, 26.75048828125, 28.3828125, 30.01513671875, 31.6474609375, 33.27978515625, 34.912109375, 36.54443359375, 38.1767578125, 39.80908203125, 41.44140625, 43.07373046875, 44.7060546875, 46.33837890625, 47.970703125, 49.60302734375, 51.2353515625, 52.86767578125, 54.5]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 12.0, 4.0, 14.0, 13.0, 11.0, 21.0, 10.0, 25.0, 18.0, 25.0, 19.0, 25.0, 26.0, 41.0, 34.0, 35.0, 38.0, 36.0, 47.0, 45.0, 59.0, 41.0, 40.0, 43.0, 42.0, 32.0, 35.0, 30.0, 29.0, 17.0, 20.0, 29.0, 10.0, 14.0, 8.0, 8.0, 12.0, 5.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.625, -36.40673828125, -35.1884765625, -33.97021484375, -32.751953125, -31.53369140625, -30.3154296875, -29.09716796875, -27.87890625, -26.66064453125, -25.4423828125, -24.22412109375, -23.005859375, -21.78759765625, -20.5693359375, -19.35107421875, -18.1328125, -16.91455078125, -15.6962890625, -14.47802734375, -13.259765625, -12.04150390625, -10.8232421875, -9.60498046875, -8.38671875, -7.16845703125, -5.9501953125, -4.73193359375, -3.513671875, -2.29541015625, -1.0771484375, 0.14111328125, 1.359375, 2.57763671875, 3.7958984375, 5.01416015625, 6.232421875, 7.45068359375, 8.6689453125, 9.88720703125, 11.10546875, 12.32373046875, 13.5419921875, 14.76025390625, 15.978515625, 17.19677734375, 18.4150390625, 19.63330078125, 20.8515625, 22.06982421875, 23.2880859375, 24.50634765625, 25.724609375, 26.94287109375, 28.1611328125, 29.37939453125, 30.59765625, 31.81591796875, 33.0341796875, 34.25244140625, 35.470703125, 36.68896484375, 37.9072265625, 39.12548828125, 40.34375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 11.0, 13.0, 12.0, 36.0, 27.0, 55.0, 85.0, 150.0, 223.0, 356.0, 598.0, 1078.0, 2152.0, 4187.0, 8555.0, 17692.0, 35574.0, 69833.0, 123960.0, 181024.0, 202795.0, 169482.0, 109806.0, 60399.0, 30620.0, 14842.0, 7153.0, 3582.0, 1843.0, 1006.0, 572.0, 318.0, 193.0, 123.0, 62.0, 48.0, 25.0, 26.0, 13.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.234375, -29.30078125, -28.3671875, -27.43359375, -26.5, -25.56640625, -24.6328125, -23.69921875, -22.765625, -21.83203125, -20.8984375, -19.96484375, -19.03125, -18.09765625, -17.1640625, -16.23046875, -15.296875, -14.36328125, -13.4296875, -12.49609375, -11.5625, -10.62890625, -9.6953125, -8.76171875, -7.828125, -6.89453125, -5.9609375, -5.02734375, -4.09375, -3.16015625, -2.2265625, -1.29296875, -0.359375, 0.57421875, 1.5078125, 2.44140625, 3.375, 4.30859375, 5.2421875, 6.17578125, 7.109375, 8.04296875, 8.9765625, 9.91015625, 10.84375, 11.77734375, 12.7109375, 13.64453125, 14.578125, 15.51171875, 16.4453125, 17.37890625, 18.3125, 19.24609375, 20.1796875, 21.11328125, 22.046875, 22.98046875, 23.9140625, 24.84765625, 25.78125, 26.71484375, 27.6484375, 28.58203125, 29.515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 10.0, 11.0, 8.0, 8.0, 18.0, 25.0, 34.0, 33.0, 54.0, 60.0, 65.0, 72.0, 71.0, 91.0, 69.0, 83.0, 61.0, 49.0, 40.0, 45.0, 33.0, 15.0, 14.0, 14.0, 7.0, 8.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.005054473876953125, -0.00494047999382019, -0.004826486110687256, -0.004712492227554321, -0.004598498344421387, -0.004484504461288452, -0.004370510578155518, -0.004256516695022583, -0.0041425228118896484, -0.004028528928756714, -0.003914535045623779, -0.0038005411624908447, -0.00368654727935791, -0.0035725533962249756, -0.003458559513092041, -0.0033445656299591064, -0.003230571746826172, -0.0031165778636932373, -0.0030025839805603027, -0.002888590097427368, -0.0027745962142944336, -0.002660602331161499, -0.0025466084480285645, -0.00243261456489563, -0.0023186206817626953, -0.0022046267986297607, -0.002090632915496826, -0.0019766390323638916, -0.001862645149230957, -0.0017486512660980225, -0.0016346573829650879, -0.0015206634998321533, -0.0014066696166992188, -0.0012926757335662842, -0.0011786818504333496, -0.001064687967300415, -0.0009506940841674805, -0.0008367002010345459, -0.0007227063179016113, -0.0006087124347686768, -0.0004947185516357422, -0.0003807246685028076, -0.00026673078536987305, -0.00015273690223693848, -3.8743019104003906e-05, 7.525086402893066e-05, 0.00018924474716186523, 0.0003032386302947998, 0.0004172325134277344, 0.0005312263965606689, 0.0006452202796936035, 0.0007592141628265381, 0.0008732080459594727, 0.0009872019290924072, 0.0011011958122253418, 0.0012151896953582764, 0.001329183578491211, 0.0014431774616241455, 0.00155717134475708, 0.0016711652278900146, 0.0017851591110229492, 0.0018991529941558838, 0.0020131468772888184, 0.002127140760421753, 0.0022411346435546875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 6.0, 8.0, 7.0, 11.0, 18.0, 26.0, 46.0, 53.0, 91.0, 156.0, 268.0, 369.0, 628.0, 1035.0, 1678.0, 2683.0, 4770.0, 8837.0, 16130.0, 29619.0, 51987.0, 86848.0, 130224.0, 165309.0, 170468.0, 141135.0, 98507.0, 60199.0, 34386.0, 18875.0, 10412.0, 5687.0, 3243.0, 1931.0, 1108.0, 647.0, 419.0, 254.0, 147.0, 109.0, 95.0, 44.0, 27.0, 22.0, 12.0, 8.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.734375, -24.88037109375, -24.0263671875, -23.17236328125, -22.318359375, -21.46435546875, -20.6103515625, -19.75634765625, -18.90234375, -18.04833984375, -17.1943359375, -16.34033203125, -15.486328125, -14.63232421875, -13.7783203125, -12.92431640625, -12.0703125, -11.21630859375, -10.3623046875, -9.50830078125, -8.654296875, -7.80029296875, -6.9462890625, -6.09228515625, -5.23828125, -4.38427734375, -3.5302734375, -2.67626953125, -1.822265625, -0.96826171875, -0.1142578125, 0.73974609375, 1.59375, 2.44775390625, 3.3017578125, 4.15576171875, 5.009765625, 5.86376953125, 6.7177734375, 7.57177734375, 8.42578125, 9.27978515625, 10.1337890625, 10.98779296875, 11.841796875, 12.69580078125, 13.5498046875, 14.40380859375, 15.2578125, 16.11181640625, 16.9658203125, 17.81982421875, 18.673828125, 19.52783203125, 20.3818359375, 21.23583984375, 22.08984375, 22.94384765625, 23.7978515625, 24.65185546875, 25.505859375, 26.35986328125, 27.2138671875, 28.06787109375, 28.921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 1.0, 6.0, 3.0, 12.0, 17.0, 25.0, 24.0, 29.0, 38.0, 50.0, 65.0, 70.0, 84.0, 68.0, 64.0, 84.0, 55.0, 56.0, 53.0, 42.0, 42.0, 17.0, 26.0, 14.0, 16.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.4609375, -12.9974365234375, -12.533935546875, -12.0704345703125, -11.60693359375, -11.1434326171875, -10.679931640625, -10.2164306640625, -9.7529296875, -9.2894287109375, -8.825927734375, -8.3624267578125, -7.89892578125, -7.4354248046875, -6.971923828125, -6.5084228515625, -6.044921875, -5.5814208984375, -5.117919921875, -4.6544189453125, -4.19091796875, -3.7274169921875, -3.263916015625, -2.8004150390625, -2.3369140625, -1.8734130859375, -1.409912109375, -0.9464111328125, -0.48291015625, -0.0194091796875, 0.444091796875, 0.9075927734375, 1.37109375, 1.8345947265625, 2.298095703125, 2.7615966796875, 3.22509765625, 3.6885986328125, 4.152099609375, 4.6156005859375, 5.0791015625, 5.5426025390625, 6.006103515625, 6.4696044921875, 6.93310546875, 7.3966064453125, 7.860107421875, 8.3236083984375, 8.787109375, 9.2506103515625, 9.714111328125, 10.1776123046875, 10.64111328125, 11.1046142578125, 11.568115234375, 12.0316162109375, 12.4951171875, 12.9586181640625, 13.422119140625, 13.8856201171875, 14.34912109375, 14.8126220703125, 15.276123046875, 15.7396240234375, 16.203125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 9.0, 10.0, 9.0, 10.0, 16.0, 22.0, 18.0, 22.0, 31.0, 27.0, 32.0, 37.0, 37.0, 35.0, 42.0, 47.0, 34.0, 50.0, 45.0, 38.0, 24.0, 40.0, 27.0, 23.0, 27.0, 36.0, 25.0, 33.0, 31.0, 25.0, 21.0, 21.0, 19.0, 10.0, 14.0, 8.0, 7.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-60.84510803222656, -58.98116683959961, -57.11722946166992, -55.25328826904297, -53.389347076416016, -51.52540588378906, -49.661468505859375, -47.79752731323242, -45.93358612060547, -44.069644927978516, -42.20570755004883, -40.341766357421875, -38.47782516479492, -36.61388397216797, -34.74994659423828, -32.88600540161133, -31.02206802368164, -29.15812873840332, -27.294187545776367, -25.430248260498047, -23.566307067871094, -21.702367782592773, -19.838428497314453, -17.9744873046875, -16.11054801940918, -14.246607780456543, -12.382667541503906, -10.518728256225586, -8.65478801727295, -6.7908477783203125, -4.926908493041992, -3.0629682540893555, -1.1990318298339844, 0.6649081707000732, 2.528848171234131, 4.392787933349609, 6.256728172302246, 8.120668411254883, 9.984607696533203, 11.84854793548584, 13.712488174438477, 15.576428413391113, 17.44036865234375, 19.30430793762207, 21.16824722290039, 23.032188415527344, 24.896127700805664, 26.760066986083984, 28.624008178710938, 30.487947463989258, 32.35188674926758, 34.21582794189453, 36.079769134521484, 37.94371032714844, 39.807647705078125, 41.67158889770508, 43.53553009033203, 45.399471282958984, 47.26340866088867, 49.127349853515625, 50.99129104614258, 52.85523223876953, 54.71916961669922, 56.58311080932617, 58.44704818725586]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 4.0, 5.0, 2.0, 9.0, 11.0, 16.0, 13.0, 9.0, 19.0, 18.0, 32.0, 31.0, 25.0, 37.0, 32.0, 25.0, 42.0, 36.0, 36.0, 40.0, 40.0, 36.0, 32.0, 41.0, 33.0, 43.0, 41.0, 30.0, 20.0, 32.0, 35.0, 24.0, 26.0, 16.0, 14.0, 13.0, 14.0, 9.0, 14.0, 10.0, 3.0, 11.0, 8.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-54.64284133911133, -52.721534729003906, -50.800228118896484, -48.87892150878906, -46.95761489868164, -45.03630828857422, -43.1150016784668, -41.193695068359375, -39.27238845825195, -37.35108184814453, -35.42977523803711, -33.50846862792969, -31.587162017822266, -29.665855407714844, -27.744548797607422, -25.8232421875, -23.901935577392578, -21.980628967285156, -20.059322357177734, -18.138015747070312, -16.21670913696289, -14.295402526855469, -12.374095916748047, -10.452789306640625, -8.531482696533203, -6.610176086425781, -4.688869476318359, -2.7675628662109375, -0.8462562561035156, 1.0750503540039062, 2.996356964111328, 4.91766357421875, 6.838966369628906, 8.760272979736328, 10.68157958984375, 12.602886199951172, 14.524192810058594, 16.445499420166016, 18.366806030273438, 20.28811264038086, 22.20941925048828, 24.130725860595703, 26.052032470703125, 27.973339080810547, 29.89464569091797, 31.81595230102539, 33.73725891113281, 35.658565521240234, 37.579872131347656, 39.50117874145508, 41.4224853515625, 43.34379196166992, 45.265098571777344, 47.186405181884766, 49.10771179199219, 51.02901840209961, 52.95032501220703, 54.87163162231445, 56.792938232421875, 58.7142448425293, 60.63555145263672, 62.55685806274414, 64.47816467285156, 66.39947509765625, 68.3207778930664]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 12.0, 17.0, 20.0, 46.0, 59.0, 123.0, 174.0, 298.0, 485.0, 803.0, 1253.0, 2126.0, 3530.0, 5505.0, 9112.0, 14945.0, 24060.0, 38424.0, 60402.0, 92812.0, 140249.0, 203516.0, 280648.0, 364383.0, 438720.0, 476999.0, 470202.0, 420598.0, 343168.0, 260727.0, 185471.0, 126067.0, 83052.0, 54487.0, 34546.0, 21552.0, 13518.0, 8436.0, 5191.0, 3225.0, 2025.0, 1231.0, 734.0, 498.0, 314.0, 202.0, 125.0, 65.0, 45.0, 29.0, 23.0, 12.0, 5.0, 5.0, 1.0, 4.0, 1.0], "bins": [-46.8125, -45.388671875, -43.96484375, -42.541015625, -41.1171875, -39.693359375, -38.26953125, -36.845703125, -35.421875, -33.998046875, -32.57421875, -31.150390625, -29.7265625, -28.302734375, -26.87890625, -25.455078125, -24.03125, -22.607421875, -21.18359375, -19.759765625, -18.3359375, -16.912109375, -15.48828125, -14.064453125, -12.640625, -11.216796875, -9.79296875, -8.369140625, -6.9453125, -5.521484375, -4.09765625, -2.673828125, -1.25, 0.173828125, 1.59765625, 3.021484375, 4.4453125, 5.869140625, 7.29296875, 8.716796875, 10.140625, 11.564453125, 12.98828125, 14.412109375, 15.8359375, 17.259765625, 18.68359375, 20.107421875, 21.53125, 22.955078125, 24.37890625, 25.802734375, 27.2265625, 28.650390625, 30.07421875, 31.498046875, 32.921875, 34.345703125, 35.76953125, 37.193359375, 38.6171875, 40.041015625, 41.46484375, 42.888671875, 44.3125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 5.0, 5.0, 7.0, 9.0, 14.0, 12.0, 15.0, 23.0, 14.0, 28.0, 32.0, 34.0, 40.0, 30.0, 34.0, 36.0, 37.0, 27.0, 43.0, 47.0, 43.0, 36.0, 36.0, 41.0, 43.0, 30.0, 28.0, 32.0, 31.0, 29.0, 25.0, 12.0, 18.0, 22.0, 5.0, 13.0, 14.0, 8.0, 10.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-48.375, -46.65283203125, -44.9306640625, -43.20849609375, -41.486328125, -39.76416015625, -38.0419921875, -36.31982421875, -34.59765625, -32.87548828125, -31.1533203125, -29.43115234375, -27.708984375, -25.98681640625, -24.2646484375, -22.54248046875, -20.8203125, -19.09814453125, -17.3759765625, -15.65380859375, -13.931640625, -12.20947265625, -10.4873046875, -8.76513671875, -7.04296875, -5.32080078125, -3.5986328125, -1.87646484375, -0.154296875, 1.56787109375, 3.2900390625, 5.01220703125, 6.734375, 8.45654296875, 10.1787109375, 11.90087890625, 13.623046875, 15.34521484375, 17.0673828125, 18.78955078125, 20.51171875, 22.23388671875, 23.9560546875, 25.67822265625, 27.400390625, 29.12255859375, 30.8447265625, 32.56689453125, 34.2890625, 36.01123046875, 37.7333984375, 39.45556640625, 41.177734375, 42.89990234375, 44.6220703125, 46.34423828125, 48.06640625, 49.78857421875, 51.5107421875, 53.23291015625, 54.955078125, 56.67724609375, 58.3994140625, 60.12158203125, 61.84375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 12.0, 12.0, 17.0, 30.0, 57.0, 114.0, 155.0, 317.0, 517.0, 909.0, 1703.0, 2894.0, 5337.0, 9258.0, 16180.0, 27868.0, 46970.0, 76536.0, 121801.0, 185460.0, 265494.0, 358204.0, 441560.0, 495081.0, 498400.0, 452484.0, 371805.0, 280442.0, 197543.0, 131098.0, 83177.0, 51024.0, 30400.0, 17688.0, 10230.0, 5962.0, 3311.0, 1824.0, 1051.0, 570.0, 315.0, 221.0, 110.0, 64.0, 32.0, 27.0, 11.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.46875, -49.7578125, -48.046875, -46.3359375, -44.625, -42.9140625, -41.203125, -39.4921875, -37.78125, -36.0703125, -34.359375, -32.6484375, -30.9375, -29.2265625, -27.515625, -25.8046875, -24.09375, -22.3828125, -20.671875, -18.9609375, -17.25, -15.5390625, -13.828125, -12.1171875, -10.40625, -8.6953125, -6.984375, -5.2734375, -3.5625, -1.8515625, -0.140625, 1.5703125, 3.28125, 4.9921875, 6.703125, 8.4140625, 10.125, 11.8359375, 13.546875, 15.2578125, 16.96875, 18.6796875, 20.390625, 22.1015625, 23.8125, 25.5234375, 27.234375, 28.9453125, 30.65625, 32.3671875, 34.078125, 35.7890625, 37.5, 39.2109375, 40.921875, 42.6328125, 44.34375, 46.0546875, 47.765625, 49.4765625, 51.1875, 52.8984375, 54.609375, 56.3203125, 58.03125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 5.0, 16.0, 12.0, 16.0, 24.0, 29.0, 41.0, 39.0, 48.0, 66.0, 74.0, 99.0, 119.0, 120.0, 140.0, 134.0, 185.0, 169.0, 202.0, 190.0, 220.0, 209.0, 187.0, 228.0, 188.0, 189.0, 170.0, 152.0, 130.0, 117.0, 107.0, 102.0, 79.0, 53.0, 38.0, 38.0, 33.0, 27.0, 18.0, 25.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.21875, -24.41552734375, -23.6123046875, -22.80908203125, -22.005859375, -21.20263671875, -20.3994140625, -19.59619140625, -18.79296875, -17.98974609375, -17.1865234375, -16.38330078125, -15.580078125, -14.77685546875, -13.9736328125, -13.17041015625, -12.3671875, -11.56396484375, -10.7607421875, -9.95751953125, -9.154296875, -8.35107421875, -7.5478515625, -6.74462890625, -5.94140625, -5.13818359375, -4.3349609375, -3.53173828125, -2.728515625, -1.92529296875, -1.1220703125, -0.31884765625, 0.484375, 1.28759765625, 2.0908203125, 2.89404296875, 3.697265625, 4.50048828125, 5.3037109375, 6.10693359375, 6.91015625, 7.71337890625, 8.5166015625, 9.31982421875, 10.123046875, 10.92626953125, 11.7294921875, 12.53271484375, 13.3359375, 14.13916015625, 14.9423828125, 15.74560546875, 16.548828125, 17.35205078125, 18.1552734375, 18.95849609375, 19.76171875, 20.56494140625, 21.3681640625, 22.17138671875, 22.974609375, 23.77783203125, 24.5810546875, 25.38427734375, 26.1875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 7.0, 5.0, 10.0, 7.0, 11.0, 8.0, 17.0, 11.0, 7.0, 13.0, 20.0, 12.0, 14.0, 28.0, 27.0, 26.0, 28.0, 32.0, 38.0, 41.0, 44.0, 39.0, 44.0, 33.0, 40.0, 38.0, 23.0, 43.0, 29.0, 28.0, 32.0, 38.0, 33.0, 18.0, 22.0, 15.0, 21.0, 11.0, 14.0, 9.0, 14.0, 13.0, 12.0, 5.0, 6.0, 9.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-52.89725875854492, -51.18734359741211, -49.47743225097656, -47.76751708984375, -46.0576057434082, -44.34769058227539, -42.637779235839844, -40.92786407470703, -39.217952728271484, -37.50803756713867, -35.798126220703125, -34.08821105957031, -32.378299713134766, -30.668384552001953, -28.958473205566406, -27.248558044433594, -25.538644790649414, -23.828731536865234, -22.118818283081055, -20.408905029296875, -18.698991775512695, -16.989078521728516, -15.27916431427002, -13.56925106048584, -11.85933780670166, -10.14942455291748, -8.4395112991333, -6.729597568511963, -5.019684314727783, -3.3097705841064453, -1.5998573303222656, 0.11005592346191406, 1.8199691772460938, 3.5298824310302734, 5.239795684814453, 6.949709415435791, 8.659622192382812, 10.369536399841309, 12.079449653625488, 13.789362907409668, 15.499276161193848, 17.209190368652344, 18.919103622436523, 20.629016876220703, 22.338930130004883, 24.048843383789062, 25.758756637573242, 27.468669891357422, 29.1785831451416, 30.88849639892578, 32.598411560058594, 34.30832290649414, 36.01823806762695, 37.7281494140625, 39.43806457519531, 41.14797592163086, 42.85789108276367, 44.567806243896484, 46.27771759033203, 47.987632751464844, 49.69754409790039, 51.4074592590332, 53.11737060546875, 54.82728576660156, 56.53719711303711]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 11.0, 10.0, 13.0, 13.0, 13.0, 14.0, 12.0, 25.0, 29.0, 22.0, 29.0, 34.0, 42.0, 42.0, 42.0, 38.0, 31.0, 44.0, 46.0, 39.0, 44.0, 33.0, 41.0, 34.0, 30.0, 36.0, 36.0, 27.0, 27.0, 21.0, 17.0, 16.0, 22.0, 12.0, 8.0, 8.0, 12.0, 4.0, 5.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.406978607177734, -54.4423713684082, -52.477760314941406, -50.513153076171875, -48.548545837402344, -46.58393859863281, -44.619327545166016, -42.654720306396484, -40.69010925292969, -38.725502014160156, -36.76089096069336, -34.79628372192383, -32.8316764831543, -30.867067337036133, -28.90245819091797, -26.937850952148438, -24.973243713378906, -23.008634567260742, -21.04402732849121, -19.079418182373047, -17.114810943603516, -15.150201797485352, -13.185592651367188, -11.22098445892334, -9.256376266479492, -7.2917680740356445, -5.327159404754639, -3.362550735473633, -1.3979425430297852, 0.5666656494140625, 2.5312747955322266, 4.495882987976074, 6.460487365722656, 8.425095558166504, 10.389703750610352, 12.354312896728516, 14.318921089172363, 16.28352928161621, 18.248138427734375, 20.212745666503906, 22.17735481262207, 24.141963958740234, 26.106571197509766, 28.07118034362793, 30.035789489746094, 32.000396728515625, 33.965003967285156, 35.92961502075195, 37.894222259521484, 39.858829498291016, 41.82344055175781, 43.788047790527344, 45.752655029296875, 47.717262268066406, 49.6818733215332, 51.646480560302734, 53.61109161376953, 55.57569885253906, 57.54030990600586, 59.50491714477539, 61.46952438354492, 63.43413543701172, 65.39874267578125, 67.36334991455078, 69.32795715332031]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 10.0, 16.0, 21.0, 30.0, 43.0, 86.0, 129.0, 215.0, 375.0, 558.0, 1076.0, 1997.0, 3360.0, 5758.0, 9964.0, 17244.0, 28364.0, 46069.0, 69920.0, 98552.0, 125818.0, 140518.0, 137160.0, 116620.0, 87808.0, 60409.0, 38963.0, 23937.0, 14071.0, 8159.0, 4787.0, 2788.0, 1610.0, 889.0, 478.0, 288.0, 171.0, 112.0, 66.0, 37.0, 29.0, 16.0, 9.0, 7.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.53125, -24.675048828125, -23.81884765625, -22.962646484375, -22.1064453125, -21.250244140625, -20.39404296875, -19.537841796875, -18.681640625, -17.825439453125, -16.96923828125, -16.113037109375, -15.2568359375, -14.400634765625, -13.54443359375, -12.688232421875, -11.83203125, -10.975830078125, -10.11962890625, -9.263427734375, -8.4072265625, -7.551025390625, -6.69482421875, -5.838623046875, -4.982421875, -4.126220703125, -3.27001953125, -2.413818359375, -1.5576171875, -0.701416015625, 0.15478515625, 1.010986328125, 1.8671875, 2.723388671875, 3.57958984375, 4.435791015625, 5.2919921875, 6.148193359375, 7.00439453125, 7.860595703125, 8.716796875, 9.572998046875, 10.42919921875, 11.285400390625, 12.1416015625, 12.997802734375, 13.85400390625, 14.710205078125, 15.56640625, 16.422607421875, 17.27880859375, 18.135009765625, 18.9912109375, 19.847412109375, 20.70361328125, 21.559814453125, 22.416015625, 23.272216796875, 24.12841796875, 24.984619140625, 25.8408203125, 26.697021484375, 27.55322265625, 28.409423828125, 29.265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 11.0, 10.0, 10.0, 15.0, 14.0, 10.0, 14.0, 14.0, 22.0, 31.0, 23.0, 31.0, 34.0, 37.0, 41.0, 45.0, 40.0, 31.0, 42.0, 45.0, 39.0, 41.0, 36.0, 43.0, 33.0, 28.0, 38.0, 33.0, 31.0, 23.0, 23.0, 18.0, 14.0, 21.0, 16.0, 6.0, 8.0, 11.0, 6.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.03125, -55.04541015625, -53.0595703125, -51.07373046875, -49.087890625, -47.10205078125, -45.1162109375, -43.13037109375, -41.14453125, -39.15869140625, -37.1728515625, -35.18701171875, -33.201171875, -31.21533203125, -29.2294921875, -27.24365234375, -25.2578125, -23.27197265625, -21.2861328125, -19.30029296875, -17.314453125, -15.32861328125, -13.3427734375, -11.35693359375, -9.37109375, -7.38525390625, -5.3994140625, -3.41357421875, -1.427734375, 0.55810546875, 2.5439453125, 4.52978515625, 6.515625, 8.50146484375, 10.4873046875, 12.47314453125, 14.458984375, 16.44482421875, 18.4306640625, 20.41650390625, 22.40234375, 24.38818359375, 26.3740234375, 28.35986328125, 30.345703125, 32.33154296875, 34.3173828125, 36.30322265625, 38.2890625, 40.27490234375, 42.2607421875, 44.24658203125, 46.232421875, 48.21826171875, 50.2041015625, 52.18994140625, 54.17578125, 56.16162109375, 58.1474609375, 60.13330078125, 62.119140625, 64.10498046875, 66.0908203125, 68.07666015625, 70.0625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 9.0, 9.0, 12.0, 15.0, 24.0, 35.0, 49.0, 86.0, 116.0, 221.0, 411.0, 717.0, 1363.0, 2507.0, 4492.0, 8247.0, 15361.0, 29134.0, 192290.0, 717800.0, 35699.0, 18448.0, 9742.0, 5211.0, 2848.0, 1671.0, 879.0, 510.0, 245.0, 121.0, 106.0, 67.0, 35.0, 21.0, 15.0, 13.0, 4.0, 3.0, 11.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-82.625, -80.205078125, -77.78515625, -75.365234375, -72.9453125, -70.525390625, -68.10546875, -65.685546875, -63.265625, -60.845703125, -58.42578125, -56.005859375, -53.5859375, -51.166015625, -48.74609375, -46.326171875, -43.90625, -41.486328125, -39.06640625, -36.646484375, -34.2265625, -31.806640625, -29.38671875, -26.966796875, -24.546875, -22.126953125, -19.70703125, -17.287109375, -14.8671875, -12.447265625, -10.02734375, -7.607421875, -5.1875, -2.767578125, -0.34765625, 2.072265625, 4.4921875, 6.912109375, 9.33203125, 11.751953125, 14.171875, 16.591796875, 19.01171875, 21.431640625, 23.8515625, 26.271484375, 28.69140625, 31.111328125, 33.53125, 35.951171875, 38.37109375, 40.791015625, 43.2109375, 45.630859375, 48.05078125, 50.470703125, 52.890625, 55.310546875, 57.73046875, 60.150390625, 62.5703125, 64.990234375, 67.41015625, 69.830078125, 72.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 10.0, 13.0, 17.0, 15.0, 19.0, 24.0, 13.0, 28.0, 34.0, 32.0, 38.0, 36.0, 31.0, 35.0, 41.0, 37.0, 39.0, 23.0, 37.0, 26.0, 30.0, 45.0, 43.0, 28.0, 35.0, 20.0, 39.0, 27.0, 20.0, 21.0, 14.0, 17.0, 13.0, 15.0, 18.0, 4.0, 8.0, 6.0, 10.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-37.46875, -36.17626953125, -34.8837890625, -33.59130859375, -32.298828125, -31.00634765625, -29.7138671875, -28.42138671875, -27.12890625, -25.83642578125, -24.5439453125, -23.25146484375, -21.958984375, -20.66650390625, -19.3740234375, -18.08154296875, -16.7890625, -15.49658203125, -14.2041015625, -12.91162109375, -11.619140625, -10.32666015625, -9.0341796875, -7.74169921875, -6.44921875, -5.15673828125, -3.8642578125, -2.57177734375, -1.279296875, 0.01318359375, 1.3056640625, 2.59814453125, 3.890625, 5.18310546875, 6.4755859375, 7.76806640625, 9.060546875, 10.35302734375, 11.6455078125, 12.93798828125, 14.23046875, 15.52294921875, 16.8154296875, 18.10791015625, 19.400390625, 20.69287109375, 21.9853515625, 23.27783203125, 24.5703125, 25.86279296875, 27.1552734375, 28.44775390625, 29.740234375, 31.03271484375, 32.3251953125, 33.61767578125, 34.91015625, 36.20263671875, 37.4951171875, 38.78759765625, 40.080078125, 41.37255859375, 42.6650390625, 43.95751953125, 45.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 8.0, 22.0, 23.0, 28.0, 36.0, 43.0, 56.0, 92.0, 136.0, 213.0, 332.0, 549.0, 848.0, 1436.0, 2504.0, 4515.0, 8505.0, 16439.0, 35883.0, 672400.0, 244580.0, 28724.0, 13991.0, 7360.0, 4156.0, 2251.0, 1222.0, 782.0, 432.0, 274.0, 199.0, 141.0, 76.0, 79.0, 45.0, 30.0, 32.0, 30.0, 10.0, 14.0, 9.0, 8.0, 3.0, 6.0, 2.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.18359375, -5.02099609375, -4.8583984375, -4.69580078125, -4.533203125, -4.37060546875, -4.2080078125, -4.04541015625, -3.8828125, -3.72021484375, -3.5576171875, -3.39501953125, -3.232421875, -3.06982421875, -2.9072265625, -2.74462890625, -2.58203125, -2.41943359375, -2.2568359375, -2.09423828125, -1.931640625, -1.76904296875, -1.6064453125, -1.44384765625, -1.28125, -1.11865234375, -0.9560546875, -0.79345703125, -0.630859375, -0.46826171875, -0.3056640625, -0.14306640625, 0.01953125, 0.18212890625, 0.3447265625, 0.50732421875, 0.669921875, 0.83251953125, 0.9951171875, 1.15771484375, 1.3203125, 1.48291015625, 1.6455078125, 1.80810546875, 1.970703125, 2.13330078125, 2.2958984375, 2.45849609375, 2.62109375, 2.78369140625, 2.9462890625, 3.10888671875, 3.271484375, 3.43408203125, 3.5966796875, 3.75927734375, 3.921875, 4.08447265625, 4.2470703125, 4.40966796875, 4.572265625, 4.73486328125, 4.8974609375, 5.06005859375, 5.22265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 3.0, 6.0, 3.0, 8.0, 10.0, 9.0, 12.0, 5.0, 18.0, 23.0, 12.0, 25.0, 20.0, 34.0, 29.0, 51.0, 49.0, 44.0, 57.0, 57.0, 52.0, 62.0, 45.0, 51.0, 36.0, 35.0, 32.0, 33.0, 31.0, 25.0, 20.0, 17.0, 13.0, 12.0, 10.0, 8.0, 7.0, 7.0, 7.0, 7.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00061798095703125, -0.0006001219153404236, -0.0005822628736495972, -0.0005644038319587708, -0.0005465447902679443, -0.0005286857485771179, -0.0005108267068862915, -0.0004929676651954651, -0.00047510862350463867, -0.00045724958181381226, -0.00043939054012298584, -0.0004215314984321594, -0.000403672456741333, -0.0003858134150505066, -0.0003679543733596802, -0.00035009533166885376, -0.00033223628997802734, -0.00031437724828720093, -0.0002965182065963745, -0.0002786591649055481, -0.0002608001232147217, -0.00024294108152389526, -0.00022508203983306885, -0.00020722299814224243, -0.00018936395645141602, -0.0001715049147605896, -0.00015364587306976318, -0.00013578683137893677, -0.00011792778968811035, -0.00010006874799728394, -8.220970630645752e-05, -6.43506646156311e-05, -4.649162292480469e-05, -2.863258123397827e-05, -1.0773539543151855e-05, 7.0855021476745605e-06, 2.4944543838500977e-05, 4.280358552932739e-05, 6.066262722015381e-05, 7.852166891098022e-05, 9.638071060180664e-05, 0.00011423975229263306, 0.00013209879398345947, 0.0001499578356742859, 0.0001678168773651123, 0.00018567591905593872, 0.00020353496074676514, 0.00022139400243759155, 0.00023925304412841797, 0.0002571120858192444, 0.0002749711275100708, 0.0002928301692008972, 0.00031068921089172363, 0.00032854825258255005, 0.00034640729427337646, 0.0003642663359642029, 0.0003821253776550293, 0.0003999844193458557, 0.00041784346103668213, 0.00043570250272750854, 0.00045356154441833496, 0.0004714205861091614, 0.0004892796277999878, 0.0005071386694908142, 0.0005249977111816406]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 6.0, 10.0, 14.0, 22.0, 20.0, 36.0, 49.0, 73.0, 120.0, 156.0, 219.0, 280.0, 439.0, 610.0, 949.0, 1560.0, 2572.0, 4545.0, 8854.0, 18010.0, 36725.0, 74127.0, 136651.0, 208399.0, 219956.0, 156264.0, 87894.0, 43924.0, 21741.0, 10681.0, 5577.0, 2995.0, 1724.0, 1093.0, 694.0, 484.0, 300.0, 224.0, 163.0, 111.0, 87.0, 84.0, 38.0, 25.0, 20.0, 6.0, 12.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.525390625, -3.40838623046875, -3.2913818359375, -3.17437744140625, -3.057373046875, -2.94036865234375, -2.8233642578125, -2.70635986328125, -2.58935546875, -2.47235107421875, -2.3553466796875, -2.23834228515625, -2.121337890625, -2.00433349609375, -1.8873291015625, -1.77032470703125, -1.6533203125, -1.53631591796875, -1.4193115234375, -1.30230712890625, -1.185302734375, -1.06829833984375, -0.9512939453125, -0.83428955078125, -0.71728515625, -0.60028076171875, -0.4832763671875, -0.36627197265625, -0.249267578125, -0.13226318359375, -0.0152587890625, 0.10174560546875, 0.21875, 0.33575439453125, 0.4527587890625, 0.56976318359375, 0.686767578125, 0.80377197265625, 0.9207763671875, 1.03778076171875, 1.15478515625, 1.27178955078125, 1.3887939453125, 1.50579833984375, 1.622802734375, 1.73980712890625, 1.8568115234375, 1.97381591796875, 2.0908203125, 2.20782470703125, 2.3248291015625, 2.44183349609375, 2.558837890625, 2.67584228515625, 2.7928466796875, 2.90985107421875, 3.02685546875, 3.14385986328125, 3.2608642578125, 3.37786865234375, 3.494873046875, 3.61187744140625, 3.7288818359375, 3.84588623046875, 3.962890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 8.0, 11.0, 20.0, 18.0, 31.0, 31.0, 62.0, 77.0, 96.0, 113.0, 118.0, 102.0, 80.0, 61.0, 44.0, 28.0, 14.0, 14.0, 8.0, 13.0, 6.0, 4.0, 2.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.4547882080078125, -1.404693603515625, -1.3545989990234375, -1.30450439453125, -1.2544097900390625, -1.204315185546875, -1.1542205810546875, -1.1041259765625, -1.0540313720703125, -1.003936767578125, -0.9538421630859375, -0.90374755859375, -0.8536529541015625, -0.803558349609375, -0.7534637451171875, -0.703369140625, -0.6532745361328125, -0.603179931640625, -0.5530853271484375, -0.50299072265625, -0.4528961181640625, -0.402801513671875, -0.3527069091796875, -0.3026123046875, -0.2525177001953125, -0.202423095703125, -0.1523284912109375, -0.10223388671875, -0.0521392822265625, -0.002044677734375, 0.0480499267578125, 0.09814453125, 0.1482391357421875, 0.198333740234375, 0.2484283447265625, 0.29852294921875, 0.3486175537109375, 0.398712158203125, 0.4488067626953125, 0.4989013671875, 0.5489959716796875, 0.599090576171875, 0.6491851806640625, 0.69927978515625, 0.7493743896484375, 0.799468994140625, 0.8495635986328125, 0.899658203125, 0.9497528076171875, 0.999847412109375, 1.0499420166015625, 1.10003662109375, 1.1501312255859375, 1.200225830078125, 1.2503204345703125, 1.3004150390625, 1.3505096435546875, 1.400604248046875, 1.4506988525390625, 1.50079345703125, 1.5508880615234375, 1.600982666015625, 1.6510772705078125, 1.701171875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 5.0, 10.0, 9.0, 11.0, 10.0, 14.0, 9.0, 14.0, 13.0, 16.0, 20.0, 30.0, 19.0, 21.0, 22.0, 35.0, 42.0, 35.0, 33.0, 39.0, 43.0, 37.0, 40.0, 37.0, 34.0, 31.0, 31.0, 34.0, 42.0, 29.0, 26.0, 28.0, 21.0, 20.0, 17.0, 16.0, 20.0, 5.0, 9.0, 16.0, 10.0, 14.0, 6.0, 1.0, 6.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-51.85308837890625, -50.14957809448242, -48.44607162475586, -46.74256134033203, -45.0390510559082, -43.335540771484375, -41.63203430175781, -39.928524017333984, -38.225013732910156, -36.52150344848633, -34.817996978759766, -33.11448669433594, -31.41097640991211, -29.707468032836914, -28.00395965576172, -26.30044937133789, -24.596942901611328, -22.893434524536133, -21.189924240112305, -19.48641586303711, -17.78290557861328, -16.079397201538086, -14.37588882446289, -12.672379493713379, -10.968870162963867, -9.265360832214355, -7.561851978302002, -5.858343124389648, -4.154833793640137, -2.451324462890625, -0.7478160858154297, 0.955693244934082, 2.6592025756835938, 4.3627119064331055, 6.066220760345459, 7.7697296142578125, 9.473238945007324, 11.176748275756836, 12.880256652832031, 14.583765983581543, 16.287275314331055, 17.99078369140625, 19.694293975830078, 21.397802352905273, 23.10131072998047, 24.804821014404297, 26.508329391479492, 28.211837768554688, 29.915348052978516, 31.61885643005371, 33.322364807128906, 35.025875091552734, 36.72938537597656, 38.432891845703125, 40.13640213012695, 41.83991241455078, 43.543418884277344, 45.24692916870117, 46.950435638427734, 48.65394592285156, 50.35745620727539, 52.06096649169922, 53.76447296142578, 55.46798324584961, 57.17149353027344]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 11.0, 8.0, 11.0, 16.0, 11.0, 14.0, 15.0, 25.0, 23.0, 27.0, 34.0, 32.0, 35.0, 45.0, 32.0, 46.0, 33.0, 45.0, 44.0, 37.0, 42.0, 30.0, 50.0, 30.0, 30.0, 40.0, 27.0, 32.0, 30.0, 19.0, 18.0, 13.0, 16.0, 24.0, 4.0, 14.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.00938415527344, -55.027931213378906, -53.04648208618164, -51.06502914428711, -49.083580017089844, -47.10212707519531, -45.12067413330078, -43.139225006103516, -41.15777587890625, -39.17632293701172, -37.19487380981445, -35.21342086791992, -33.231971740722656, -31.250518798828125, -29.269067764282227, -27.287616729736328, -25.306163787841797, -23.3247127532959, -21.34326171875, -19.36180877685547, -17.380359649658203, -15.398907661437988, -13.417455673217773, -11.436004638671875, -9.454553604125977, -7.473102569580078, -5.4916510581970215, -3.510199546813965, -1.5287485122680664, 0.45270252227783203, 2.434154510498047, 4.415605545043945, 6.397056579589844, 8.378507614135742, 10.35995864868164, 12.341410636901855, 14.322861671447754, 16.30431365966797, 18.285764694213867, 20.267215728759766, 22.248666763305664, 24.230117797851562, 26.21156883239746, 28.19301986694336, 30.17447280883789, 32.155921936035156, 34.13737487792969, 36.11882781982422, 38.100276947021484, 40.081729888916016, 42.06317901611328, 44.04463195800781, 46.02608108520508, 48.00753402709961, 49.988983154296875, 51.970436096191406, 53.95188903808594, 55.93334197998047, 57.914791107177734, 59.896244049072266, 61.87769317626953, 63.85914611816406, 65.8405990600586, 67.82205200195312, 69.80349731445312]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 18.0, 18.0, 43.0, 63.0, 101.0, 184.0, 282.0, 496.0, 893.0, 1534.0, 2670.0, 4636.0, 8102.0, 13836.0, 22784.0, 36187.0, 54462.0, 76886.0, 100217.0, 118705.0, 127268.0, 122384.0, 106039.0, 83518.0, 60636.0, 41409.0, 26437.0, 16125.0, 9627.0, 5593.0, 3118.0, 1877.0, 967.0, 598.0, 350.0, 201.0, 114.0, 67.0, 45.0, 22.0, 12.0, 12.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.96875, -53.17529296875, -51.3818359375, -49.58837890625, -47.794921875, -46.00146484375, -44.2080078125, -42.41455078125, -40.62109375, -38.82763671875, -37.0341796875, -35.24072265625, -33.447265625, -31.65380859375, -29.8603515625, -28.06689453125, -26.2734375, -24.47998046875, -22.6865234375, -20.89306640625, -19.099609375, -17.30615234375, -15.5126953125, -13.71923828125, -11.92578125, -10.13232421875, -8.3388671875, -6.54541015625, -4.751953125, -2.95849609375, -1.1650390625, 0.62841796875, 2.421875, 4.21533203125, 6.0087890625, 7.80224609375, 9.595703125, 11.38916015625, 13.1826171875, 14.97607421875, 16.76953125, 18.56298828125, 20.3564453125, 22.14990234375, 23.943359375, 25.73681640625, 27.5302734375, 29.32373046875, 31.1171875, 32.91064453125, 34.7041015625, 36.49755859375, 38.291015625, 40.08447265625, 41.8779296875, 43.67138671875, 45.46484375, 47.25830078125, 49.0517578125, 50.84521484375, 52.638671875, 54.43212890625, 56.2255859375, 58.01904296875, 59.8125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 10.0, 11.0, 13.0, 14.0, 10.0, 14.0, 12.0, 21.0, 29.0, 30.0, 30.0, 35.0, 35.0, 36.0, 38.0, 47.0, 40.0, 43.0, 45.0, 35.0, 39.0, 35.0, 44.0, 31.0, 29.0, 33.0, 38.0, 31.0, 31.0, 15.0, 16.0, 17.0, 20.0, 17.0, 9.0, 9.0, 10.0, 4.0, 7.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.71875, -52.81591796875, -50.9130859375, -49.01025390625, -47.107421875, -45.20458984375, -43.3017578125, -41.39892578125, -39.49609375, -37.59326171875, -35.6904296875, -33.78759765625, -31.884765625, -29.98193359375, -28.0791015625, -26.17626953125, -24.2734375, -22.37060546875, -20.4677734375, -18.56494140625, -16.662109375, -14.75927734375, -12.8564453125, -10.95361328125, -9.05078125, -7.14794921875, -5.2451171875, -3.34228515625, -1.439453125, 0.46337890625, 2.3662109375, 4.26904296875, 6.171875, 8.07470703125, 9.9775390625, 11.88037109375, 13.783203125, 15.68603515625, 17.5888671875, 19.49169921875, 21.39453125, 23.29736328125, 25.2001953125, 27.10302734375, 29.005859375, 30.90869140625, 32.8115234375, 34.71435546875, 36.6171875, 38.52001953125, 40.4228515625, 42.32568359375, 44.228515625, 46.13134765625, 48.0341796875, 49.93701171875, 51.83984375, 53.74267578125, 55.6455078125, 57.54833984375, 59.451171875, 61.35400390625, 63.2568359375, 65.15966796875, 67.0625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 15.0, 26.0, 26.0, 47.0, 93.0, 142.0, 245.0, 425.0, 748.0, 1379.0, 2651.0, 4791.0, 8485.0, 15129.0, 25978.0, 42115.0, 64208.0, 90517.0, 116813.0, 133375.0, 135467.0, 121817.0, 98133.0, 70803.0, 46488.0, 29235.0, 17300.0, 9924.0, 5457.0, 2992.0, 1692.0, 888.0, 457.0, 279.0, 161.0, 88.0, 59.0, 36.0, 28.0, 12.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-64.0625, -62.18505859375, -60.3076171875, -58.43017578125, -56.552734375, -54.67529296875, -52.7978515625, -50.92041015625, -49.04296875, -47.16552734375, -45.2880859375, -43.41064453125, -41.533203125, -39.65576171875, -37.7783203125, -35.90087890625, -34.0234375, -32.14599609375, -30.2685546875, -28.39111328125, -26.513671875, -24.63623046875, -22.7587890625, -20.88134765625, -19.00390625, -17.12646484375, -15.2490234375, -13.37158203125, -11.494140625, -9.61669921875, -7.7392578125, -5.86181640625, -3.984375, -2.10693359375, -0.2294921875, 1.64794921875, 3.525390625, 5.40283203125, 7.2802734375, 9.15771484375, 11.03515625, 12.91259765625, 14.7900390625, 16.66748046875, 18.544921875, 20.42236328125, 22.2998046875, 24.17724609375, 26.0546875, 27.93212890625, 29.8095703125, 31.68701171875, 33.564453125, 35.44189453125, 37.3193359375, 39.19677734375, 41.07421875, 42.95166015625, 44.8291015625, 46.70654296875, 48.583984375, 50.46142578125, 52.3388671875, 54.21630859375, 56.09375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 9.0, 8.0, 10.0, 21.0, 12.0, 14.0, 34.0, 34.0, 35.0, 31.0, 31.0, 33.0, 39.0, 37.0, 41.0, 43.0, 40.0, 38.0, 46.0, 43.0, 39.0, 38.0, 35.0, 33.0, 26.0, 24.0, 34.0, 33.0, 23.0, 14.0, 17.0, 11.0, 14.0, 5.0, 11.0, 8.0, 9.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -34.2587890625, -32.955078125, -31.6513671875, -30.34765625, -29.0439453125, -27.740234375, -26.4365234375, -25.1328125, -23.8291015625, -22.525390625, -21.2216796875, -19.91796875, -18.6142578125, -17.310546875, -16.0068359375, -14.703125, -13.3994140625, -12.095703125, -10.7919921875, -9.48828125, -8.1845703125, -6.880859375, -5.5771484375, -4.2734375, -2.9697265625, -1.666015625, -0.3623046875, 0.94140625, 2.2451171875, 3.548828125, 4.8525390625, 6.15625, 7.4599609375, 8.763671875, 10.0673828125, 11.37109375, 12.6748046875, 13.978515625, 15.2822265625, 16.5859375, 17.8896484375, 19.193359375, 20.4970703125, 21.80078125, 23.1044921875, 24.408203125, 25.7119140625, 27.015625, 28.3193359375, 29.623046875, 30.9267578125, 32.23046875, 33.5341796875, 34.837890625, 36.1416015625, 37.4453125, 38.7490234375, 40.052734375, 41.3564453125, 42.66015625, 43.9638671875, 45.267578125, 46.5712890625, 47.875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 6.0, 15.0, 18.0, 32.0, 45.0, 113.0, 222.0, 370.0, 724.0, 1563.0, 3602.0, 8526.0, 20222.0, 46512.0, 101883.0, 180054.0, 233613.0, 208294.0, 129957.0, 64116.0, 27944.0, 11632.0, 4889.0, 2116.0, 974.0, 500.0, 254.0, 135.0, 75.0, 53.0, 35.0, 21.0, 8.0, 10.0, 8.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.09375, -39.9091796875, -38.724609375, -37.5400390625, -36.35546875, -35.1708984375, -33.986328125, -32.8017578125, -31.6171875, -30.4326171875, -29.248046875, -28.0634765625, -26.87890625, -25.6943359375, -24.509765625, -23.3251953125, -22.140625, -20.9560546875, -19.771484375, -18.5869140625, -17.40234375, -16.2177734375, -15.033203125, -13.8486328125, -12.6640625, -11.4794921875, -10.294921875, -9.1103515625, -7.92578125, -6.7412109375, -5.556640625, -4.3720703125, -3.1875, -2.0029296875, -0.818359375, 0.3662109375, 1.55078125, 2.7353515625, 3.919921875, 5.1044921875, 6.2890625, 7.4736328125, 8.658203125, 9.8427734375, 11.02734375, 12.2119140625, 13.396484375, 14.5810546875, 15.765625, 16.9501953125, 18.134765625, 19.3193359375, 20.50390625, 21.6884765625, 22.873046875, 24.0576171875, 25.2421875, 26.4267578125, 27.611328125, 28.7958984375, 29.98046875, 31.1650390625, 32.349609375, 33.5341796875, 34.71875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 4.0, 3.0, 2.0, 11.0, 11.0, 13.0, 17.0, 30.0, 24.0, 26.0, 28.0, 24.0, 37.0, 34.0, 41.0, 42.0, 57.0, 44.0, 52.0, 46.0, 46.0, 37.0, 43.0, 41.0, 34.0, 36.0, 27.0, 25.0, 19.0, 21.0, 20.0, 20.0, 16.0, 10.0, 7.0, 9.0, 13.0, 8.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.002246856689453125, -0.0021781325340270996, -0.0021094083786010742, -0.002040684223175049, -0.0019719600677490234, -0.001903235912322998, -0.0018345117568969727, -0.0017657876014709473, -0.0016970634460449219, -0.0016283392906188965, -0.001559615135192871, -0.0014908909797668457, -0.0014221668243408203, -0.001353442668914795, -0.0012847185134887695, -0.0012159943580627441, -0.0011472702026367188, -0.0010785460472106934, -0.001009821891784668, -0.0009410977363586426, -0.0008723735809326172, -0.0008036494255065918, -0.0007349252700805664, -0.000666201114654541, -0.0005974769592285156, -0.0005287528038024902, -0.00046002864837646484, -0.00039130449295043945, -0.00032258033752441406, -0.00025385618209838867, -0.00018513202667236328, -0.00011640787124633789, -4.76837158203125e-05, 2.104043960571289e-05, 8.976459503173828e-05, 0.00015848875045776367, 0.00022721290588378906, 0.00029593706130981445, 0.00036466121673583984, 0.00043338537216186523, 0.0005021095275878906, 0.000570833683013916, 0.0006395578384399414, 0.0007082819938659668, 0.0007770061492919922, 0.0008457303047180176, 0.000914454460144043, 0.0009831786155700684, 0.0010519027709960938, 0.0011206269264221191, 0.0011893510818481445, 0.00125807523727417, 0.0013267993927001953, 0.0013955235481262207, 0.001464247703552246, 0.0015329718589782715, 0.0016016960144042969, 0.0016704201698303223, 0.0017391443252563477, 0.001807868480682373, 0.0018765926361083984, 0.0019453167915344238, 0.0020140409469604492, 0.0020827651023864746, 0.0021514892578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 13.0, 14.0, 28.0, 39.0, 75.0, 90.0, 178.0, 251.0, 463.0, 683.0, 1144.0, 1897.0, 3243.0, 5687.0, 9818.0, 16813.0, 30027.0, 49888.0, 79978.0, 115233.0, 145215.0, 155958.0, 140039.0, 108431.0, 73550.0, 45660.0, 26973.0, 15566.0, 8969.0, 5175.0, 2985.0, 1754.0, 1064.0, 636.0, 366.0, 259.0, 149.0, 86.0, 58.0, 29.0, 19.0, 23.0, 4.0, 11.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.875, -24.0830078125, -23.291015625, -22.4990234375, -21.70703125, -20.9150390625, -20.123046875, -19.3310546875, -18.5390625, -17.7470703125, -16.955078125, -16.1630859375, -15.37109375, -14.5791015625, -13.787109375, -12.9951171875, -12.203125, -11.4111328125, -10.619140625, -9.8271484375, -9.03515625, -8.2431640625, -7.451171875, -6.6591796875, -5.8671875, -5.0751953125, -4.283203125, -3.4912109375, -2.69921875, -1.9072265625, -1.115234375, -0.3232421875, 0.46875, 1.2607421875, 2.052734375, 2.8447265625, 3.63671875, 4.4287109375, 5.220703125, 6.0126953125, 6.8046875, 7.5966796875, 8.388671875, 9.1806640625, 9.97265625, 10.7646484375, 11.556640625, 12.3486328125, 13.140625, 13.9326171875, 14.724609375, 15.5166015625, 16.30859375, 17.1005859375, 17.892578125, 18.6845703125, 19.4765625, 20.2685546875, 21.060546875, 21.8525390625, 22.64453125, 23.4365234375, 24.228515625, 25.0205078125, 25.8125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 5.0, 6.0, 6.0, 13.0, 21.0, 21.0, 40.0, 29.0, 42.0, 58.0, 55.0, 67.0, 85.0, 72.0, 69.0, 66.0, 70.0, 54.0, 56.0, 39.0, 26.0, 27.0, 18.0, 20.0, 10.0, 8.0, 7.0, 3.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.4757080078125, -11.037353515625, -10.5989990234375, -10.16064453125, -9.7222900390625, -9.283935546875, -8.8455810546875, -8.4072265625, -7.9688720703125, -7.530517578125, -7.0921630859375, -6.65380859375, -6.2154541015625, -5.777099609375, -5.3387451171875, -4.900390625, -4.4620361328125, -4.023681640625, -3.5853271484375, -3.14697265625, -2.7086181640625, -2.270263671875, -1.8319091796875, -1.3935546875, -0.9552001953125, -0.516845703125, -0.0784912109375, 0.35986328125, 0.7982177734375, 1.236572265625, 1.6749267578125, 2.11328125, 2.5516357421875, 2.989990234375, 3.4283447265625, 3.86669921875, 4.3050537109375, 4.743408203125, 5.1817626953125, 5.6201171875, 6.0584716796875, 6.496826171875, 6.9351806640625, 7.37353515625, 7.8118896484375, 8.250244140625, 8.6885986328125, 9.126953125, 9.5653076171875, 10.003662109375, 10.4420166015625, 10.88037109375, 11.3187255859375, 11.757080078125, 12.1954345703125, 12.6337890625, 13.0721435546875, 13.510498046875, 13.9488525390625, 14.38720703125, 14.8255615234375, 15.263916015625, 15.7022705078125, 16.140625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 7.0, 11.0, 7.0, 9.0, 14.0, 13.0, 20.0, 15.0, 18.0, 27.0, 42.0, 33.0, 30.0, 33.0, 45.0, 55.0, 30.0, 37.0, 46.0, 40.0, 45.0, 36.0, 42.0, 36.0, 36.0, 21.0, 28.0, 25.0, 28.0, 18.0, 29.0, 18.0, 10.0, 16.0, 12.0, 11.0, 6.0, 9.0, 4.0, 10.0, 2.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.68506622314453, -49.852203369140625, -48.01934051513672, -46.18647384643555, -44.35361099243164, -42.520748138427734, -40.68788528442383, -38.855018615722656, -37.02215576171875, -35.189292907714844, -33.35643005371094, -31.5235652923584, -29.69070053100586, -27.857837677001953, -26.024974822998047, -24.192110061645508, -22.3592472076416, -20.526384353637695, -18.693519592285156, -16.86065673828125, -15.027791976928711, -13.194929122924805, -11.362065315246582, -9.52920150756836, -7.696337699890137, -5.863473892211914, -4.030610084533691, -2.197746753692627, -0.3648829460144043, 1.4679803848266602, 3.300844192504883, 5.1337080001831055, 6.966571807861328, 8.79943561553955, 10.632299423217773, 12.46516227722168, 14.298027038574219, 16.130889892578125, 17.96375274658203, 19.79661750793457, 21.62948226928711, 23.462345123291016, 25.295209884643555, 27.12807273864746, 28.9609375, 30.793800354003906, 32.62666320800781, 34.45952606201172, 36.292388916015625, 38.12525177001953, 39.95811462402344, 41.79098129272461, 43.623844146728516, 45.45670700073242, 47.28956985473633, 49.1224365234375, 50.955299377441406, 52.78816223144531, 54.62102508544922, 56.45389175415039, 58.2867546081543, 60.1196174621582, 61.95248031616211, 63.78534698486328, 65.61820983886719]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 10.0, 9.0, 12.0, 10.0, 16.0, 13.0, 15.0, 12.0, 25.0, 18.0, 22.0, 27.0, 30.0, 36.0, 31.0, 30.0, 38.0, 45.0, 37.0, 35.0, 32.0, 30.0, 37.0, 48.0, 43.0, 36.0, 26.0, 22.0, 24.0, 22.0, 29.0, 24.0, 20.0, 14.0, 18.0, 20.0, 16.0, 9.0, 12.0, 9.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-57.952789306640625, -56.12928009033203, -54.30577087402344, -52.482261657714844, -50.65875244140625, -48.835243225097656, -47.01173400878906, -45.188228607177734, -43.36471939086914, -41.54121017456055, -39.71770095825195, -37.89419174194336, -36.070682525634766, -34.24717712402344, -32.423667907714844, -30.60015869140625, -28.776647567749023, -26.95313835144043, -25.129629135131836, -23.306121826171875, -21.48261260986328, -19.659103393554688, -17.835594177246094, -16.0120849609375, -14.188576698303223, -12.365067481994629, -10.541559219360352, -8.718050003051758, -6.894541263580322, -5.071032524108887, -3.247523307800293, -1.4240150451660156, 0.3994941711425781, 2.2230029106140137, 4.046511650085449, 5.870020866394043, 7.6935296058654785, 9.517038345336914, 11.340547561645508, 13.164055824279785, 14.987565040588379, 16.811073303222656, 18.63458251953125, 20.458091735839844, 22.281600952148438, 24.10511016845703, 25.928619384765625, 27.752126693725586, 29.57563591003418, 31.399145126342773, 33.222652435302734, 35.04616165161133, 36.86967086791992, 38.693180084228516, 40.51668930053711, 42.3401985168457, 44.1637077331543, 45.98721694946289, 47.810726165771484, 49.63423538208008, 51.45774459838867, 53.28125, 55.104759216308594, 56.92826843261719, 58.75177764892578]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 6.0, 9.0, 7.0, 12.0, 16.0, 41.0, 56.0, 114.0, 171.0, 276.0, 518.0, 845.0, 1430.0, 2432.0, 3982.0, 6618.0, 11230.0, 18183.0, 29285.0, 47799.0, 75373.0, 115975.0, 171795.0, 244658.0, 327657.0, 406329.0, 464337.0, 480116.0, 448525.0, 383491.0, 300464.0, 221609.0, 154049.0, 102335.0, 66236.0, 41896.0, 26034.0, 16115.0, 9533.0, 6024.0, 3466.0, 2147.0, 1237.0, 791.0, 462.0, 261.0, 158.0, 80.0, 50.0, 26.0, 9.0, 9.0, 7.0, 7.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0], "bins": [-46.3125, -44.83544921875, -43.3583984375, -41.88134765625, -40.404296875, -38.92724609375, -37.4501953125, -35.97314453125, -34.49609375, -33.01904296875, -31.5419921875, -30.06494140625, -28.587890625, -27.11083984375, -25.6337890625, -24.15673828125, -22.6796875, -21.20263671875, -19.7255859375, -18.24853515625, -16.771484375, -15.29443359375, -13.8173828125, -12.34033203125, -10.86328125, -9.38623046875, -7.9091796875, -6.43212890625, -4.955078125, -3.47802734375, -2.0009765625, -0.52392578125, 0.953125, 2.43017578125, 3.9072265625, 5.38427734375, 6.861328125, 8.33837890625, 9.8154296875, 11.29248046875, 12.76953125, 14.24658203125, 15.7236328125, 17.20068359375, 18.677734375, 20.15478515625, 21.6318359375, 23.10888671875, 24.5859375, 26.06298828125, 27.5400390625, 29.01708984375, 30.494140625, 31.97119140625, 33.4482421875, 34.92529296875, 36.40234375, 37.87939453125, 39.3564453125, 40.83349609375, 42.310546875, 43.78759765625, 45.2646484375, 46.74169921875, 48.21875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 8.0, 9.0, 11.0, 14.0, 13.0, 15.0, 9.0, 20.0, 20.0, 20.0, 18.0, 32.0, 31.0, 24.0, 35.0, 37.0, 36.0, 44.0, 36.0, 38.0, 25.0, 36.0, 35.0, 52.0, 37.0, 32.0, 37.0, 23.0, 21.0, 23.0, 25.0, 22.0, 19.0, 16.0, 19.0, 17.0, 20.0, 8.0, 12.0, 10.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-48.96875, -47.3779296875, -45.787109375, -44.1962890625, -42.60546875, -41.0146484375, -39.423828125, -37.8330078125, -36.2421875, -34.6513671875, -33.060546875, -31.4697265625, -29.87890625, -28.2880859375, -26.697265625, -25.1064453125, -23.515625, -21.9248046875, -20.333984375, -18.7431640625, -17.15234375, -15.5615234375, -13.970703125, -12.3798828125, -10.7890625, -9.1982421875, -7.607421875, -6.0166015625, -4.42578125, -2.8349609375, -1.244140625, 0.3466796875, 1.9375, 3.5283203125, 5.119140625, 6.7099609375, 8.30078125, 9.8916015625, 11.482421875, 13.0732421875, 14.6640625, 16.2548828125, 17.845703125, 19.4365234375, 21.02734375, 22.6181640625, 24.208984375, 25.7998046875, 27.390625, 28.9814453125, 30.572265625, 32.1630859375, 33.75390625, 35.3447265625, 36.935546875, 38.5263671875, 40.1171875, 41.7080078125, 43.298828125, 44.8896484375, 46.48046875, 48.0712890625, 49.662109375, 51.2529296875, 52.84375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 6.0, 5.0, 12.0, 18.0, 41.0, 39.0, 75.0, 123.0, 193.0, 360.0, 598.0, 1028.0, 1830.0, 2987.0, 5234.0, 8709.0, 14719.0, 24372.0, 39141.0, 62090.0, 95903.0, 142267.0, 203593.0, 273915.0, 347688.0, 412171.0, 447502.0, 448860.0, 413315.0, 352027.0, 278462.0, 206765.0, 145842.0, 98444.0, 64030.0, 40405.0, 24981.0, 14831.0, 8919.0, 5273.0, 3100.0, 1875.0, 1003.0, 621.0, 403.0, 215.0, 113.0, 81.0, 44.0, 21.0, 23.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-52.25, -50.66796875, -49.0859375, -47.50390625, -45.921875, -44.33984375, -42.7578125, -41.17578125, -39.59375, -38.01171875, -36.4296875, -34.84765625, -33.265625, -31.68359375, -30.1015625, -28.51953125, -26.9375, -25.35546875, -23.7734375, -22.19140625, -20.609375, -19.02734375, -17.4453125, -15.86328125, -14.28125, -12.69921875, -11.1171875, -9.53515625, -7.953125, -6.37109375, -4.7890625, -3.20703125, -1.625, -0.04296875, 1.5390625, 3.12109375, 4.703125, 6.28515625, 7.8671875, 9.44921875, 11.03125, 12.61328125, 14.1953125, 15.77734375, 17.359375, 18.94140625, 20.5234375, 22.10546875, 23.6875, 25.26953125, 26.8515625, 28.43359375, 30.015625, 31.59765625, 33.1796875, 34.76171875, 36.34375, 37.92578125, 39.5078125, 41.08984375, 42.671875, 44.25390625, 45.8359375, 47.41796875, 49.0]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 5.0, 5.0, 12.0, 19.0, 15.0, 17.0, 23.0, 32.0, 36.0, 40.0, 61.0, 70.0, 92.0, 87.0, 102.0, 132.0, 132.0, 143.0, 167.0, 183.0, 187.0, 176.0, 192.0, 185.0, 160.0, 207.0, 170.0, 165.0, 148.0, 154.0, 135.0, 117.0, 119.0, 86.0, 84.0, 73.0, 80.0, 61.0, 38.0, 38.0, 31.0, 17.0, 11.0, 13.0, 11.0, 7.0, 11.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-21.90625, -21.189697265625, -20.47314453125, -19.756591796875, -19.0400390625, -18.323486328125, -17.60693359375, -16.890380859375, -16.173828125, -15.457275390625, -14.74072265625, -14.024169921875, -13.3076171875, -12.591064453125, -11.87451171875, -11.157958984375, -10.44140625, -9.724853515625, -9.00830078125, -8.291748046875, -7.5751953125, -6.858642578125, -6.14208984375, -5.425537109375, -4.708984375, -3.992431640625, -3.27587890625, -2.559326171875, -1.8427734375, -1.126220703125, -0.40966796875, 0.306884765625, 1.0234375, 1.739990234375, 2.45654296875, 3.173095703125, 3.8896484375, 4.606201171875, 5.32275390625, 6.039306640625, 6.755859375, 7.472412109375, 8.18896484375, 8.905517578125, 9.6220703125, 10.338623046875, 11.05517578125, 11.771728515625, 12.48828125, 13.204833984375, 13.92138671875, 14.637939453125, 15.3544921875, 16.071044921875, 16.78759765625, 17.504150390625, 18.220703125, 18.937255859375, 19.65380859375, 20.370361328125, 21.0869140625, 21.803466796875, 22.52001953125, 23.236572265625, 23.953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 7.0, 7.0, 13.0, 10.0, 18.0, 17.0, 9.0, 15.0, 25.0, 28.0, 32.0, 36.0, 36.0, 41.0, 38.0, 43.0, 42.0, 45.0, 46.0, 54.0, 49.0, 43.0, 26.0, 32.0, 42.0, 29.0, 30.0, 16.0, 25.0, 22.0, 21.0, 18.0, 13.0, 11.0, 19.0, 8.0, 5.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.52864074707031, -57.64255905151367, -55.75647735595703, -53.870399475097656, -51.984317779541016, -50.098236083984375, -48.212154388427734, -46.326072692871094, -44.43999099731445, -42.55390930175781, -40.66782760620117, -38.78174591064453, -36.895668029785156, -35.009586334228516, -33.123504638671875, -31.237422943115234, -29.351343154907227, -27.465261459350586, -25.579181671142578, -23.693099975585938, -21.807018280029297, -19.920936584472656, -18.03485679626465, -16.148775100708008, -14.262694358825684, -12.37661361694336, -10.490531921386719, -8.604451179504395, -6.718369960784912, -4.83228874206543, -2.9462080001831055, -1.0601263046264648, 0.8259544372558594, 2.712035655975342, 4.598116874694824, 6.484197616577148, 8.370279312133789, 10.256360054016113, 12.142440795898438, 14.028522491455078, 15.914603233337402, 17.800683975219727, 19.686765670776367, 21.572845458984375, 23.458927154541016, 25.345008850097656, 27.231090545654297, 29.117172241210938, 31.003252029418945, 32.88933181762695, 34.775413513183594, 36.661495208740234, 38.547576904296875, 40.433658599853516, 42.319740295410156, 44.20581817626953, 46.09189987182617, 47.97798156738281, 49.86406326293945, 51.750144958496094, 53.63622283935547, 55.52230453491211, 57.40838623046875, 59.29446792602539, 61.18054962158203]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 6.0, 10.0, 12.0, 21.0, 17.0, 21.0, 18.0, 21.0, 26.0, 34.0, 35.0, 25.0, 49.0, 34.0, 36.0, 36.0, 48.0, 48.0, 48.0, 23.0, 33.0, 30.0, 29.0, 40.0, 31.0, 30.0, 37.0, 20.0, 21.0, 26.0, 17.0, 22.0, 14.0, 10.0, 9.0, 12.0, 7.0, 4.0, 2.0, 11.0, 4.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-64.69147491455078, -62.7783203125, -60.86516571044922, -58.95201110839844, -57.038856506347656, -55.125701904296875, -53.21254348754883, -51.29938888549805, -49.386234283447266, -47.473079681396484, -45.5599250793457, -43.64677047729492, -41.733612060546875, -39.820457458496094, -37.90730285644531, -35.99414825439453, -34.08099365234375, -32.16783905029297, -30.254684448242188, -28.341527938842773, -26.428373336791992, -24.51521873474121, -22.602062225341797, -20.688907623291016, -18.775753021240234, -16.862598419189453, -14.949442863464355, -13.036287307739258, -11.123132705688477, -9.209978103637695, -7.296822547912598, -5.3836669921875, -3.4705162048339844, -1.557361125946045, 0.35579395294189453, 2.268949031829834, 4.182104110717773, 6.095258712768555, 8.008414268493652, 9.92156982421875, 11.834724426269531, 13.747879028320312, 15.66103458404541, 17.574190139770508, 19.48734474182129, 21.40049934387207, 23.313655853271484, 25.226810455322266, 27.139965057373047, 29.053119659423828, 30.96627426147461, 32.87942886352539, 34.79258728027344, 36.70574188232422, 38.618896484375, 40.53205108642578, 42.44520568847656, 44.358360290527344, 46.271514892578125, 48.184669494628906, 50.09782409667969, 52.01097869873047, 53.924137115478516, 55.8372917175293, 57.75044631958008]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 9.0, 10.0, 15.0, 21.0, 42.0, 52.0, 110.0, 204.0, 287.0, 446.0, 667.0, 1074.0, 1732.0, 2695.0, 4164.0, 6549.0, 9802.0, 14721.0, 21784.0, 31119.0, 43144.0, 56914.0, 72665.0, 87571.0, 98149.0, 103846.0, 101154.0, 92112.0, 77995.0, 62614.0, 47788.0, 34640.0, 24810.0, 17211.0, 11566.0, 7461.0, 4902.0, 3037.0, 2011.0, 1298.0, 807.0, 497.0, 305.0, 206.0, 139.0, 88.0, 50.0, 31.0, 23.0, 7.0, 8.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-18.328125, -17.74951171875, -17.1708984375, -16.59228515625, -16.013671875, -15.43505859375, -14.8564453125, -14.27783203125, -13.69921875, -13.12060546875, -12.5419921875, -11.96337890625, -11.384765625, -10.80615234375, -10.2275390625, -9.64892578125, -9.0703125, -8.49169921875, -7.9130859375, -7.33447265625, -6.755859375, -6.17724609375, -5.5986328125, -5.02001953125, -4.44140625, -3.86279296875, -3.2841796875, -2.70556640625, -2.126953125, -1.54833984375, -0.9697265625, -0.39111328125, 0.1875, 0.76611328125, 1.3447265625, 1.92333984375, 2.501953125, 3.08056640625, 3.6591796875, 4.23779296875, 4.81640625, 5.39501953125, 5.9736328125, 6.55224609375, 7.130859375, 7.70947265625, 8.2880859375, 8.86669921875, 9.4453125, 10.02392578125, 10.6025390625, 11.18115234375, 11.759765625, 12.33837890625, 12.9169921875, 13.49560546875, 14.07421875, 14.65283203125, 15.2314453125, 15.81005859375, 16.388671875, 16.96728515625, 17.5458984375, 18.12451171875, 18.703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 8.0, 13.0, 18.0, 19.0, 21.0, 20.0, 19.0, 22.0, 35.0, 33.0, 27.0, 52.0, 30.0, 36.0, 40.0, 38.0, 54.0, 44.0, 29.0, 26.0, 36.0, 30.0, 37.0, 34.0, 24.0, 40.0, 23.0, 21.0, 24.0, 20.0, 16.0, 21.0, 9.0, 9.0, 14.0, 3.0, 7.0, 3.0, 4.0, 11.0, 0.0, 1.0, 4.0, 1.0, 4.0, 0.0, 2.0], "bins": [-65.375, -63.4619140625, -61.548828125, -59.6357421875, -57.72265625, -55.8095703125, -53.896484375, -51.9833984375, -50.0703125, -48.1572265625, -46.244140625, -44.3310546875, -42.41796875, -40.5048828125, -38.591796875, -36.6787109375, -34.765625, -32.8525390625, -30.939453125, -29.0263671875, -27.11328125, -25.2001953125, -23.287109375, -21.3740234375, -19.4609375, -17.5478515625, -15.634765625, -13.7216796875, -11.80859375, -9.8955078125, -7.982421875, -6.0693359375, -4.15625, -2.2431640625, -0.330078125, 1.5830078125, 3.49609375, 5.4091796875, 7.322265625, 9.2353515625, 11.1484375, 13.0615234375, 14.974609375, 16.8876953125, 18.80078125, 20.7138671875, 22.626953125, 24.5400390625, 26.453125, 28.3662109375, 30.279296875, 32.1923828125, 34.10546875, 36.0185546875, 37.931640625, 39.8447265625, 41.7578125, 43.6708984375, 45.583984375, 47.4970703125, 49.41015625, 51.3232421875, 53.236328125, 55.1494140625, 57.0625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 13.0, 13.0, 15.0, 29.0, 20.0, 47.0, 68.0, 115.0, 166.0, 271.0, 439.0, 714.0, 1163.0, 1796.0, 3071.0, 5055.0, 8535.0, 14536.0, 24678.0, 65859.0, 822944.0, 44245.0, 22326.0, 12982.0, 7681.0, 4560.0, 2755.0, 1676.0, 1004.0, 679.0, 361.0, 249.0, 153.0, 108.0, 62.0, 43.0, 32.0, 29.0, 17.0, 13.0, 10.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.75, -62.75146484375, -60.7529296875, -58.75439453125, -56.755859375, -54.75732421875, -52.7587890625, -50.76025390625, -48.76171875, -46.76318359375, -44.7646484375, -42.76611328125, -40.767578125, -38.76904296875, -36.7705078125, -34.77197265625, -32.7734375, -30.77490234375, -28.7763671875, -26.77783203125, -24.779296875, -22.78076171875, -20.7822265625, -18.78369140625, -16.78515625, -14.78662109375, -12.7880859375, -10.78955078125, -8.791015625, -6.79248046875, -4.7939453125, -2.79541015625, -0.796875, 1.20166015625, 3.2001953125, 5.19873046875, 7.197265625, 9.19580078125, 11.1943359375, 13.19287109375, 15.19140625, 17.18994140625, 19.1884765625, 21.18701171875, 23.185546875, 25.18408203125, 27.1826171875, 29.18115234375, 31.1796875, 33.17822265625, 35.1767578125, 37.17529296875, 39.173828125, 41.17236328125, 43.1708984375, 45.16943359375, 47.16796875, 49.16650390625, 51.1650390625, 53.16357421875, 55.162109375, 57.16064453125, 59.1591796875, 61.15771484375, 63.15625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [8.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 7.0, 3.0, 5.0, 12.0, 12.0, 16.0, 20.0, 20.0, 15.0, 15.0, 16.0, 33.0, 22.0, 32.0, 33.0, 28.0, 31.0, 42.0, 46.0, 42.0, 39.0, 36.0, 44.0, 46.0, 29.0, 36.0, 34.0, 31.0, 35.0, 24.0, 36.0, 11.0, 23.0, 16.0, 16.0, 15.0, 14.0, 11.0, 13.0, 8.0, 4.0, 10.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-36.5, -35.20703125, -33.9140625, -32.62109375, -31.328125, -30.03515625, -28.7421875, -27.44921875, -26.15625, -24.86328125, -23.5703125, -22.27734375, -20.984375, -19.69140625, -18.3984375, -17.10546875, -15.8125, -14.51953125, -13.2265625, -11.93359375, -10.640625, -9.34765625, -8.0546875, -6.76171875, -5.46875, -4.17578125, -2.8828125, -1.58984375, -0.296875, 0.99609375, 2.2890625, 3.58203125, 4.875, 6.16796875, 7.4609375, 8.75390625, 10.046875, 11.33984375, 12.6328125, 13.92578125, 15.21875, 16.51171875, 17.8046875, 19.09765625, 20.390625, 21.68359375, 22.9765625, 24.26953125, 25.5625, 26.85546875, 28.1484375, 29.44140625, 30.734375, 32.02734375, 33.3203125, 34.61328125, 35.90625, 37.19921875, 38.4921875, 39.78515625, 41.078125, 42.37109375, 43.6640625, 44.95703125, 46.25]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 6.0, 5.0, 6.0, 13.0, 16.0, 20.0, 20.0, 28.0, 30.0, 54.0, 55.0, 85.0, 135.0, 197.0, 307.0, 415.0, 587.0, 875.0, 1283.0, 1981.0, 3019.0, 4365.0, 6915.0, 10843.0, 18394.0, 34143.0, 428441.0, 451171.0, 35013.0, 18489.0, 11139.0, 6921.0, 4500.0, 2956.0, 1949.0, 1310.0, 900.0, 582.0, 412.0, 292.0, 216.0, 153.0, 93.0, 56.0, 37.0, 31.0, 28.0, 22.0, 21.0, 10.0, 6.0, 6.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.021484375, -2.924041748046875, -2.82659912109375, -2.729156494140625, -2.6317138671875, -2.534271240234375, -2.43682861328125, -2.339385986328125, -2.241943359375, -2.144500732421875, -2.04705810546875, -1.949615478515625, -1.8521728515625, -1.754730224609375, -1.65728759765625, -1.559844970703125, -1.46240234375, -1.364959716796875, -1.26751708984375, -1.170074462890625, -1.0726318359375, -0.975189208984375, -0.87774658203125, -0.780303955078125, -0.682861328125, -0.585418701171875, -0.48797607421875, -0.390533447265625, -0.2930908203125, -0.195648193359375, -0.09820556640625, -0.000762939453125, 0.0966796875, 0.194122314453125, 0.29156494140625, 0.389007568359375, 0.4864501953125, 0.583892822265625, 0.68133544921875, 0.778778076171875, 0.876220703125, 0.973663330078125, 1.07110595703125, 1.168548583984375, 1.2659912109375, 1.363433837890625, 1.46087646484375, 1.558319091796875, 1.65576171875, 1.753204345703125, 1.85064697265625, 1.948089599609375, 2.0455322265625, 2.142974853515625, 2.24041748046875, 2.337860107421875, 2.435302734375, 2.532745361328125, 2.63018798828125, 2.727630615234375, 2.8250732421875, 2.922515869140625, 3.01995849609375, 3.117401123046875, 3.21484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 5.0, 3.0, 10.0, 8.0, 11.0, 16.0, 13.0, 20.0, 38.0, 41.0, 43.0, 49.0, 49.0, 70.0, 67.0, 55.0, 72.0, 68.0, 66.0, 60.0, 49.0, 34.0, 32.0, 21.0, 20.0, 19.0, 14.0, 6.0, 7.0, 8.0, 2.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0006780624389648438, -0.0006585270166397095, -0.0006389915943145752, -0.0006194561719894409, -0.0005999207496643066, -0.0005803853273391724, -0.0005608499050140381, -0.0005413144826889038, -0.0005217790603637695, -0.0005022436380386353, -0.000482708215713501, -0.0004631727933883667, -0.0004436373710632324, -0.00042410194873809814, -0.00040456652641296387, -0.0003850311040878296, -0.0003654956817626953, -0.00034596025943756104, -0.00032642483711242676, -0.0003068894147872925, -0.0002873539924621582, -0.0002678185701370239, -0.00024828314781188965, -0.00022874772548675537, -0.0002092123031616211, -0.00018967688083648682, -0.00017014145851135254, -0.00015060603618621826, -0.00013107061386108398, -0.00011153519153594971, -9.199976921081543e-05, -7.246434688568115e-05, -5.2928924560546875e-05, -3.33935022354126e-05, -1.385807991027832e-05, 5.677342414855957e-06, 2.5212764739990234e-05, 4.474818706512451e-05, 6.428360939025879e-05, 8.381903171539307e-05, 0.00010335445404052734, 0.00012288987636566162, 0.0001424252986907959, 0.00016196072101593018, 0.00018149614334106445, 0.00020103156566619873, 0.000220566987991333, 0.00024010241031646729, 0.00025963783264160156, 0.00027917325496673584, 0.0002987086772918701, 0.0003182440996170044, 0.00033777952194213867, 0.00035731494426727295, 0.0003768503665924072, 0.0003963857889175415, 0.0004159212112426758, 0.00043545663356781006, 0.00045499205589294434, 0.0004745274782180786, 0.0004940629005432129, 0.0005135983228683472, 0.0005331337451934814, 0.0005526691675186157, 0.00057220458984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 9.0, 17.0, 23.0, 42.0, 58.0, 122.0, 160.0, 317.0, 476.0, 899.0, 1422.0, 2460.0, 4068.0, 7191.0, 12502.0, 21338.0, 36166.0, 58505.0, 87191.0, 118613.0, 141771.0, 146817.0, 130243.0, 100603.0, 69246.0, 44349.0, 26678.0, 15494.0, 8971.0, 5285.0, 3039.0, 1759.0, 1077.0, 636.0, 409.0, 240.0, 131.0, 81.0, 54.0, 38.0, 14.0, 18.0, 11.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.57421875, -2.491729736328125, -2.40924072265625, -2.326751708984375, -2.2442626953125, -2.161773681640625, -2.07928466796875, -1.996795654296875, -1.914306640625, -1.831817626953125, -1.74932861328125, -1.666839599609375, -1.5843505859375, -1.501861572265625, -1.41937255859375, -1.336883544921875, -1.25439453125, -1.171905517578125, -1.08941650390625, -1.006927490234375, -0.9244384765625, -0.841949462890625, -0.75946044921875, -0.676971435546875, -0.594482421875, -0.511993408203125, -0.42950439453125, -0.347015380859375, -0.2645263671875, -0.182037353515625, -0.09954833984375, -0.017059326171875, 0.0654296875, 0.147918701171875, 0.23040771484375, 0.312896728515625, 0.3953857421875, 0.477874755859375, 0.56036376953125, 0.642852783203125, 0.725341796875, 0.807830810546875, 0.89031982421875, 0.972808837890625, 1.0552978515625, 1.137786865234375, 1.22027587890625, 1.302764892578125, 1.38525390625, 1.467742919921875, 1.55023193359375, 1.632720947265625, 1.7152099609375, 1.797698974609375, 1.88018798828125, 1.962677001953125, 2.045166015625, 2.127655029296875, 2.21014404296875, 2.292633056640625, 2.3751220703125, 2.457611083984375, 2.54010009765625, 2.622589111328125, 2.705078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 4.0, 7.0, 15.0, 14.0, 18.0, 19.0, 34.0, 45.0, 40.0, 63.0, 56.0, 77.0, 63.0, 70.0, 67.0, 58.0, 58.0, 62.0, 46.0, 32.0, 30.0, 30.0, 14.0, 14.0, 11.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3828125, -1.342437744140625, -1.30206298828125, -1.261688232421875, -1.2213134765625, -1.180938720703125, -1.14056396484375, -1.100189208984375, -1.059814453125, -1.019439697265625, -0.97906494140625, -0.938690185546875, -0.8983154296875, -0.857940673828125, -0.81756591796875, -0.777191162109375, -0.73681640625, -0.696441650390625, -0.65606689453125, -0.615692138671875, -0.5753173828125, -0.534942626953125, -0.49456787109375, -0.454193115234375, -0.413818359375, -0.373443603515625, -0.33306884765625, -0.292694091796875, -0.2523193359375, -0.211944580078125, -0.17156982421875, -0.131195068359375, -0.0908203125, -0.050445556640625, -0.01007080078125, 0.030303955078125, 0.0706787109375, 0.111053466796875, 0.15142822265625, 0.191802978515625, 0.232177734375, 0.272552490234375, 0.31292724609375, 0.353302001953125, 0.3936767578125, 0.434051513671875, 0.47442626953125, 0.514801025390625, 0.55517578125, 0.595550537109375, 0.63592529296875, 0.676300048828125, 0.7166748046875, 0.757049560546875, 0.79742431640625, 0.837799072265625, 0.878173828125, 0.918548583984375, 0.95892333984375, 0.999298095703125, 1.0396728515625, 1.080047607421875, 1.12042236328125, 1.160797119140625, 1.201171875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 6.0, 9.0, 6.0, 6.0, 8.0, 14.0, 14.0, 19.0, 26.0, 13.0, 29.0, 21.0, 42.0, 37.0, 29.0, 40.0, 49.0, 32.0, 48.0, 41.0, 48.0, 54.0, 37.0, 40.0, 32.0, 25.0, 36.0, 33.0, 31.0, 16.0, 21.0, 19.0, 20.0, 19.0, 14.0, 17.0, 11.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.30906295776367, -57.45502471923828, -55.600990295410156, -53.746952056884766, -51.89291763305664, -50.03887939453125, -48.184844970703125, -46.330806732177734, -44.476768493652344, -42.62273025512695, -40.76869583129883, -38.91465759277344, -37.06062316894531, -35.20658493041992, -33.35254669189453, -31.498512268066406, -29.64447593688965, -27.79043960571289, -25.936403274536133, -24.082366943359375, -22.228328704833984, -20.374292373657227, -18.52025604248047, -16.666217803955078, -14.812182426452637, -12.958146095275879, -11.104108810424805, -9.250072479248047, -7.396035671234131, -5.541998863220215, -3.687962532043457, -1.8339252471923828, 0.020111083984375, 1.8741477727890015, 3.728184461593628, 5.582221031188965, 7.436257839202881, 9.290294647216797, 11.144330978393555, 12.998368263244629, 14.852404594421387, 16.70644187927246, 18.56047821044922, 20.414514541625977, 22.268550872802734, 24.122589111328125, 25.97662353515625, 27.83066177368164, 29.6846981048584, 31.538734436035156, 33.39277267456055, 35.24680709838867, 37.10084533691406, 38.95487976074219, 40.80891799926758, 42.66295623779297, 44.516990661621094, 46.371028900146484, 48.22506332397461, 50.0791015625, 51.933135986328125, 53.787174224853516, 55.641212463378906, 57.49524688720703, 59.34928512573242]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 9.0, 5.0, 8.0, 14.0, 14.0, 19.0, 19.0, 22.0, 21.0, 22.0, 33.0, 30.0, 33.0, 40.0, 38.0, 34.0, 40.0, 42.0, 52.0, 44.0, 35.0, 23.0, 37.0, 28.0, 37.0, 35.0, 25.0, 37.0, 25.0, 21.0, 25.0, 25.0, 11.0, 23.0, 7.0, 12.0, 12.0, 6.0, 8.0, 1.0, 7.0, 7.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-66.13524627685547, -64.21019744873047, -62.28514099121094, -60.36009216308594, -58.43503952026367, -56.509986877441406, -54.584938049316406, -52.65988540649414, -50.734832763671875, -48.80978012084961, -46.884727478027344, -44.959678649902344, -43.03462600708008, -41.10957336425781, -39.18452453613281, -37.25947189331055, -35.33441925048828, -33.409366607666016, -31.484315872192383, -29.55926513671875, -27.634212493896484, -25.70915985107422, -23.784109115600586, -21.859058380126953, -19.934005737304688, -18.008953094482422, -16.08390235900879, -14.15885066986084, -12.23379898071289, -10.308747291564941, -8.383695602416992, -6.458643913269043, -4.533588409423828, -2.608536720275879, -0.6834850311279297, 1.2415666580200195, 3.1666183471679688, 5.091670036315918, 7.016721725463867, 8.941773414611816, 10.866825103759766, 12.791876792907715, 14.716928482055664, 16.641979217529297, 18.567031860351562, 20.492084503173828, 22.41713523864746, 24.342185974121094, 26.26723861694336, 28.192291259765625, 30.117341995239258, 32.04239273071289, 33.967445373535156, 35.89249801635742, 37.81755065917969, 39.74259948730469, 41.66765213012695, 43.59270477294922, 45.51775360107422, 47.442806243896484, 49.36785888671875, 51.292911529541016, 53.21796417236328, 55.14301300048828, 57.06806564331055]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 12.0, 15.0, 16.0, 33.0, 49.0, 95.0, 162.0, 254.0, 468.0, 770.0, 1227.0, 2063.0, 3467.0, 5427.0, 8808.0, 13491.0, 20254.0, 29931.0, 41901.0, 56631.0, 72347.0, 87351.0, 98721.0, 104176.0, 102123.0, 94705.0, 80175.0, 65328.0, 50269.0, 36078.0, 25508.0, 17168.0, 11135.0, 7174.0, 4477.0, 2629.0, 1563.0, 1021.0, 609.0, 347.0, 220.0, 126.0, 85.0, 47.0, 39.0, 18.0, 19.0, 7.0, 7.0, 6.0, 3.0, 3.0], "bins": [-51.625, -50.18212890625, -48.7392578125, -47.29638671875, -45.853515625, -44.41064453125, -42.9677734375, -41.52490234375, -40.08203125, -38.63916015625, -37.1962890625, -35.75341796875, -34.310546875, -32.86767578125, -31.4248046875, -29.98193359375, -28.5390625, -27.09619140625, -25.6533203125, -24.21044921875, -22.767578125, -21.32470703125, -19.8818359375, -18.43896484375, -16.99609375, -15.55322265625, -14.1103515625, -12.66748046875, -11.224609375, -9.78173828125, -8.3388671875, -6.89599609375, -5.453125, -4.01025390625, -2.5673828125, -1.12451171875, 0.318359375, 1.76123046875, 3.2041015625, 4.64697265625, 6.08984375, 7.53271484375, 8.9755859375, 10.41845703125, 11.861328125, 13.30419921875, 14.7470703125, 16.18994140625, 17.6328125, 19.07568359375, 20.5185546875, 21.96142578125, 23.404296875, 24.84716796875, 26.2900390625, 27.73291015625, 29.17578125, 30.61865234375, 32.0615234375, 33.50439453125, 34.947265625, 36.39013671875, 37.8330078125, 39.27587890625, 40.71875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 7.0, 10.0, 5.0, 8.0, 13.0, 17.0, 18.0, 15.0, 23.0, 26.0, 20.0, 31.0, 31.0, 33.0, 46.0, 33.0, 41.0, 35.0, 38.0, 54.0, 48.0, 32.0, 29.0, 34.0, 27.0, 43.0, 31.0, 24.0, 36.0, 25.0, 24.0, 23.0, 21.0, 15.0, 17.0, 8.0, 13.0, 11.0, 7.0, 6.0, 2.0, 9.0, 5.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-63.90625, -62.03857421875, -60.1708984375, -58.30322265625, -56.435546875, -54.56787109375, -52.7001953125, -50.83251953125, -48.96484375, -47.09716796875, -45.2294921875, -43.36181640625, -41.494140625, -39.62646484375, -37.7587890625, -35.89111328125, -34.0234375, -32.15576171875, -30.2880859375, -28.42041015625, -26.552734375, -24.68505859375, -22.8173828125, -20.94970703125, -19.08203125, -17.21435546875, -15.3466796875, -13.47900390625, -11.611328125, -9.74365234375, -7.8759765625, -6.00830078125, -4.140625, -2.27294921875, -0.4052734375, 1.46240234375, 3.330078125, 5.19775390625, 7.0654296875, 8.93310546875, 10.80078125, 12.66845703125, 14.5361328125, 16.40380859375, 18.271484375, 20.13916015625, 22.0068359375, 23.87451171875, 25.7421875, 27.60986328125, 29.4775390625, 31.34521484375, 33.212890625, 35.08056640625, 36.9482421875, 38.81591796875, 40.68359375, 42.55126953125, 44.4189453125, 46.28662109375, 48.154296875, 50.02197265625, 51.8896484375, 53.75732421875, 55.625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 14.0, 19.0, 28.0, 42.0, 71.0, 109.0, 225.0, 400.0, 653.0, 1157.0, 2127.0, 3751.0, 6469.0, 11028.0, 18452.0, 29698.0, 45634.0, 66206.0, 88613.0, 109342.0, 122416.0, 123803.0, 113711.0, 95141.0, 72251.0, 51625.0, 33926.0, 21354.0, 12700.0, 7534.0, 4322.0, 2441.0, 1436.0, 809.0, 460.0, 244.0, 118.0, 93.0, 50.0, 30.0, 21.0, 11.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-59.71875, -57.9697265625, -56.220703125, -54.4716796875, -52.72265625, -50.9736328125, -49.224609375, -47.4755859375, -45.7265625, -43.9775390625, -42.228515625, -40.4794921875, -38.73046875, -36.9814453125, -35.232421875, -33.4833984375, -31.734375, -29.9853515625, -28.236328125, -26.4873046875, -24.73828125, -22.9892578125, -21.240234375, -19.4912109375, -17.7421875, -15.9931640625, -14.244140625, -12.4951171875, -10.74609375, -8.9970703125, -7.248046875, -5.4990234375, -3.75, -2.0009765625, -0.251953125, 1.4970703125, 3.24609375, 4.9951171875, 6.744140625, 8.4931640625, 10.2421875, 11.9912109375, 13.740234375, 15.4892578125, 17.23828125, 18.9873046875, 20.736328125, 22.4853515625, 24.234375, 25.9833984375, 27.732421875, 29.4814453125, 31.23046875, 32.9794921875, 34.728515625, 36.4775390625, 38.2265625, 39.9755859375, 41.724609375, 43.4736328125, 45.22265625, 46.9716796875, 48.720703125, 50.4697265625, 52.21875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 1.0, 7.0, 5.0, 9.0, 8.0, 18.0, 8.0, 13.0, 13.0, 18.0, 21.0, 25.0, 43.0, 45.0, 32.0, 42.0, 42.0, 44.0, 32.0, 45.0, 43.0, 48.0, 40.0, 36.0, 51.0, 46.0, 42.0, 32.0, 20.0, 28.0, 21.0, 20.0, 22.0, 12.0, 15.0, 12.0, 9.0, 5.0, 9.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.4375, -34.1611328125, -32.884765625, -31.6083984375, -30.33203125, -29.0556640625, -27.779296875, -26.5029296875, -25.2265625, -23.9501953125, -22.673828125, -21.3974609375, -20.12109375, -18.8447265625, -17.568359375, -16.2919921875, -15.015625, -13.7392578125, -12.462890625, -11.1865234375, -9.91015625, -8.6337890625, -7.357421875, -6.0810546875, -4.8046875, -3.5283203125, -2.251953125, -0.9755859375, 0.30078125, 1.5771484375, 2.853515625, 4.1298828125, 5.40625, 6.6826171875, 7.958984375, 9.2353515625, 10.51171875, 11.7880859375, 13.064453125, 14.3408203125, 15.6171875, 16.8935546875, 18.169921875, 19.4462890625, 20.72265625, 21.9990234375, 23.275390625, 24.5517578125, 25.828125, 27.1044921875, 28.380859375, 29.6572265625, 30.93359375, 32.2099609375, 33.486328125, 34.7626953125, 36.0390625, 37.3154296875, 38.591796875, 39.8681640625, 41.14453125, 42.4208984375, 43.697265625, 44.9736328125, 46.25]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 11.0, 26.0, 34.0, 57.0, 58.0, 121.0, 203.0, 293.0, 503.0, 857.0, 1322.0, 2229.0, 3670.0, 6008.0, 9759.0, 15776.0, 25028.0, 38276.0, 56786.0, 79037.0, 101597.0, 119689.0, 125760.0, 119399.0, 101764.0, 79075.0, 56686.0, 38493.0, 24879.0, 15709.0, 9812.0, 5992.0, 3702.0, 2404.0, 1351.0, 852.0, 538.0, 310.0, 189.0, 108.0, 81.0, 39.0, 25.0, 18.0, 9.0, 10.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.265625, -20.630859375, -19.99609375, -19.361328125, -18.7265625, -18.091796875, -17.45703125, -16.822265625, -16.1875, -15.552734375, -14.91796875, -14.283203125, -13.6484375, -13.013671875, -12.37890625, -11.744140625, -11.109375, -10.474609375, -9.83984375, -9.205078125, -8.5703125, -7.935546875, -7.30078125, -6.666015625, -6.03125, -5.396484375, -4.76171875, -4.126953125, -3.4921875, -2.857421875, -2.22265625, -1.587890625, -0.953125, -0.318359375, 0.31640625, 0.951171875, 1.5859375, 2.220703125, 2.85546875, 3.490234375, 4.125, 4.759765625, 5.39453125, 6.029296875, 6.6640625, 7.298828125, 7.93359375, 8.568359375, 9.203125, 9.837890625, 10.47265625, 11.107421875, 11.7421875, 12.376953125, 13.01171875, 13.646484375, 14.28125, 14.916015625, 15.55078125, 16.185546875, 16.8203125, 17.455078125, 18.08984375, 18.724609375, 19.359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 0.0, 9.0, 6.0, 11.0, 9.0, 19.0, 26.0, 30.0, 28.0, 29.0, 40.0, 29.0, 35.0, 44.0, 47.0, 39.0, 58.0, 50.0, 52.0, 53.0, 52.0, 48.0, 54.0, 35.0, 30.0, 28.0, 21.0, 13.0, 14.0, 19.0, 13.0, 15.0, 8.0, 13.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027179718017578125, -0.0026380717754364014, -0.0025581717491149902, -0.002478271722793579, -0.002398371696472168, -0.002318471670150757, -0.0022385716438293457, -0.0021586716175079346, -0.0020787715911865234, -0.0019988715648651123, -0.0019189715385437012, -0.00183907151222229, -0.001759171485900879, -0.0016792714595794678, -0.0015993714332580566, -0.0015194714069366455, -0.0014395713806152344, -0.0013596713542938232, -0.0012797713279724121, -0.001199871301651001, -0.0011199712753295898, -0.0010400712490081787, -0.0009601712226867676, -0.0008802711963653564, -0.0008003711700439453, -0.0007204711437225342, -0.000640571117401123, -0.0005606710910797119, -0.0004807710647583008, -0.00040087103843688965, -0.0003209710121154785, -0.00024107098579406738, -0.00016117095947265625, -8.127093315124512e-05, -1.3709068298339844e-06, 7.852911949157715e-05, 0.00015842914581298828, 0.00023832917213439941, 0.00031822919845581055, 0.0003981292247772217, 0.0004780292510986328, 0.0005579292774200439, 0.0006378293037414551, 0.0007177293300628662, 0.0007976293563842773, 0.0008775293827056885, 0.0009574294090270996, 0.0010373294353485107, 0.0011172294616699219, 0.001197129487991333, 0.0012770295143127441, 0.0013569295406341553, 0.0014368295669555664, 0.0015167295932769775, 0.0015966296195983887, 0.0016765296459197998, 0.001756429672241211, 0.001836329698562622, 0.0019162297248840332, 0.0019961297512054443, 0.0020760297775268555, 0.0021559298038482666, 0.0022358298301696777, 0.002315729856491089, 0.0023956298828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 6.0, 10.0, 9.0, 15.0, 24.0, 29.0, 54.0, 79.0, 110.0, 181.0, 239.0, 386.0, 592.0, 894.0, 1309.0, 2182.0, 3423.0, 5398.0, 8586.0, 13496.0, 20716.0, 30839.0, 45531.0, 62592.0, 82705.0, 101267.0, 113885.0, 116311.0, 108279.0, 92450.0, 73503.0, 53948.0, 37497.0, 25511.0, 16645.0, 10920.0, 6888.0, 4310.0, 2761.0, 1780.0, 1084.0, 688.0, 512.0, 318.0, 188.0, 141.0, 74.0, 67.0, 42.0, 27.0, 30.0, 9.0, 7.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.25, -18.61376953125, -17.9775390625, -17.34130859375, -16.705078125, -16.06884765625, -15.4326171875, -14.79638671875, -14.16015625, -13.52392578125, -12.8876953125, -12.25146484375, -11.615234375, -10.97900390625, -10.3427734375, -9.70654296875, -9.0703125, -8.43408203125, -7.7978515625, -7.16162109375, -6.525390625, -5.88916015625, -5.2529296875, -4.61669921875, -3.98046875, -3.34423828125, -2.7080078125, -2.07177734375, -1.435546875, -0.79931640625, -0.1630859375, 0.47314453125, 1.109375, 1.74560546875, 2.3818359375, 3.01806640625, 3.654296875, 4.29052734375, 4.9267578125, 5.56298828125, 6.19921875, 6.83544921875, 7.4716796875, 8.10791015625, 8.744140625, 9.38037109375, 10.0166015625, 10.65283203125, 11.2890625, 11.92529296875, 12.5615234375, 13.19775390625, 13.833984375, 14.47021484375, 15.1064453125, 15.74267578125, 16.37890625, 17.01513671875, 17.6513671875, 18.28759765625, 18.923828125, 19.56005859375, 20.1962890625, 20.83251953125, 21.46875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 10.0, 7.0, 9.0, 12.0, 12.0, 18.0, 14.0, 26.0, 34.0, 28.0, 29.0, 44.0, 43.0, 53.0, 32.0, 40.0, 53.0, 39.0, 45.0, 45.0, 55.0, 37.0, 46.0, 47.0, 37.0, 33.0, 26.0, 25.0, 18.0, 15.0, 10.0, 9.0, 13.0, 14.0, 9.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.8359375, -10.5401611328125, -10.244384765625, -9.9486083984375, -9.65283203125, -9.3570556640625, -9.061279296875, -8.7655029296875, -8.4697265625, -8.1739501953125, -7.878173828125, -7.5823974609375, -7.28662109375, -6.9908447265625, -6.695068359375, -6.3992919921875, -6.103515625, -5.8077392578125, -5.511962890625, -5.2161865234375, -4.92041015625, -4.6246337890625, -4.328857421875, -4.0330810546875, -3.7373046875, -3.4415283203125, -3.145751953125, -2.8499755859375, -2.55419921875, -2.2584228515625, -1.962646484375, -1.6668701171875, -1.37109375, -1.0753173828125, -0.779541015625, -0.4837646484375, -0.18798828125, 0.1077880859375, 0.403564453125, 0.6993408203125, 0.9951171875, 1.2908935546875, 1.586669921875, 1.8824462890625, 2.17822265625, 2.4739990234375, 2.769775390625, 3.0655517578125, 3.361328125, 3.6571044921875, 3.952880859375, 4.2486572265625, 4.54443359375, 4.8402099609375, 5.135986328125, 5.4317626953125, 5.7275390625, 6.0233154296875, 6.319091796875, 6.6148681640625, 6.91064453125, 7.2064208984375, 7.502197265625, 7.7979736328125, 8.09375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 3.0, 9.0, 6.0, 7.0, 10.0, 12.0, 16.0, 17.0, 13.0, 21.0, 14.0, 20.0, 28.0, 29.0, 40.0, 26.0, 30.0, 35.0, 33.0, 45.0, 32.0, 48.0, 36.0, 41.0, 30.0, 36.0, 37.0, 25.0, 40.0, 22.0, 34.0, 32.0, 30.0, 13.0, 15.0, 16.0, 20.0, 12.0, 19.0, 12.0, 5.0, 3.0, 4.0, 2.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-52.6223258972168, -50.923892974853516, -49.2254638671875, -47.52703094482422, -45.82859802246094, -44.130165100097656, -42.431732177734375, -40.73330307006836, -39.03487014770508, -37.3364372253418, -35.63800811767578, -33.9395751953125, -32.24114227294922, -30.542709350585938, -28.84427833557129, -27.14584732055664, -25.44741439819336, -23.748981475830078, -22.05055046081543, -20.35211944580078, -18.6536865234375, -16.95525360107422, -15.25682258605957, -13.558390617370605, -11.85995864868164, -10.161526679992676, -8.463094711303711, -6.764662742614746, -5.066230773925781, -3.3677988052368164, -1.6693668365478516, 0.02906513214111328, 1.7274932861328125, 3.4259252548217773, 5.124357223510742, 6.822789192199707, 8.521221160888672, 10.219653129577637, 11.918085098266602, 13.616517066955566, 15.314949035644531, 17.013381958007812, 18.71181297302246, 20.41024398803711, 22.10867691040039, 23.807109832763672, 25.50554084777832, 27.20397186279297, 28.90240478515625, 30.60083770751953, 32.29927062988281, 33.99769973754883, 35.69613265991211, 37.39456558227539, 39.092994689941406, 40.79142761230469, 42.48986053466797, 44.18829345703125, 45.88672637939453, 47.58515548706055, 49.28358840942383, 50.98202133178711, 52.680450439453125, 54.378883361816406, 56.07731628417969]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 6.0, 9.0, 1.0, 6.0, 6.0, 16.0, 18.0, 15.0, 20.0, 17.0, 16.0, 24.0, 32.0, 28.0, 34.0, 28.0, 34.0, 38.0, 33.0, 36.0, 35.0, 32.0, 43.0, 48.0, 46.0, 39.0, 21.0, 17.0, 29.0, 32.0, 23.0, 27.0, 24.0, 20.0, 22.0, 17.0, 18.0, 11.0, 17.0, 10.0, 9.0, 11.0, 8.0, 10.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0], "bins": [-60.79109191894531, -58.962013244628906, -57.132938385009766, -55.303863525390625, -53.47478485107422, -51.64570617675781, -49.81663131713867, -47.98755645751953, -46.158477783203125, -44.32939910888672, -42.50032424926758, -40.67124938964844, -38.84217071533203, -37.013092041015625, -35.184017181396484, -33.354942321777344, -31.525863647460938, -29.696786880493164, -27.86771011352539, -26.038633346557617, -24.209556579589844, -22.38047981262207, -20.551403045654297, -18.722326278686523, -16.89324951171875, -15.064172744750977, -13.235095977783203, -11.40601921081543, -9.576942443847656, -7.747865676879883, -5.918788909912109, -4.089712142944336, -2.2606353759765625, -0.43155860900878906, 1.3975181579589844, 3.226594924926758, 5.055671691894531, 6.884748458862305, 8.713825225830078, 10.542901992797852, 12.371978759765625, 14.201055526733398, 16.030132293701172, 17.859209060668945, 19.68828582763672, 21.517362594604492, 23.346439361572266, 25.17551612854004, 27.004592895507812, 28.833669662475586, 30.66274642944336, 32.4918212890625, 34.320899963378906, 36.14997863769531, 37.97905349731445, 39.808128356933594, 41.63720703125, 43.466285705566406, 45.29536056518555, 47.12443542480469, 48.953514099121094, 50.7825927734375, 52.61166763305664, 54.44074249267578, 56.26982116699219]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 11.0, 15.0, 16.0, 43.0, 53.0, 110.0, 202.0, 302.0, 560.0, 948.0, 1499.0, 2658.0, 4424.0, 7812.0, 12695.0, 21313.0, 34675.0, 56118.0, 87907.0, 135690.0, 197674.0, 274988.0, 359450.0, 433133.0, 476629.0, 474078.0, 429743.0, 355592.0, 271669.0, 193760.0, 132617.0, 86380.0, 54948.0, 34199.0, 20833.0, 12862.0, 7606.0, 4562.0, 2650.0, 1510.0, 927.0, 585.0, 333.0, 217.0, 109.0, 72.0, 44.0, 24.0, 16.0, 12.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-50.0, -48.48388671875, -46.9677734375, -45.45166015625, -43.935546875, -42.41943359375, -40.9033203125, -39.38720703125, -37.87109375, -36.35498046875, -34.8388671875, -33.32275390625, -31.806640625, -30.29052734375, -28.7744140625, -27.25830078125, -25.7421875, -24.22607421875, -22.7099609375, -21.19384765625, -19.677734375, -18.16162109375, -16.6455078125, -15.12939453125, -13.61328125, -12.09716796875, -10.5810546875, -9.06494140625, -7.548828125, -6.03271484375, -4.5166015625, -3.00048828125, -1.484375, 0.03173828125, 1.5478515625, 3.06396484375, 4.580078125, 6.09619140625, 7.6123046875, 9.12841796875, 10.64453125, 12.16064453125, 13.6767578125, 15.19287109375, 16.708984375, 18.22509765625, 19.7412109375, 21.25732421875, 22.7734375, 24.28955078125, 25.8056640625, 27.32177734375, 28.837890625, 30.35400390625, 31.8701171875, 33.38623046875, 34.90234375, 36.41845703125, 37.9345703125, 39.45068359375, 40.966796875, 42.48291015625, 43.9990234375, 45.51513671875, 47.03125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 8.0, 3.0, 7.0, 14.0, 17.0, 18.0, 17.0, 14.0, 10.0, 35.0, 27.0, 28.0, 37.0, 26.0, 33.0, 32.0, 33.0, 33.0, 42.0, 36.0, 41.0, 40.0, 53.0, 33.0, 26.0, 16.0, 27.0, 34.0, 20.0, 30.0, 23.0, 27.0, 16.0, 16.0, 19.0, 14.0, 16.0, 16.0, 10.0, 9.0, 6.0, 7.0, 10.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0], "bins": [-53.53125, -51.93359375, -50.3359375, -48.73828125, -47.140625, -45.54296875, -43.9453125, -42.34765625, -40.75, -39.15234375, -37.5546875, -35.95703125, -34.359375, -32.76171875, -31.1640625, -29.56640625, -27.96875, -26.37109375, -24.7734375, -23.17578125, -21.578125, -19.98046875, -18.3828125, -16.78515625, -15.1875, -13.58984375, -11.9921875, -10.39453125, -8.796875, -7.19921875, -5.6015625, -4.00390625, -2.40625, -0.80859375, 0.7890625, 2.38671875, 3.984375, 5.58203125, 7.1796875, 8.77734375, 10.375, 11.97265625, 13.5703125, 15.16796875, 16.765625, 18.36328125, 19.9609375, 21.55859375, 23.15625, 24.75390625, 26.3515625, 27.94921875, 29.546875, 31.14453125, 32.7421875, 34.33984375, 35.9375, 37.53515625, 39.1328125, 40.73046875, 42.328125, 43.92578125, 45.5234375, 47.12109375, 48.71875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 8.0, 9.0, 15.0, 21.0, 45.0, 64.0, 87.0, 155.0, 255.0, 443.0, 727.0, 1218.0, 1868.0, 3018.0, 4789.0, 7671.0, 11638.0, 18312.0, 27826.0, 41486.0, 60697.0, 87082.0, 121527.0, 162519.0, 212577.0, 264046.0, 314088.0, 353107.0, 376755.0, 377906.0, 358145.0, 319335.0, 270766.0, 219291.0, 169721.0, 125538.0, 91449.0, 63584.0, 44140.0, 29060.0, 19277.0, 12505.0, 8014.0, 5046.0, 3227.0, 1969.0, 1299.0, 731.0, 498.0, 303.0, 169.0, 109.0, 77.0, 36.0, 24.0, 11.0, 7.0, 5.0, 2.0, 3.0], "bins": [-44.625, -43.275390625, -41.92578125, -40.576171875, -39.2265625, -37.876953125, -36.52734375, -35.177734375, -33.828125, -32.478515625, -31.12890625, -29.779296875, -28.4296875, -27.080078125, -25.73046875, -24.380859375, -23.03125, -21.681640625, -20.33203125, -18.982421875, -17.6328125, -16.283203125, -14.93359375, -13.583984375, -12.234375, -10.884765625, -9.53515625, -8.185546875, -6.8359375, -5.486328125, -4.13671875, -2.787109375, -1.4375, -0.087890625, 1.26171875, 2.611328125, 3.9609375, 5.310546875, 6.66015625, 8.009765625, 9.359375, 10.708984375, 12.05859375, 13.408203125, 14.7578125, 16.107421875, 17.45703125, 18.806640625, 20.15625, 21.505859375, 22.85546875, 24.205078125, 25.5546875, 26.904296875, 28.25390625, 29.603515625, 30.953125, 32.302734375, 33.65234375, 35.001953125, 36.3515625, 37.701171875, 39.05078125, 40.400390625, 41.75]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 13.0, 8.0, 11.0, 17.0, 19.0, 19.0, 20.0, 41.0, 33.0, 59.0, 67.0, 73.0, 93.0, 110.0, 115.0, 123.0, 132.0, 176.0, 167.0, 175.0, 197.0, 202.0, 216.0, 192.0, 212.0, 189.0, 175.0, 157.0, 159.0, 147.0, 127.0, 110.0, 94.0, 99.0, 60.0, 63.0, 36.0, 43.0, 35.0, 24.0, 17.0, 8.0, 14.0, 9.0, 5.0, 5.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.546875, -22.754638671875, -21.96240234375, -21.170166015625, -20.3779296875, -19.585693359375, -18.79345703125, -18.001220703125, -17.208984375, -16.416748046875, -15.62451171875, -14.832275390625, -14.0400390625, -13.247802734375, -12.45556640625, -11.663330078125, -10.87109375, -10.078857421875, -9.28662109375, -8.494384765625, -7.7021484375, -6.909912109375, -6.11767578125, -5.325439453125, -4.533203125, -3.740966796875, -2.94873046875, -2.156494140625, -1.3642578125, -0.572021484375, 0.22021484375, 1.012451171875, 1.8046875, 2.596923828125, 3.38916015625, 4.181396484375, 4.9736328125, 5.765869140625, 6.55810546875, 7.350341796875, 8.142578125, 8.934814453125, 9.72705078125, 10.519287109375, 11.3115234375, 12.103759765625, 12.89599609375, 13.688232421875, 14.48046875, 15.272705078125, 16.06494140625, 16.857177734375, 17.6494140625, 18.441650390625, 19.23388671875, 20.026123046875, 20.818359375, 21.610595703125, 22.40283203125, 23.195068359375, 23.9873046875, 24.779541015625, 25.57177734375, 26.364013671875, 27.15625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 9.0, 8.0, 17.0, 17.0, 17.0, 17.0, 22.0, 17.0, 25.0, 25.0, 27.0, 30.0, 36.0, 35.0, 40.0, 36.0, 50.0, 42.0, 37.0, 39.0, 47.0, 40.0, 33.0, 37.0, 40.0, 31.0, 28.0, 24.0, 21.0, 19.0, 20.0, 15.0, 13.0, 12.0, 11.0, 16.0, 4.0, 6.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-55.089813232421875, -53.33258819580078, -51.57536697387695, -49.818145751953125, -48.06092071533203, -46.30369567871094, -44.54647445678711, -42.78925323486328, -41.03202819824219, -39.274803161621094, -37.517581939697266, -35.76036071777344, -34.003135681152344, -32.24591064453125, -30.488689422607422, -28.73146629333496, -26.9742431640625, -25.21702003479004, -23.459796905517578, -21.702573776245117, -19.945350646972656, -18.188127517700195, -16.430904388427734, -14.673681259155273, -12.916458129882812, -11.159235000610352, -9.40201187133789, -7.64478874206543, -5.887565612792969, -4.130342483520508, -2.373119354248047, -0.6158962249755859, 1.1413230895996094, 2.8985462188720703, 4.655769348144531, 6.412992477416992, 8.170215606689453, 9.927438735961914, 11.684661865234375, 13.441884994506836, 15.199108123779297, 16.956331253051758, 18.71355438232422, 20.47077751159668, 22.22800064086914, 23.9852237701416, 25.742446899414062, 27.499670028686523, 29.256893157958984, 31.014116287231445, 32.771339416503906, 34.528564453125, 36.28578567504883, 38.043006896972656, 39.80023193359375, 41.557456970214844, 43.31467819213867, 45.0718994140625, 46.829124450683594, 48.58634948730469, 50.343570709228516, 52.100791931152344, 53.85801696777344, 55.61524200439453, 57.37246322631836]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 12.0, 9.0, 17.0, 8.0, 20.0, 15.0, 20.0, 19.0, 18.0, 27.0, 38.0, 43.0, 33.0, 37.0, 54.0, 56.0, 48.0, 42.0, 54.0, 45.0, 50.0, 34.0, 28.0, 30.0, 40.0, 34.0, 20.0, 20.0, 24.0, 16.0, 24.0, 9.0, 18.0, 6.0, 7.0, 3.0, 6.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.63072204589844, -65.49087524414062, -63.35102844238281, -61.211181640625, -59.07133483886719, -56.931488037109375, -54.79164123535156, -52.65179443359375, -50.51194763183594, -48.372100830078125, -46.23225402832031, -44.0924072265625, -41.95256042480469, -39.812713623046875, -37.67286682128906, -35.53302001953125, -33.39317321777344, -31.253326416015625, -29.113479614257812, -26.9736328125, -24.833786010742188, -22.693939208984375, -20.554092407226562, -18.41424560546875, -16.274398803710938, -14.134552001953125, -11.994705200195312, -9.8548583984375, -7.7150115966796875, -5.575164794921875, -3.4353179931640625, -1.29547119140625, 0.8443679809570312, 2.9842147827148438, 5.124061584472656, 7.263908386230469, 9.403755187988281, 11.543601989746094, 13.683448791503906, 15.823295593261719, 17.96314239501953, 20.102989196777344, 22.242835998535156, 24.38268280029297, 26.52252960205078, 28.662376403808594, 30.802223205566406, 32.94207000732422, 35.08191680908203, 37.221763610839844, 39.361610412597656, 41.50145721435547, 43.64130401611328, 45.781150817871094, 47.920997619628906, 50.06084442138672, 52.20069122314453, 54.340538024902344, 56.480384826660156, 58.62023162841797, 60.76007843017578, 62.899925231933594, 65.0397720336914, 67.17961883544922, 69.31946563720703]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 8.0, 12.0, 25.0, 26.0, 62.0, 91.0, 138.0, 260.0, 396.0, 603.0, 914.0, 1605.0, 2527.0, 4223.0, 6642.0, 10523.0, 16486.0, 24841.0, 37094.0, 52564.0, 70562.0, 89126.0, 105253.0, 114155.0, 112891.0, 102152.0, 84774.0, 66581.0, 48129.0, 33654.0, 22522.0, 14510.0, 9563.0, 5936.0, 3661.0, 2251.0, 1482.0, 885.0, 568.0, 317.0, 194.0, 133.0, 80.0, 50.0, 38.0, 18.0, 9.0, 10.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-17.265625, -16.740478515625, -16.21533203125, -15.690185546875, -15.1650390625, -14.639892578125, -14.11474609375, -13.589599609375, -13.064453125, -12.539306640625, -12.01416015625, -11.489013671875, -10.9638671875, -10.438720703125, -9.91357421875, -9.388427734375, -8.86328125, -8.338134765625, -7.81298828125, -7.287841796875, -6.7626953125, -6.237548828125, -5.71240234375, -5.187255859375, -4.662109375, -4.136962890625, -3.61181640625, -3.086669921875, -2.5615234375, -2.036376953125, -1.51123046875, -0.986083984375, -0.4609375, 0.064208984375, 0.58935546875, 1.114501953125, 1.6396484375, 2.164794921875, 2.68994140625, 3.215087890625, 3.740234375, 4.265380859375, 4.79052734375, 5.315673828125, 5.8408203125, 6.365966796875, 6.89111328125, 7.416259765625, 7.94140625, 8.466552734375, 8.99169921875, 9.516845703125, 10.0419921875, 10.567138671875, 11.09228515625, 11.617431640625, 12.142578125, 12.667724609375, 13.19287109375, 13.718017578125, 14.2431640625, 14.768310546875, 15.29345703125, 15.818603515625, 16.34375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 3.0, 11.0, 12.0, 14.0, 10.0, 19.0, 16.0, 21.0, 17.0, 20.0, 27.0, 41.0, 39.0, 36.0, 37.0, 55.0, 50.0, 53.0, 40.0, 52.0, 53.0, 43.0, 35.0, 28.0, 28.0, 43.0, 31.0, 20.0, 21.0, 21.0, 17.0, 25.0, 10.0, 16.0, 8.0, 6.0, 1.0, 8.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.375, -65.232421875, -63.08984375, -60.947265625, -58.8046875, -56.662109375, -54.51953125, -52.376953125, -50.234375, -48.091796875, -45.94921875, -43.806640625, -41.6640625, -39.521484375, -37.37890625, -35.236328125, -33.09375, -30.951171875, -28.80859375, -26.666015625, -24.5234375, -22.380859375, -20.23828125, -18.095703125, -15.953125, -13.810546875, -11.66796875, -9.525390625, -7.3828125, -5.240234375, -3.09765625, -0.955078125, 1.1875, 3.330078125, 5.47265625, 7.615234375, 9.7578125, 11.900390625, 14.04296875, 16.185546875, 18.328125, 20.470703125, 22.61328125, 24.755859375, 26.8984375, 29.041015625, 31.18359375, 33.326171875, 35.46875, 37.611328125, 39.75390625, 41.896484375, 44.0390625, 46.181640625, 48.32421875, 50.466796875, 52.609375, 54.751953125, 56.89453125, 59.037109375, 61.1796875, 63.322265625, 65.46484375, 67.607421875, 69.75]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 8.0, 19.0, 28.0, 42.0, 59.0, 101.0, 124.0, 210.0, 380.0, 701.0, 1161.0, 1983.0, 3774.0, 6799.0, 12682.0, 24370.0, 64058.0, 846814.0, 41624.0, 19884.0, 10689.0, 5795.0, 3108.0, 1713.0, 987.0, 581.0, 323.0, 197.0, 124.0, 83.0, 51.0, 20.0, 14.0, 13.0, 3.0, 10.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-68.375, -66.26171875, -64.1484375, -62.03515625, -59.921875, -57.80859375, -55.6953125, -53.58203125, -51.46875, -49.35546875, -47.2421875, -45.12890625, -43.015625, -40.90234375, -38.7890625, -36.67578125, -34.5625, -32.44921875, -30.3359375, -28.22265625, -26.109375, -23.99609375, -21.8828125, -19.76953125, -17.65625, -15.54296875, -13.4296875, -11.31640625, -9.203125, -7.08984375, -4.9765625, -2.86328125, -0.75, 1.36328125, 3.4765625, 5.58984375, 7.703125, 9.81640625, 11.9296875, 14.04296875, 16.15625, 18.26953125, 20.3828125, 22.49609375, 24.609375, 26.72265625, 28.8359375, 30.94921875, 33.0625, 35.17578125, 37.2890625, 39.40234375, 41.515625, 43.62890625, 45.7421875, 47.85546875, 49.96875, 52.08203125, 54.1953125, 56.30859375, 58.421875, 60.53515625, 62.6484375, 64.76171875, 66.875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 7.0, 12.0, 12.0, 15.0, 9.0, 14.0, 5.0, 19.0, 21.0, 22.0, 26.0, 42.0, 27.0, 27.0, 37.0, 34.0, 41.0, 35.0, 43.0, 42.0, 48.0, 37.0, 42.0, 31.0, 38.0, 22.0, 22.0, 29.0, 34.0, 32.0, 29.0, 21.0, 20.0, 10.0, 11.0, 14.0, 22.0, 6.0, 12.0, 8.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.90625, -39.634765625, -38.36328125, -37.091796875, -35.8203125, -34.548828125, -33.27734375, -32.005859375, -30.734375, -29.462890625, -28.19140625, -26.919921875, -25.6484375, -24.376953125, -23.10546875, -21.833984375, -20.5625, -19.291015625, -18.01953125, -16.748046875, -15.4765625, -14.205078125, -12.93359375, -11.662109375, -10.390625, -9.119140625, -7.84765625, -6.576171875, -5.3046875, -4.033203125, -2.76171875, -1.490234375, -0.21875, 1.052734375, 2.32421875, 3.595703125, 4.8671875, 6.138671875, 7.41015625, 8.681640625, 9.953125, 11.224609375, 12.49609375, 13.767578125, 15.0390625, 16.310546875, 17.58203125, 18.853515625, 20.125, 21.396484375, 22.66796875, 23.939453125, 25.2109375, 26.482421875, 27.75390625, 29.025390625, 30.296875, 31.568359375, 32.83984375, 34.111328125, 35.3828125, 36.654296875, 37.92578125, 39.197265625, 40.46875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 2.0, 13.0, 4.0, 8.0, 12.0, 25.0, 21.0, 44.0, 62.0, 109.0, 173.0, 270.0, 430.0, 665.0, 1062.0, 1890.0, 3042.0, 5166.0, 9334.0, 17119.0, 35667.0, 691283.0, 219865.0, 28840.0, 14297.0, 7822.0, 4469.0, 2664.0, 1589.0, 966.0, 588.0, 362.0, 223.0, 151.0, 115.0, 71.0, 46.0, 28.0, 21.0, 9.0, 6.0, 11.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.046875, -3.923736572265625, -3.80059814453125, -3.677459716796875, -3.5543212890625, -3.431182861328125, -3.30804443359375, -3.184906005859375, -3.061767578125, -2.938629150390625, -2.81549072265625, -2.692352294921875, -2.5692138671875, -2.446075439453125, -2.32293701171875, -2.199798583984375, -2.07666015625, -1.953521728515625, -1.83038330078125, -1.707244873046875, -1.5841064453125, -1.460968017578125, -1.33782958984375, -1.214691162109375, -1.091552734375, -0.968414306640625, -0.84527587890625, -0.722137451171875, -0.5989990234375, -0.475860595703125, -0.35272216796875, -0.229583740234375, -0.1064453125, 0.016693115234375, 0.13983154296875, 0.262969970703125, 0.3861083984375, 0.509246826171875, 0.63238525390625, 0.755523681640625, 0.878662109375, 1.001800537109375, 1.12493896484375, 1.248077392578125, 1.3712158203125, 1.494354248046875, 1.61749267578125, 1.740631103515625, 1.86376953125, 1.986907958984375, 2.11004638671875, 2.233184814453125, 2.3563232421875, 2.479461669921875, 2.60260009765625, 2.725738525390625, 2.848876953125, 2.972015380859375, 3.09515380859375, 3.218292236328125, 3.3414306640625, 3.464569091796875, 3.58770751953125, 3.710845947265625, 3.833984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 6.0, 15.0, 24.0, 19.0, 22.0, 20.0, 31.0, 41.0, 53.0, 45.0, 64.0, 62.0, 55.0, 69.0, 69.0, 62.0, 52.0, 51.0, 46.0, 38.0, 34.0, 22.0, 13.0, 11.0, 11.0, 15.0, 6.0, 3.0, 3.0, 2.0, 8.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032973289489746094, -0.0003195516765117645, -0.0003093704581260681, -0.0002991892397403717, -0.0002890080213546753, -0.0002788268029689789, -0.00026864558458328247, -0.00025846436619758606, -0.00024828314781188965, -0.00023810192942619324, -0.00022792071104049683, -0.00021773949265480042, -0.000207558274269104, -0.0001973770558834076, -0.00018719583749771118, -0.00017701461911201477, -0.00016683340072631836, -0.00015665218234062195, -0.00014647096395492554, -0.00013628974556922913, -0.00012610852718353271, -0.0001159273087978363, -0.00010574609041213989, -9.556487202644348e-05, -8.538365364074707e-05, -7.520243525505066e-05, -6.502121686935425e-05, -5.483999848365784e-05, -4.4658780097961426e-05, -3.4477561712265015e-05, -2.4296343326568604e-05, -1.4115124940872192e-05, -3.933906555175781e-06, 6.24731183052063e-06, 1.642853021621704e-05, 2.6609748601913452e-05, 3.679096698760986e-05, 4.6972185373306274e-05, 5.7153403759002686e-05, 6.73346221446991e-05, 7.751584053039551e-05, 8.769705891609192e-05, 9.787827730178833e-05, 0.00010805949568748474, 0.00011824071407318115, 0.00012842193245887756, 0.00013860315084457397, 0.00014878436923027039, 0.0001589655876159668, 0.0001691468060016632, 0.00017932802438735962, 0.00018950924277305603, 0.00019969046115875244, 0.00020987167954444885, 0.00022005289793014526, 0.00023023411631584167, 0.00024041533470153809, 0.0002505965530872345, 0.0002607777714729309, 0.0002709589898586273, 0.00028114020824432373, 0.00029132142663002014, 0.00030150264501571655, 0.00031168386340141296, 0.0003218650817871094]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 15.0, 20.0, 22.0, 48.0, 83.0, 96.0, 142.0, 225.0, 328.0, 539.0, 804.0, 1305.0, 1914.0, 2805.0, 4298.0, 6560.0, 9772.0, 14553.0, 21426.0, 30320.0, 42355.0, 56279.0, 72241.0, 87534.0, 99925.0, 104887.0, 102726.0, 92544.0, 77478.0, 61433.0, 46939.0, 34226.0, 24359.0, 16709.0, 11382.0, 7474.0, 5017.0, 3372.0, 2109.0, 1528.0, 947.0, 672.0, 386.0, 258.0, 174.0, 112.0, 86.0, 37.0, 37.0, 14.0, 14.0, 12.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.19140625, -2.122222900390625, -2.05303955078125, -1.983856201171875, -1.9146728515625, -1.845489501953125, -1.77630615234375, -1.707122802734375, -1.637939453125, -1.568756103515625, -1.49957275390625, -1.430389404296875, -1.3612060546875, -1.292022705078125, -1.22283935546875, -1.153656005859375, -1.08447265625, -1.015289306640625, -0.94610595703125, -0.876922607421875, -0.8077392578125, -0.738555908203125, -0.66937255859375, -0.600189208984375, -0.531005859375, -0.461822509765625, -0.39263916015625, -0.323455810546875, -0.2542724609375, -0.185089111328125, -0.11590576171875, -0.046722412109375, 0.0224609375, 0.091644287109375, 0.16082763671875, 0.230010986328125, 0.2991943359375, 0.368377685546875, 0.43756103515625, 0.506744384765625, 0.575927734375, 0.645111083984375, 0.71429443359375, 0.783477783203125, 0.8526611328125, 0.921844482421875, 0.99102783203125, 1.060211181640625, 1.12939453125, 1.198577880859375, 1.26776123046875, 1.336944580078125, 1.4061279296875, 1.475311279296875, 1.54449462890625, 1.613677978515625, 1.682861328125, 1.752044677734375, 1.82122802734375, 1.890411376953125, 1.9595947265625, 2.028778076171875, 2.09796142578125, 2.167144775390625, 2.236328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 4.0, 13.0, 17.0, 19.0, 13.0, 22.0, 20.0, 17.0, 30.0, 29.0, 26.0, 40.0, 32.0, 39.0, 28.0, 31.0, 30.0, 40.0, 35.0, 43.0, 31.0, 38.0, 34.0, 40.0, 27.0, 28.0, 32.0, 28.0, 24.0, 34.0, 33.0, 23.0, 20.0, 18.0, 18.0, 7.0, 9.0, 8.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0146484375, -0.9815673828125, -0.948486328125, -0.9154052734375, -0.88232421875, -0.8492431640625, -0.816162109375, -0.7830810546875, -0.75, -0.7169189453125, -0.683837890625, -0.6507568359375, -0.61767578125, -0.5845947265625, -0.551513671875, -0.5184326171875, -0.4853515625, -0.4522705078125, -0.419189453125, -0.3861083984375, -0.35302734375, -0.3199462890625, -0.286865234375, -0.2537841796875, -0.220703125, -0.1876220703125, -0.154541015625, -0.1214599609375, -0.08837890625, -0.0552978515625, -0.022216796875, 0.0108642578125, 0.0439453125, 0.0770263671875, 0.110107421875, 0.1431884765625, 0.17626953125, 0.2093505859375, 0.242431640625, 0.2755126953125, 0.30859375, 0.3416748046875, 0.374755859375, 0.4078369140625, 0.44091796875, 0.4739990234375, 0.507080078125, 0.5401611328125, 0.5732421875, 0.6063232421875, 0.639404296875, 0.6724853515625, 0.70556640625, 0.7386474609375, 0.771728515625, 0.8048095703125, 0.837890625, 0.8709716796875, 0.904052734375, 0.9371337890625, 0.97021484375, 1.0032958984375, 1.036376953125, 1.0694580078125, 1.1025390625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 3.0, 12.0, 10.0, 4.0, 19.0, 14.0, 19.0, 26.0, 18.0, 22.0, 22.0, 31.0, 33.0, 40.0, 27.0, 58.0, 29.0, 48.0, 49.0, 39.0, 30.0, 42.0, 43.0, 41.0, 36.0, 37.0, 37.0, 33.0, 18.0, 21.0, 21.0, 15.0, 24.0, 13.0, 15.0, 13.0, 6.0, 6.0, 4.0, 9.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-55.38033676147461, -53.55709457397461, -51.73385238647461, -49.91061019897461, -48.08736801147461, -46.26412582397461, -44.440887451171875, -42.617645263671875, -40.794403076171875, -38.971160888671875, -37.147918701171875, -35.324676513671875, -33.501434326171875, -31.678192138671875, -29.854951858520508, -28.031709671020508, -26.208465576171875, -24.385223388671875, -22.561981201171875, -20.738739013671875, -18.915496826171875, -17.092254638671875, -15.269014358520508, -13.445772171020508, -11.622529983520508, -9.799287796020508, -7.976046085357666, -6.152804374694824, -4.329562187194824, -2.506319999694824, -0.6830787658691406, 1.1401634216308594, 2.9634056091308594, 4.786647796630859, 6.609889507293701, 8.433131217956543, 10.256373405456543, 12.079615592956543, 13.902856826782227, 15.726099014282227, 17.549341201782227, 19.372583389282227, 21.195825576782227, 23.019065856933594, 24.842308044433594, 26.665550231933594, 28.488792419433594, 30.312034606933594, 32.135276794433594, 33.958518981933594, 35.781761169433594, 37.605003356933594, 39.428245544433594, 41.251487731933594, 43.074729919433594, 44.897972106933594, 46.721214294433594, 48.544456481933594, 50.367698669433594, 52.190940856933594, 54.014183044433594, 55.837425231933594, 57.660667419433594, 59.483909606933594, 61.30714797973633]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 7.0, 10.0, 9.0, 12.0, 14.0, 18.0, 15.0, 22.0, 21.0, 19.0, 26.0, 34.0, 48.0, 34.0, 50.0, 49.0, 50.0, 53.0, 45.0, 57.0, 53.0, 32.0, 40.0, 24.0, 36.0, 36.0, 33.0, 13.0, 21.0, 27.0, 21.0, 18.0, 12.0, 14.0, 5.0, 4.0, 5.0, 5.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.64140319824219, -66.4472427368164, -64.25308227539062, -62.058921813964844, -59.86476135253906, -57.67060089111328, -55.4764404296875, -53.28227996826172, -51.08811950683594, -48.893959045410156, -46.699798583984375, -44.505638122558594, -42.31147766113281, -40.11731719970703, -37.92315673828125, -35.72899627685547, -33.53483581542969, -31.340675354003906, -29.146514892578125, -26.952354431152344, -24.758193969726562, -22.56403350830078, -20.369873046875, -18.17571258544922, -15.981552124023438, -13.787391662597656, -11.593231201171875, -9.399070739746094, -7.2049102783203125, -5.010749816894531, -2.81658935546875, -0.6224288940429688, 1.5717391967773438, 3.765899658203125, 5.960060119628906, 8.154220581054688, 10.348381042480469, 12.54254150390625, 14.736701965332031, 16.930862426757812, 19.125022888183594, 21.319183349609375, 23.513343811035156, 25.707504272460938, 27.90166473388672, 30.0958251953125, 32.28998565673828, 34.48414611816406, 36.678306579589844, 38.872467041015625, 41.066627502441406, 43.26078796386719, 45.45494842529297, 47.64910888671875, 49.84326934814453, 52.03742980957031, 54.231590270996094, 56.425750732421875, 58.619911193847656, 60.81407165527344, 63.00823211669922, 65.202392578125, 67.39655303955078, 69.59071350097656, 71.78487396240234]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 8.0, 13.0, 24.0, 25.0, 29.0, 46.0, 90.0, 129.0, 212.0, 346.0, 580.0, 894.0, 1339.0, 2063.0, 3184.0, 4697.0, 7297.0, 10661.0, 15494.0, 21968.0, 30123.0, 40381.0, 51593.0, 63610.0, 75477.0, 84733.0, 90799.0, 91530.0, 88087.0, 79538.0, 68016.0, 56747.0, 44721.0, 34137.0, 24851.0, 17738.0, 12511.0, 8646.0, 5731.0, 3692.0, 2449.0, 1595.0, 1008.0, 651.0, 409.0, 247.0, 160.0, 125.0, 63.0, 37.0, 18.0, 11.0, 9.0, 7.0, 4.0, 3.0, 3.0, 2.0], "bins": [-42.40625, -41.12890625, -39.8515625, -38.57421875, -37.296875, -36.01953125, -34.7421875, -33.46484375, -32.1875, -30.91015625, -29.6328125, -28.35546875, -27.078125, -25.80078125, -24.5234375, -23.24609375, -21.96875, -20.69140625, -19.4140625, -18.13671875, -16.859375, -15.58203125, -14.3046875, -13.02734375, -11.75, -10.47265625, -9.1953125, -7.91796875, -6.640625, -5.36328125, -4.0859375, -2.80859375, -1.53125, -0.25390625, 1.0234375, 2.30078125, 3.578125, 4.85546875, 6.1328125, 7.41015625, 8.6875, 9.96484375, 11.2421875, 12.51953125, 13.796875, 15.07421875, 16.3515625, 17.62890625, 18.90625, 20.18359375, 21.4609375, 22.73828125, 24.015625, 25.29296875, 26.5703125, 27.84765625, 29.125, 30.40234375, 31.6796875, 32.95703125, 34.234375, 35.51171875, 36.7890625, 38.06640625, 39.34375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 14.0, 9.0, 12.0, 11.0, 21.0, 8.0, 23.0, 23.0, 20.0, 23.0, 34.0, 44.0, 41.0, 44.0, 52.0, 48.0, 54.0, 48.0, 54.0, 47.0, 40.0, 38.0, 26.0, 37.0, 37.0, 31.0, 15.0, 23.0, 24.0, 20.0, 21.0, 10.0, 14.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.4375, -64.322265625, -62.20703125, -60.091796875, -57.9765625, -55.861328125, -53.74609375, -51.630859375, -49.515625, -47.400390625, -45.28515625, -43.169921875, -41.0546875, -38.939453125, -36.82421875, -34.708984375, -32.59375, -30.478515625, -28.36328125, -26.248046875, -24.1328125, -22.017578125, -19.90234375, -17.787109375, -15.671875, -13.556640625, -11.44140625, -9.326171875, -7.2109375, -5.095703125, -2.98046875, -0.865234375, 1.25, 3.365234375, 5.48046875, 7.595703125, 9.7109375, 11.826171875, 13.94140625, 16.056640625, 18.171875, 20.287109375, 22.40234375, 24.517578125, 26.6328125, 28.748046875, 30.86328125, 32.978515625, 35.09375, 37.208984375, 39.32421875, 41.439453125, 43.5546875, 45.669921875, 47.78515625, 49.900390625, 52.015625, 54.130859375, 56.24609375, 58.361328125, 60.4765625, 62.591796875, 64.70703125, 66.822265625, 68.9375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 17.0, 21.0, 29.0, 53.0, 77.0, 118.0, 225.0, 288.0, 487.0, 761.0, 1279.0, 1951.0, 3001.0, 4818.0, 7415.0, 11288.0, 16811.0, 24220.0, 34115.0, 46992.0, 61471.0, 76301.0, 88742.0, 98193.0, 100575.0, 97178.0, 87484.0, 74515.0, 59920.0, 46068.0, 33728.0, 23543.0, 16018.0, 10990.0, 7156.0, 4562.0, 3006.0, 1872.0, 1176.0, 814.0, 470.0, 318.0, 178.0, 99.0, 78.0, 49.0, 34.0, 22.0, 9.0, 9.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-43.53125, -42.1474609375, -40.763671875, -39.3798828125, -37.99609375, -36.6123046875, -35.228515625, -33.8447265625, -32.4609375, -31.0771484375, -29.693359375, -28.3095703125, -26.92578125, -25.5419921875, -24.158203125, -22.7744140625, -21.390625, -20.0068359375, -18.623046875, -17.2392578125, -15.85546875, -14.4716796875, -13.087890625, -11.7041015625, -10.3203125, -8.9365234375, -7.552734375, -6.1689453125, -4.78515625, -3.4013671875, -2.017578125, -0.6337890625, 0.75, 2.1337890625, 3.517578125, 4.9013671875, 6.28515625, 7.6689453125, 9.052734375, 10.4365234375, 11.8203125, 13.2041015625, 14.587890625, 15.9716796875, 17.35546875, 18.7392578125, 20.123046875, 21.5068359375, 22.890625, 24.2744140625, 25.658203125, 27.0419921875, 28.42578125, 29.8095703125, 31.193359375, 32.5771484375, 33.9609375, 35.3447265625, 36.728515625, 38.1123046875, 39.49609375, 40.8798828125, 42.263671875, 43.6474609375, 45.03125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 6.0, 5.0, 6.0, 12.0, 19.0, 14.0, 23.0, 25.0, 38.0, 35.0, 36.0, 49.0, 45.0, 55.0, 59.0, 54.0, 54.0, 52.0, 45.0, 49.0, 44.0, 34.0, 40.0, 45.0, 39.0, 22.0, 18.0, 14.0, 16.0, 9.0, 11.0, 5.0, 4.0, 2.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.71875, -50.111328125, -48.50390625, -46.896484375, -45.2890625, -43.681640625, -42.07421875, -40.466796875, -38.859375, -37.251953125, -35.64453125, -34.037109375, -32.4296875, -30.822265625, -29.21484375, -27.607421875, -26.0, -24.392578125, -22.78515625, -21.177734375, -19.5703125, -17.962890625, -16.35546875, -14.748046875, -13.140625, -11.533203125, -9.92578125, -8.318359375, -6.7109375, -5.103515625, -3.49609375, -1.888671875, -0.28125, 1.326171875, 2.93359375, 4.541015625, 6.1484375, 7.755859375, 9.36328125, 10.970703125, 12.578125, 14.185546875, 15.79296875, 17.400390625, 19.0078125, 20.615234375, 22.22265625, 23.830078125, 25.4375, 27.044921875, 28.65234375, 30.259765625, 31.8671875, 33.474609375, 35.08203125, 36.689453125, 38.296875, 39.904296875, 41.51171875, 43.119140625, 44.7265625, 46.333984375, 47.94140625, 49.548828125, 51.15625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 8.0, 14.0, 22.0, 38.0, 58.0, 85.0, 132.0, 235.0, 315.0, 513.0, 913.0, 1517.0, 2534.0, 4281.0, 6962.0, 11518.0, 18253.0, 28655.0, 43167.0, 62105.0, 83495.0, 103356.0, 118686.0, 122406.0, 113826.0, 96462.0, 74870.0, 53835.0, 36811.0, 24170.0, 15287.0, 9507.0, 5800.0, 3416.0, 2143.0, 1209.0, 730.0, 462.0, 278.0, 179.0, 109.0, 67.0, 41.0, 28.0, 21.0, 13.0, 9.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.15869140625, -18.5048828125, -17.85107421875, -17.197265625, -16.54345703125, -15.8896484375, -15.23583984375, -14.58203125, -13.92822265625, -13.2744140625, -12.62060546875, -11.966796875, -11.31298828125, -10.6591796875, -10.00537109375, -9.3515625, -8.69775390625, -8.0439453125, -7.39013671875, -6.736328125, -6.08251953125, -5.4287109375, -4.77490234375, -4.12109375, -3.46728515625, -2.8134765625, -2.15966796875, -1.505859375, -0.85205078125, -0.1982421875, 0.45556640625, 1.109375, 1.76318359375, 2.4169921875, 3.07080078125, 3.724609375, 4.37841796875, 5.0322265625, 5.68603515625, 6.33984375, 6.99365234375, 7.6474609375, 8.30126953125, 8.955078125, 9.60888671875, 10.2626953125, 10.91650390625, 11.5703125, 12.22412109375, 12.8779296875, 13.53173828125, 14.185546875, 14.83935546875, 15.4931640625, 16.14697265625, 16.80078125, 17.45458984375, 18.1083984375, 18.76220703125, 19.416015625, 20.06982421875, 20.7236328125, 21.37744140625, 22.03125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 10.0, 5.0, 15.0, 14.0, 11.0, 18.0, 24.0, 28.0, 26.0, 32.0, 33.0, 38.0, 45.0, 46.0, 48.0, 53.0, 48.0, 47.0, 47.0, 39.0, 43.0, 50.0, 37.0, 36.0, 20.0, 31.0, 23.0, 22.0, 20.0, 9.0, 11.0, 10.0, 8.0, 5.0, 6.0, 8.0, 6.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.002513885498046875, -0.002439558506011963, -0.0023652315139770508, -0.0022909045219421387, -0.0022165775299072266, -0.0021422505378723145, -0.0020679235458374023, -0.0019935965538024902, -0.0019192695617675781, -0.001844942569732666, -0.001770615577697754, -0.0016962885856628418, -0.0016219615936279297, -0.0015476346015930176, -0.0014733076095581055, -0.0013989806175231934, -0.0013246536254882812, -0.0012503266334533691, -0.001175999641418457, -0.001101672649383545, -0.0010273456573486328, -0.0009530186653137207, -0.0008786916732788086, -0.0008043646812438965, -0.0007300376892089844, -0.0006557106971740723, -0.0005813837051391602, -0.000507056713104248, -0.00043272972106933594, -0.00035840272903442383, -0.0002840757369995117, -0.0002097487449645996, -0.0001354217529296875, -6.109476089477539e-05, 1.3232231140136719e-05, 8.755922317504883e-05, 0.00016188621520996094, 0.00023621320724487305, 0.00031054019927978516, 0.00038486719131469727, 0.0004591941833496094, 0.0005335211753845215, 0.0006078481674194336, 0.0006821751594543457, 0.0007565021514892578, 0.0008308291435241699, 0.000905156135559082, 0.0009794831275939941, 0.0010538101196289062, 0.0011281371116638184, 0.0012024641036987305, 0.0012767910957336426, 0.0013511180877685547, 0.0014254450798034668, 0.001499772071838379, 0.001574099063873291, 0.0016484260559082031, 0.0017227530479431152, 0.0017970800399780273, 0.0018714070320129395, 0.0019457340240478516, 0.0020200610160827637, 0.0020943880081176758, 0.002168715000152588, 0.0022430419921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 10.0, 12.0, 30.0, 42.0, 66.0, 78.0, 140.0, 184.0, 326.0, 497.0, 731.0, 1142.0, 1761.0, 2695.0, 4207.0, 6469.0, 9805.0, 14688.0, 21966.0, 32010.0, 44478.0, 60519.0, 77594.0, 93598.0, 104777.0, 108160.0, 103839.0, 91634.0, 74998.0, 58021.0, 42679.0, 30336.0, 20854.0, 14099.0, 8991.0, 5948.0, 3856.0, 2576.0, 1673.0, 1083.0, 725.0, 426.0, 284.0, 183.0, 115.0, 88.0, 61.0, 28.0, 24.0, 11.0, 15.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-19.265625, -18.652587890625, -18.03955078125, -17.426513671875, -16.8134765625, -16.200439453125, -15.58740234375, -14.974365234375, -14.361328125, -13.748291015625, -13.13525390625, -12.522216796875, -11.9091796875, -11.296142578125, -10.68310546875, -10.070068359375, -9.45703125, -8.843994140625, -8.23095703125, -7.617919921875, -7.0048828125, -6.391845703125, -5.77880859375, -5.165771484375, -4.552734375, -3.939697265625, -3.32666015625, -2.713623046875, -2.1005859375, -1.487548828125, -0.87451171875, -0.261474609375, 0.3515625, 0.964599609375, 1.57763671875, 2.190673828125, 2.8037109375, 3.416748046875, 4.02978515625, 4.642822265625, 5.255859375, 5.868896484375, 6.48193359375, 7.094970703125, 7.7080078125, 8.321044921875, 8.93408203125, 9.547119140625, 10.16015625, 10.773193359375, 11.38623046875, 11.999267578125, 12.6123046875, 13.225341796875, 13.83837890625, 14.451416015625, 15.064453125, 15.677490234375, 16.29052734375, 16.903564453125, 17.5166015625, 18.129638671875, 18.74267578125, 19.355712890625, 19.96875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 2.0, 14.0, 12.0, 4.0, 17.0, 28.0, 26.0, 20.0, 24.0, 37.0, 47.0, 45.0, 42.0, 53.0, 50.0, 54.0, 48.0, 43.0, 54.0, 45.0, 38.0, 41.0, 42.0, 29.0, 27.0, 25.0, 24.0, 19.0, 21.0, 11.0, 9.0, 12.0, 5.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-10.4375, -10.1297607421875, -9.822021484375, -9.5142822265625, -9.20654296875, -8.8988037109375, -8.591064453125, -8.2833251953125, -7.9755859375, -7.6678466796875, -7.360107421875, -7.0523681640625, -6.74462890625, -6.4368896484375, -6.129150390625, -5.8214111328125, -5.513671875, -5.2059326171875, -4.898193359375, -4.5904541015625, -4.28271484375, -3.9749755859375, -3.667236328125, -3.3594970703125, -3.0517578125, -2.7440185546875, -2.436279296875, -2.1285400390625, -1.82080078125, -1.5130615234375, -1.205322265625, -0.8975830078125, -0.58984375, -0.2821044921875, 0.025634765625, 0.3333740234375, 0.64111328125, 0.9488525390625, 1.256591796875, 1.5643310546875, 1.8720703125, 2.1798095703125, 2.487548828125, 2.7952880859375, 3.10302734375, 3.4107666015625, 3.718505859375, 4.0262451171875, 4.333984375, 4.6417236328125, 4.949462890625, 5.2572021484375, 5.56494140625, 5.8726806640625, 6.180419921875, 6.4881591796875, 6.7958984375, 7.1036376953125, 7.411376953125, 7.7191162109375, 8.02685546875, 8.3345947265625, 8.642333984375, 8.9500732421875, 9.2578125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 7.0, 5.0, 5.0, 6.0, 6.0, 7.0, 11.0, 13.0, 18.0, 10.0, 22.0, 17.0, 22.0, 24.0, 24.0, 26.0, 24.0, 32.0, 29.0, 33.0, 30.0, 34.0, 45.0, 39.0, 37.0, 33.0, 41.0, 29.0, 41.0, 35.0, 30.0, 32.0, 28.0, 22.0, 19.0, 14.0, 25.0, 15.0, 18.0, 13.0, 16.0, 11.0, 20.0, 8.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.57626724243164, -46.00093078613281, -44.425594329833984, -42.850257873535156, -41.274925231933594, -39.699588775634766, -38.12425231933594, -36.54891586303711, -34.97357940673828, -33.39824295043945, -31.822908401489258, -30.24757194519043, -28.6722354888916, -27.096900939941406, -25.521564483642578, -23.94622802734375, -22.370893478393555, -20.795557022094727, -19.22022247314453, -17.644886016845703, -16.069549560546875, -14.494214057922363, -12.918878555297852, -11.343542098999023, -9.768206596374512, -8.19287109375, -6.617534637451172, -5.04219913482666, -3.4668631553649902, -1.8915271759033203, -0.3161916732788086, 1.2591447830200195, 2.8344802856445312, 4.409816265106201, 5.985152244567871, 7.560487747192383, 9.135824203491211, 10.711159706115723, 12.286495208740234, 13.861831665039062, 15.437167167663574, 17.012502670288086, 18.587839126586914, 20.16317367553711, 21.738510131835938, 23.313846588134766, 24.889183044433594, 26.464519500732422, 28.039854049682617, 29.615190505981445, 31.19052505493164, 32.76586151123047, 34.3411979675293, 35.916534423828125, 37.49186706542969, 39.06720733642578, 40.642539978027344, 42.21787643432617, 43.793212890625, 45.36854553222656, 46.94388198852539, 48.51921844482422, 50.09455490112305, 51.669891357421875, 53.2452278137207]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 4.0, 10.0, 14.0, 10.0, 18.0, 14.0, 16.0, 34.0, 18.0, 31.0, 32.0, 37.0, 30.0, 41.0, 38.0, 44.0, 37.0, 34.0, 56.0, 47.0, 50.0, 33.0, 41.0, 41.0, 37.0, 37.0, 24.0, 25.0, 20.0, 18.0, 15.0, 16.0, 9.0, 11.0, 8.0, 9.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.180599212646484, -61.082515716552734, -58.984432220458984, -56.8863525390625, -54.78826904296875, -52.690185546875, -50.59210205078125, -48.4940185546875, -46.39593505859375, -44.2978515625, -42.19976806640625, -40.1016845703125, -38.003604888916016, -35.905521392822266, -33.807437896728516, -31.709354400634766, -29.61127471923828, -27.51319122314453, -25.415109634399414, -23.317026138305664, -21.218944549560547, -19.120861053466797, -17.022777557373047, -14.924695014953613, -12.82661247253418, -10.728529930114746, -8.630447387695312, -6.5323638916015625, -4.434281349182129, -2.3361988067626953, -0.2381153106689453, 1.8599672317504883, 3.9580459594726562, 6.05612850189209, 8.154211044311523, 10.252294540405273, 12.350377082824707, 14.44845962524414, 16.54654312133789, 18.64462661743164, 20.742708206176758, 22.840791702270508, 24.938873291015625, 27.036956787109375, 29.135040283203125, 31.233121871948242, 33.331207275390625, 35.42928695678711, 37.52737045288086, 39.62545394897461, 41.72353744506836, 43.821617126464844, 45.919700622558594, 48.017784118652344, 50.115867614746094, 52.213951110839844, 54.312034606933594, 56.410118103027344, 58.508201599121094, 60.606285095214844, 62.70436477661133, 64.80244445800781, 66.90052795410156, 68.99861145019531, 71.09669494628906]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 13.0, 21.0, 38.0, 60.0, 101.0, 162.0, 283.0, 471.0, 759.0, 1238.0, 2002.0, 3271.0, 5274.0, 8580.0, 13781.0, 21449.0, 33350.0, 50604.0, 75652.0, 111510.0, 158367.0, 216735.0, 281654.0, 346194.0, 398288.0, 424198.0, 419881.0, 385390.0, 328748.0, 263344.0, 199960.0, 144467.0, 101911.0, 68613.0, 45374.0, 30139.0, 19355.0, 12284.0, 7931.0, 4881.0, 3061.0, 1855.0, 1169.0, 733.0, 429.0, 265.0, 168.0, 96.0, 67.0, 42.0, 28.0, 12.0, 11.0, 8.0, 5.0, 3.0, 0.0, 3.0], "bins": [-43.1875, -41.83251953125, -40.4775390625, -39.12255859375, -37.767578125, -36.41259765625, -35.0576171875, -33.70263671875, -32.34765625, -30.99267578125, -29.6376953125, -28.28271484375, -26.927734375, -25.57275390625, -24.2177734375, -22.86279296875, -21.5078125, -20.15283203125, -18.7978515625, -17.44287109375, -16.087890625, -14.73291015625, -13.3779296875, -12.02294921875, -10.66796875, -9.31298828125, -7.9580078125, -6.60302734375, -5.248046875, -3.89306640625, -2.5380859375, -1.18310546875, 0.171875, 1.52685546875, 2.8818359375, 4.23681640625, 5.591796875, 6.94677734375, 8.3017578125, 9.65673828125, 11.01171875, 12.36669921875, 13.7216796875, 15.07666015625, 16.431640625, 17.78662109375, 19.1416015625, 20.49658203125, 21.8515625, 23.20654296875, 24.5615234375, 25.91650390625, 27.271484375, 28.62646484375, 29.9814453125, 31.33642578125, 32.69140625, 34.04638671875, 35.4013671875, 36.75634765625, 38.111328125, 39.46630859375, 40.8212890625, 42.17626953125, 43.53125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 11.0, 6.0, 6.0, 11.0, 13.0, 11.0, 18.0, 13.0, 22.0, 30.0, 25.0, 35.0, 29.0, 30.0, 31.0, 47.0, 38.0, 38.0, 31.0, 45.0, 52.0, 45.0, 48.0, 40.0, 43.0, 33.0, 37.0, 33.0, 27.0, 21.0, 18.0, 19.0, 19.0, 13.0, 11.0, 6.0, 9.0, 8.0, 5.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-56.0, -54.1796875, -52.359375, -50.5390625, -48.71875, -46.8984375, -45.078125, -43.2578125, -41.4375, -39.6171875, -37.796875, -35.9765625, -34.15625, -32.3359375, -30.515625, -28.6953125, -26.875, -25.0546875, -23.234375, -21.4140625, -19.59375, -17.7734375, -15.953125, -14.1328125, -12.3125, -10.4921875, -8.671875, -6.8515625, -5.03125, -3.2109375, -1.390625, 0.4296875, 2.25, 4.0703125, 5.890625, 7.7109375, 9.53125, 11.3515625, 13.171875, 14.9921875, 16.8125, 18.6328125, 20.453125, 22.2734375, 24.09375, 25.9140625, 27.734375, 29.5546875, 31.375, 33.1953125, 35.015625, 36.8359375, 38.65625, 40.4765625, 42.296875, 44.1171875, 45.9375, 47.7578125, 49.578125, 51.3984375, 53.21875, 55.0390625, 56.859375, 58.6796875, 60.5]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 12.0, 27.0, 33.0, 53.0, 102.0, 169.0, 323.0, 490.0, 890.0, 1513.0, 2478.0, 4184.0, 6783.0, 11356.0, 18283.0, 28719.0, 44732.0, 66945.0, 97496.0, 139459.0, 190665.0, 248387.0, 307323.0, 359410.0, 395469.0, 406839.0, 390484.0, 354055.0, 297747.0, 238975.0, 181915.0, 132655.0, 92836.0, 62686.0, 41319.0, 26673.0, 16537.0, 10394.0, 6355.0, 3792.0, 2358.0, 1380.0, 840.0, 486.0, 270.0, 167.0, 79.0, 71.0, 32.0, 18.0, 10.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.9375, -42.4931640625, -41.048828125, -39.6044921875, -38.16015625, -36.7158203125, -35.271484375, -33.8271484375, -32.3828125, -30.9384765625, -29.494140625, -28.0498046875, -26.60546875, -25.1611328125, -23.716796875, -22.2724609375, -20.828125, -19.3837890625, -17.939453125, -16.4951171875, -15.05078125, -13.6064453125, -12.162109375, -10.7177734375, -9.2734375, -7.8291015625, -6.384765625, -4.9404296875, -3.49609375, -2.0517578125, -0.607421875, 0.8369140625, 2.28125, 3.7255859375, 5.169921875, 6.6142578125, 8.05859375, 9.5029296875, 10.947265625, 12.3916015625, 13.8359375, 15.2802734375, 16.724609375, 18.1689453125, 19.61328125, 21.0576171875, 22.501953125, 23.9462890625, 25.390625, 26.8349609375, 28.279296875, 29.7236328125, 31.16796875, 32.6123046875, 34.056640625, 35.5009765625, 36.9453125, 38.3896484375, 39.833984375, 41.2783203125, 42.72265625, 44.1669921875, 45.611328125, 47.0556640625, 48.5]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 2.0, 6.0, 14.0, 20.0, 18.0, 35.0, 29.0, 54.0, 55.0, 95.0, 90.0, 120.0, 142.0, 150.0, 163.0, 201.0, 207.0, 246.0, 215.0, 253.0, 220.0, 253.0, 204.0, 203.0, 176.0, 169.0, 151.0, 109.0, 111.0, 89.0, 66.0, 58.0, 38.0, 36.0, 22.0, 11.0, 11.0, 9.0, 9.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.890625, -28.948974609375, -28.00732421875, -27.065673828125, -26.1240234375, -25.182373046875, -24.24072265625, -23.299072265625, -22.357421875, -21.415771484375, -20.47412109375, -19.532470703125, -18.5908203125, -17.649169921875, -16.70751953125, -15.765869140625, -14.82421875, -13.882568359375, -12.94091796875, -11.999267578125, -11.0576171875, -10.115966796875, -9.17431640625, -8.232666015625, -7.291015625, -6.349365234375, -5.40771484375, -4.466064453125, -3.5244140625, -2.582763671875, -1.64111328125, -0.699462890625, 0.2421875, 1.183837890625, 2.12548828125, 3.067138671875, 4.0087890625, 4.950439453125, 5.89208984375, 6.833740234375, 7.775390625, 8.717041015625, 9.65869140625, 10.600341796875, 11.5419921875, 12.483642578125, 13.42529296875, 14.366943359375, 15.30859375, 16.250244140625, 17.19189453125, 18.133544921875, 19.0751953125, 20.016845703125, 20.95849609375, 21.900146484375, 22.841796875, 23.783447265625, 24.72509765625, 25.666748046875, 26.6083984375, 27.550048828125, 28.49169921875, 29.433349609375, 30.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 6.0, 8.0, 7.0, 7.0, 16.0, 9.0, 12.0, 23.0, 21.0, 26.0, 23.0, 24.0, 30.0, 44.0, 38.0, 42.0, 41.0, 38.0, 41.0, 36.0, 45.0, 33.0, 36.0, 40.0, 41.0, 28.0, 27.0, 29.0, 24.0, 33.0, 28.0, 16.0, 10.0, 15.0, 21.0, 15.0, 14.0, 9.0, 5.0, 7.0, 6.0, 3.0, 8.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.45366668701172, -50.6524772644043, -48.85129165649414, -47.05010223388672, -45.2489128112793, -43.447723388671875, -41.64653778076172, -39.8453483581543, -38.044158935546875, -36.24296951293945, -34.4417839050293, -32.640594482421875, -30.839405059814453, -29.038217544555664, -27.237030029296875, -25.435840606689453, -23.634653091430664, -21.833465576171875, -20.032276153564453, -18.231088638305664, -16.429899215698242, -14.628711700439453, -12.827523231506348, -11.026334762573242, -9.225146293640137, -7.423957824707031, -5.622769355773926, -3.8215813636779785, -2.020392894744873, -0.21920490264892578, 1.5819835662841797, 3.383172035217285, 5.184360504150391, 6.985548973083496, 8.786737442016602, 10.58792495727539, 12.389114379882812, 14.190301895141602, 15.991490364074707, 17.792678833007812, 19.593868255615234, 21.395055770874023, 23.196245193481445, 24.997432708740234, 26.798622131347656, 28.599809646606445, 30.400997161865234, 32.202186584472656, 34.00337219238281, 35.804561614990234, 37.60574722290039, 39.40693664550781, 41.208126068115234, 43.009315490722656, 44.81050109863281, 46.611690521240234, 48.412879943847656, 50.21406936645508, 52.015254974365234, 53.816444396972656, 55.61763381958008, 57.4188232421875, 59.220008850097656, 61.02119827270508, 62.8223876953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 9.0, 7.0, 11.0, 12.0, 12.0, 19.0, 18.0, 19.0, 16.0, 23.0, 33.0, 36.0, 30.0, 36.0, 27.0, 40.0, 47.0, 36.0, 43.0, 28.0, 33.0, 48.0, 46.0, 33.0, 38.0, 43.0, 28.0, 31.0, 31.0, 23.0, 26.0, 15.0, 13.0, 13.0, 13.0, 9.0, 11.0, 8.0, 5.0, 9.0, 1.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-59.35512924194336, -57.40300750732422, -55.45088195800781, -53.49876022338867, -51.54663848876953, -49.594512939453125, -47.642391204833984, -45.690269470214844, -43.73814392089844, -41.7860221862793, -39.83389663696289, -37.88177490234375, -35.92965316772461, -33.97753143310547, -32.02540588378906, -30.073284149169922, -28.12116241455078, -26.169038772583008, -24.216917037963867, -22.264793395996094, -20.312671661376953, -18.36054801940918, -16.408424377441406, -14.45630168914795, -12.504179000854492, -10.552056312561035, -8.599933624267578, -6.647809982299805, -4.695687294006348, -2.7435646057128906, -0.7914409637451172, 1.1606817245483398, 3.1128082275390625, 5.0649309158325195, 7.017054080963135, 8.96917724609375, 10.921299934387207, 12.873422622680664, 14.825546264648438, 16.777667999267578, 18.72979164123535, 20.681915283203125, 22.634037017822266, 24.58616065979004, 26.538284301757812, 28.490406036376953, 30.442529678344727, 32.3946533203125, 34.34677505493164, 36.29889678955078, 38.25102233886719, 40.20314407348633, 42.15526580810547, 44.107391357421875, 46.059513092041016, 48.011634826660156, 49.96376037597656, 51.9158821105957, 53.86800765991211, 55.82012939453125, 57.77225112915039, 59.72437286376953, 61.67649841308594, 63.62862014770508, 65.58074188232422]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 3.0, 14.0, 17.0, 34.0, 60.0, 80.0, 124.0, 213.0, 316.0, 551.0, 890.0, 1403.0, 2415.0, 3822.0, 6190.0, 10068.0, 15631.0, 24099.0, 36110.0, 52881.0, 73214.0, 95966.0, 115330.0, 124420.0, 119704.0, 103653.0, 81756.0, 59845.0, 41990.0, 28283.0, 18457.0, 11608.0, 7405.0, 4586.0, 2902.0, 1713.0, 1056.0, 696.0, 404.0, 228.0, 166.0, 79.0, 68.0, 36.0, 27.0, 20.0, 7.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.15625, -13.70947265625, -13.2626953125, -12.81591796875, -12.369140625, -11.92236328125, -11.4755859375, -11.02880859375, -10.58203125, -10.13525390625, -9.6884765625, -9.24169921875, -8.794921875, -8.34814453125, -7.9013671875, -7.45458984375, -7.0078125, -6.56103515625, -6.1142578125, -5.66748046875, -5.220703125, -4.77392578125, -4.3271484375, -3.88037109375, -3.43359375, -2.98681640625, -2.5400390625, -2.09326171875, -1.646484375, -1.19970703125, -0.7529296875, -0.30615234375, 0.140625, 0.58740234375, 1.0341796875, 1.48095703125, 1.927734375, 2.37451171875, 2.8212890625, 3.26806640625, 3.71484375, 4.16162109375, 4.6083984375, 5.05517578125, 5.501953125, 5.94873046875, 6.3955078125, 6.84228515625, 7.2890625, 7.73583984375, 8.1826171875, 8.62939453125, 9.076171875, 9.52294921875, 9.9697265625, 10.41650390625, 10.86328125, 11.31005859375, 11.7568359375, 12.20361328125, 12.650390625, 13.09716796875, 13.5439453125, 13.99072265625, 14.4375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 8.0, 8.0, 11.0, 10.0, 13.0, 18.0, 19.0, 20.0, 17.0, 18.0, 39.0, 35.0, 30.0, 35.0, 28.0, 39.0, 47.0, 40.0, 38.0, 29.0, 35.0, 48.0, 45.0, 39.0, 31.0, 44.0, 30.0, 31.0, 29.0, 26.0, 22.0, 18.0, 12.0, 14.0, 11.0, 10.0, 11.0, 8.0, 3.0, 9.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-59.65625, -57.69384765625, -55.7314453125, -53.76904296875, -51.806640625, -49.84423828125, -47.8818359375, -45.91943359375, -43.95703125, -41.99462890625, -40.0322265625, -38.06982421875, -36.107421875, -34.14501953125, -32.1826171875, -30.22021484375, -28.2578125, -26.29541015625, -24.3330078125, -22.37060546875, -20.408203125, -18.44580078125, -16.4833984375, -14.52099609375, -12.55859375, -10.59619140625, -8.6337890625, -6.67138671875, -4.708984375, -2.74658203125, -0.7841796875, 1.17822265625, 3.140625, 5.10302734375, 7.0654296875, 9.02783203125, 10.990234375, 12.95263671875, 14.9150390625, 16.87744140625, 18.83984375, 20.80224609375, 22.7646484375, 24.72705078125, 26.689453125, 28.65185546875, 30.6142578125, 32.57666015625, 34.5390625, 36.50146484375, 38.4638671875, 40.42626953125, 42.388671875, 44.35107421875, 46.3134765625, 48.27587890625, 50.23828125, 52.20068359375, 54.1630859375, 56.12548828125, 58.087890625, 60.05029296875, 62.0126953125, 63.97509765625, 65.9375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 4.0, 5.0, 4.0, 3.0, 11.0, 7.0, 14.0, 24.0, 20.0, 39.0, 59.0, 87.0, 108.0, 163.0, 240.0, 439.0, 639.0, 1174.0, 1999.0, 3646.0, 6865.0, 13202.0, 26368.0, 129229.0, 792977.0, 35183.0, 16627.0, 8642.0, 4587.0, 2511.0, 1422.0, 845.0, 502.0, 306.0, 185.0, 131.0, 81.0, 50.0, 46.0, 31.0, 27.0, 16.0, 7.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-60.625, -58.7412109375, -56.857421875, -54.9736328125, -53.08984375, -51.2060546875, -49.322265625, -47.4384765625, -45.5546875, -43.6708984375, -41.787109375, -39.9033203125, -38.01953125, -36.1357421875, -34.251953125, -32.3681640625, -30.484375, -28.6005859375, -26.716796875, -24.8330078125, -22.94921875, -21.0654296875, -19.181640625, -17.2978515625, -15.4140625, -13.5302734375, -11.646484375, -9.7626953125, -7.87890625, -5.9951171875, -4.111328125, -2.2275390625, -0.34375, 1.5400390625, 3.423828125, 5.3076171875, 7.19140625, 9.0751953125, 10.958984375, 12.8427734375, 14.7265625, 16.6103515625, 18.494140625, 20.3779296875, 22.26171875, 24.1455078125, 26.029296875, 27.9130859375, 29.796875, 31.6806640625, 33.564453125, 35.4482421875, 37.33203125, 39.2158203125, 41.099609375, 42.9833984375, 44.8671875, 46.7509765625, 48.634765625, 50.5185546875, 52.40234375, 54.2861328125, 56.169921875, 58.0537109375, 59.9375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 9.0, 6.0, 12.0, 8.0, 12.0, 10.0, 9.0, 14.0, 21.0, 21.0, 30.0, 26.0, 38.0, 43.0, 35.0, 37.0, 32.0, 52.0, 44.0, 42.0, 45.0, 40.0, 45.0, 48.0, 34.0, 34.0, 31.0, 35.0, 18.0, 28.0, 18.0, 20.0, 15.0, 15.0, 17.0, 9.0, 11.0, 5.0, 6.0, 6.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.25, -42.8720703125, -41.494140625, -40.1162109375, -38.73828125, -37.3603515625, -35.982421875, -34.6044921875, -33.2265625, -31.8486328125, -30.470703125, -29.0927734375, -27.71484375, -26.3369140625, -24.958984375, -23.5810546875, -22.203125, -20.8251953125, -19.447265625, -18.0693359375, -16.69140625, -15.3134765625, -13.935546875, -12.5576171875, -11.1796875, -9.8017578125, -8.423828125, -7.0458984375, -5.66796875, -4.2900390625, -2.912109375, -1.5341796875, -0.15625, 1.2216796875, 2.599609375, 3.9775390625, 5.35546875, 6.7333984375, 8.111328125, 9.4892578125, 10.8671875, 12.2451171875, 13.623046875, 15.0009765625, 16.37890625, 17.7568359375, 19.134765625, 20.5126953125, 21.890625, 23.2685546875, 24.646484375, 26.0244140625, 27.40234375, 28.7802734375, 30.158203125, 31.5361328125, 32.9140625, 34.2919921875, 35.669921875, 37.0478515625, 38.42578125, 39.8037109375, 41.181640625, 42.5595703125, 43.9375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 7.0, 2.0, 16.0, 13.0, 19.0, 28.0, 33.0, 48.0, 77.0, 89.0, 155.0, 211.0, 281.0, 489.0, 751.0, 1220.0, 2022.0, 3565.0, 5928.0, 10030.0, 18880.0, 38460.0, 779718.0, 126165.0, 26697.0, 14171.0, 7758.0, 4594.0, 2651.0, 1598.0, 953.0, 608.0, 423.0, 267.0, 174.0, 132.0, 93.0, 66.0, 36.0, 34.0, 25.0, 17.0, 16.0, 11.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.078125, -2.981231689453125, -2.88433837890625, -2.787445068359375, -2.6905517578125, -2.593658447265625, -2.49676513671875, -2.399871826171875, -2.302978515625, -2.206085205078125, -2.10919189453125, -2.012298583984375, -1.9154052734375, -1.818511962890625, -1.72161865234375, -1.624725341796875, -1.52783203125, -1.430938720703125, -1.33404541015625, -1.237152099609375, -1.1402587890625, -1.043365478515625, -0.94647216796875, -0.849578857421875, -0.752685546875, -0.655792236328125, -0.55889892578125, -0.462005615234375, -0.3651123046875, -0.268218994140625, -0.17132568359375, -0.074432373046875, 0.0224609375, 0.119354248046875, 0.21624755859375, 0.313140869140625, 0.4100341796875, 0.506927490234375, 0.60382080078125, 0.700714111328125, 0.797607421875, 0.894500732421875, 0.99139404296875, 1.088287353515625, 1.1851806640625, 1.282073974609375, 1.37896728515625, 1.475860595703125, 1.57275390625, 1.669647216796875, 1.76654052734375, 1.863433837890625, 1.9603271484375, 2.057220458984375, 2.15411376953125, 2.251007080078125, 2.347900390625, 2.444793701171875, 2.54168701171875, 2.638580322265625, 2.7354736328125, 2.832366943359375, 2.92926025390625, 3.026153564453125, 3.123046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 5.0, 6.0, 11.0, 13.0, 12.0, 15.0, 21.0, 24.0, 40.0, 51.0, 60.0, 60.0, 76.0, 69.0, 48.0, 80.0, 82.0, 57.0, 52.0, 42.0, 32.0, 31.0, 22.0, 10.0, 19.0, 10.0, 10.0, 9.0, 6.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001575946807861328, -0.0001520290970802307, -0.0001464635133743286, -0.00014089792966842651, -0.00013533234596252441, -0.00012976676225662231, -0.00012420117855072021, -0.00011863559484481812, -0.00011307001113891602, -0.00010750442743301392, -0.00010193884372711182, -9.637326002120972e-05, -9.080767631530762e-05, -8.524209260940552e-05, -7.967650890350342e-05, -7.411092519760132e-05, -6.854534149169922e-05, -6.297975778579712e-05, -5.741417407989502e-05, -5.184859037399292e-05, -4.628300666809082e-05, -4.071742296218872e-05, -3.515183925628662e-05, -2.958625555038452e-05, -2.4020671844482422e-05, -1.8455088138580322e-05, -1.2889504432678223e-05, -7.323920726776123e-06, -1.7583370208740234e-06, 3.807246685028076e-06, 9.372830390930176e-06, 1.4938414096832275e-05, 2.0503997802734375e-05, 2.6069581508636475e-05, 3.1635165214538574e-05, 3.7200748920440674e-05, 4.2766332626342773e-05, 4.833191633224487e-05, 5.389750003814697e-05, 5.946308374404907e-05, 6.502866744995117e-05, 7.059425115585327e-05, 7.615983486175537e-05, 8.172541856765747e-05, 8.729100227355957e-05, 9.285658597946167e-05, 9.842216968536377e-05, 0.00010398775339126587, 0.00010955333709716797, 0.00011511892080307007, 0.00012068450450897217, 0.00012625008821487427, 0.00013181567192077637, 0.00013738125562667847, 0.00014294683933258057, 0.00014851242303848267, 0.00015407800674438477, 0.00015964359045028687, 0.00016520917415618896, 0.00017077475786209106, 0.00017634034156799316, 0.00018190592527389526, 0.00018747150897979736, 0.00019303709268569946, 0.00019860267639160156]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 8.0, 8.0, 18.0, 17.0, 34.0, 59.0, 85.0, 115.0, 218.0, 352.0, 536.0, 769.0, 1219.0, 1936.0, 3008.0, 4623.0, 7230.0, 11011.0, 16365.0, 23813.0, 34252.0, 48244.0, 64622.0, 82775.0, 100291.0, 112705.0, 113801.0, 103428.0, 86222.0, 67624.0, 50612.0, 36157.0, 25641.0, 17367.0, 11588.0, 7730.0, 5008.0, 3168.0, 2147.0, 1326.0, 848.0, 578.0, 381.0, 224.0, 153.0, 82.0, 58.0, 41.0, 30.0, 14.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.025390625, -1.95574951171875, -1.8861083984375, -1.81646728515625, -1.746826171875, -1.67718505859375, -1.6075439453125, -1.53790283203125, -1.46826171875, -1.39862060546875, -1.3289794921875, -1.25933837890625, -1.189697265625, -1.12005615234375, -1.0504150390625, -0.98077392578125, -0.9111328125, -0.84149169921875, -0.7718505859375, -0.70220947265625, -0.632568359375, -0.56292724609375, -0.4932861328125, -0.42364501953125, -0.35400390625, -0.28436279296875, -0.2147216796875, -0.14508056640625, -0.075439453125, -0.00579833984375, 0.0638427734375, 0.13348388671875, 0.203125, 0.27276611328125, 0.3424072265625, 0.41204833984375, 0.481689453125, 0.55133056640625, 0.6209716796875, 0.69061279296875, 0.76025390625, 0.82989501953125, 0.8995361328125, 0.96917724609375, 1.038818359375, 1.10845947265625, 1.1781005859375, 1.24774169921875, 1.3173828125, 1.38702392578125, 1.4566650390625, 1.52630615234375, 1.595947265625, 1.66558837890625, 1.7352294921875, 1.80487060546875, 1.87451171875, 1.94415283203125, 2.0137939453125, 2.08343505859375, 2.153076171875, 2.22271728515625, 2.2923583984375, 2.36199951171875, 2.431640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 9.0, 9.0, 14.0, 17.0, 19.0, 10.0, 21.0, 29.0, 28.0, 32.0, 40.0, 35.0, 52.0, 36.0, 37.0, 52.0, 46.0, 50.0, 45.0, 42.0, 42.0, 43.0, 53.0, 38.0, 30.0, 22.0, 18.0, 20.0, 27.0, 13.0, 19.0, 10.0, 5.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.103515625, -1.070770263671875, -1.03802490234375, -1.005279541015625, -0.9725341796875, -0.939788818359375, -0.90704345703125, -0.874298095703125, -0.841552734375, -0.808807373046875, -0.77606201171875, -0.743316650390625, -0.7105712890625, -0.677825927734375, -0.64508056640625, -0.612335205078125, -0.57958984375, -0.546844482421875, -0.51409912109375, -0.481353759765625, -0.4486083984375, -0.415863037109375, -0.38311767578125, -0.350372314453125, -0.317626953125, -0.284881591796875, -0.25213623046875, -0.219390869140625, -0.1866455078125, -0.153900146484375, -0.12115478515625, -0.088409423828125, -0.0556640625, -0.022918701171875, 0.00982666015625, 0.042572021484375, 0.0753173828125, 0.108062744140625, 0.14080810546875, 0.173553466796875, 0.206298828125, 0.239044189453125, 0.27178955078125, 0.304534912109375, 0.3372802734375, 0.370025634765625, 0.40277099609375, 0.435516357421875, 0.46826171875, 0.501007080078125, 0.53375244140625, 0.566497802734375, 0.5992431640625, 0.631988525390625, 0.66473388671875, 0.697479248046875, 0.730224609375, 0.762969970703125, 0.79571533203125, 0.828460693359375, 0.8612060546875, 0.893951416015625, 0.92669677734375, 0.959442138671875, 0.9921875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 8.0, 4.0, 10.0, 4.0, 9.0, 11.0, 9.0, 13.0, 21.0, 16.0, 15.0, 19.0, 27.0, 26.0, 34.0, 36.0, 38.0, 41.0, 47.0, 31.0, 36.0, 53.0, 29.0, 40.0, 39.0, 42.0, 30.0, 29.0, 28.0, 30.0, 35.0, 26.0, 27.0, 17.0, 8.0, 19.0, 17.0, 19.0, 10.0, 10.0, 5.0, 10.0, 3.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.127662658691406, -53.357574462890625, -51.587486267089844, -49.81739807128906, -48.047306060791016, -46.277217864990234, -44.50712966918945, -42.73704147338867, -40.966949462890625, -39.196861267089844, -37.42677307128906, -35.65668487548828, -33.886592864990234, -32.11650466918945, -30.346416473388672, -28.57632827758789, -26.80624008178711, -25.036151885986328, -23.266061782836914, -21.495973587036133, -19.72588348388672, -17.955795288085938, -16.185707092285156, -14.415617942810059, -12.645528793334961, -10.875439643859863, -9.105350494384766, -7.335262298583984, -5.565173149108887, -3.795083999633789, -2.024995803833008, -0.25490665435791016, 1.5151824951171875, 3.285271406173706, 5.055360317230225, 6.825448989868164, 8.595538139343262, 10.36562728881836, 12.13571548461914, 13.905804634094238, 15.675893783569336, 17.445981979370117, 19.21607208251953, 20.986160278320312, 22.756248474121094, 24.526338577270508, 26.29642677307129, 28.066516876220703, 29.836605072021484, 31.606693267822266, 33.37678146362305, 35.146873474121094, 36.916961669921875, 38.687049865722656, 40.45713806152344, 42.22722625732422, 43.997314453125, 45.76740264892578, 47.53749084472656, 49.307579040527344, 51.07767105102539, 52.84775924682617, 54.61784744262695, 56.387935638427734, 58.15802764892578]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 9.0, 7.0, 11.0, 9.0, 14.0, 17.0, 20.0, 18.0, 20.0, 19.0, 32.0, 40.0, 28.0, 36.0, 26.0, 42.0, 48.0, 38.0, 40.0, 28.0, 37.0, 41.0, 46.0, 41.0, 33.0, 41.0, 34.0, 33.0, 27.0, 27.0, 20.0, 17.0, 13.0, 11.0, 15.0, 11.0, 12.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-60.02375793457031, -58.05263900756836, -56.08151626586914, -54.11039733886719, -52.13927459716797, -50.168155670166016, -48.19703674316406, -46.225914001464844, -44.25479507446289, -42.28367614746094, -40.31255340576172, -38.341434478759766, -36.37031555175781, -34.399192810058594, -32.42807388305664, -30.456953048706055, -28.48583221435547, -26.514711380004883, -24.543590545654297, -22.572471618652344, -20.601350784301758, -18.630229949951172, -16.65911102294922, -14.687990188598633, -12.716869354248047, -10.745748519897461, -8.774628639221191, -6.803508281707764, -4.832387924194336, -2.86126708984375, -0.8901472091674805, 1.080972671508789, 3.052093505859375, 5.023213863372803, 6.9943342208862305, 8.9654541015625, 10.936574935913086, 12.907695770263672, 14.878815650939941, 16.84993553161621, 18.821056365966797, 20.792177200317383, 22.76329803466797, 24.734416961669922, 26.705537796020508, 28.676658630371094, 30.647777557373047, 32.618896484375, 34.59001922607422, 36.56113815307617, 38.53226089477539, 40.503379821777344, 42.47450256347656, 44.445621490478516, 46.41674041748047, 48.38786315917969, 50.35898208618164, 52.330101013183594, 54.30122375488281, 56.272342681884766, 58.24346160888672, 60.21458435058594, 62.18570327758789, 64.15682220458984, 66.12794494628906]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 6.0, 9.0, 14.0, 16.0, 36.0, 59.0, 95.0, 172.0, 276.0, 516.0, 975.0, 1753.0, 3279.0, 6053.0, 10554.0, 18216.0, 29788.0, 45599.0, 65871.0, 87032.0, 107752.0, 120799.0, 122597.0, 114046.0, 96165.0, 74650.0, 53696.0, 35700.0, 22391.0, 13522.0, 7697.0, 4174.0, 2269.0, 1205.0, 677.0, 364.0, 196.0, 119.0, 76.0, 49.0, 25.0, 22.0, 15.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.28125, -50.60595703125, -48.9306640625, -47.25537109375, -45.580078125, -43.90478515625, -42.2294921875, -40.55419921875, -38.87890625, -37.20361328125, -35.5283203125, -33.85302734375, -32.177734375, -30.50244140625, -28.8271484375, -27.15185546875, -25.4765625, -23.80126953125, -22.1259765625, -20.45068359375, -18.775390625, -17.10009765625, -15.4248046875, -13.74951171875, -12.07421875, -10.39892578125, -8.7236328125, -7.04833984375, -5.373046875, -3.69775390625, -2.0224609375, -0.34716796875, 1.328125, 3.00341796875, 4.6787109375, 6.35400390625, 8.029296875, 9.70458984375, 11.3798828125, 13.05517578125, 14.73046875, 16.40576171875, 18.0810546875, 19.75634765625, 21.431640625, 23.10693359375, 24.7822265625, 26.45751953125, 28.1328125, 29.80810546875, 31.4833984375, 33.15869140625, 34.833984375, 36.50927734375, 38.1845703125, 39.85986328125, 41.53515625, 43.21044921875, 44.8857421875, 46.56103515625, 48.236328125, 49.91162109375, 51.5869140625, 53.26220703125, 54.9375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 9.0, 7.0, 8.0, 10.0, 15.0, 13.0, 26.0, 16.0, 20.0, 18.0, 36.0, 36.0, 29.0, 39.0, 23.0, 43.0, 54.0, 33.0, 38.0, 34.0, 34.0, 48.0, 43.0, 44.0, 32.0, 42.0, 27.0, 33.0, 26.0, 30.0, 21.0, 16.0, 13.0, 12.0, 11.0, 14.0, 10.0, 4.0, 5.0, 8.0, 1.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-58.4375, -56.513671875, -54.58984375, -52.666015625, -50.7421875, -48.818359375, -46.89453125, -44.970703125, -43.046875, -41.123046875, -39.19921875, -37.275390625, -35.3515625, -33.427734375, -31.50390625, -29.580078125, -27.65625, -25.732421875, -23.80859375, -21.884765625, -19.9609375, -18.037109375, -16.11328125, -14.189453125, -12.265625, -10.341796875, -8.41796875, -6.494140625, -4.5703125, -2.646484375, -0.72265625, 1.201171875, 3.125, 5.048828125, 6.97265625, 8.896484375, 10.8203125, 12.744140625, 14.66796875, 16.591796875, 18.515625, 20.439453125, 22.36328125, 24.287109375, 26.2109375, 28.134765625, 30.05859375, 31.982421875, 33.90625, 35.830078125, 37.75390625, 39.677734375, 41.6015625, 43.525390625, 45.44921875, 47.373046875, 49.296875, 51.220703125, 53.14453125, 55.068359375, 56.9921875, 58.916015625, 60.83984375, 62.763671875, 64.6875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 9.0, 9.0, 14.0, 28.0, 42.0, 72.0, 118.0, 232.0, 400.0, 716.0, 1124.0, 1976.0, 3389.0, 5614.0, 9282.0, 14744.0, 22655.0, 33012.0, 47160.0, 62745.0, 79667.0, 93982.0, 104757.0, 106934.0, 102408.0, 91338.0, 76778.0, 59012.0, 44307.0, 30819.0, 20864.0, 13379.0, 8519.0, 5105.0, 3097.0, 1836.0, 1080.0, 566.0, 343.0, 185.0, 89.0, 62.0, 40.0, 27.0, 13.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.34375, -36.9443359375, -35.544921875, -34.1455078125, -32.74609375, -31.3466796875, -29.947265625, -28.5478515625, -27.1484375, -25.7490234375, -24.349609375, -22.9501953125, -21.55078125, -20.1513671875, -18.751953125, -17.3525390625, -15.953125, -14.5537109375, -13.154296875, -11.7548828125, -10.35546875, -8.9560546875, -7.556640625, -6.1572265625, -4.7578125, -3.3583984375, -1.958984375, -0.5595703125, 0.83984375, 2.2392578125, 3.638671875, 5.0380859375, 6.4375, 7.8369140625, 9.236328125, 10.6357421875, 12.03515625, 13.4345703125, 14.833984375, 16.2333984375, 17.6328125, 19.0322265625, 20.431640625, 21.8310546875, 23.23046875, 24.6298828125, 26.029296875, 27.4287109375, 28.828125, 30.2275390625, 31.626953125, 33.0263671875, 34.42578125, 35.8251953125, 37.224609375, 38.6240234375, 40.0234375, 41.4228515625, 42.822265625, 44.2216796875, 45.62109375, 47.0205078125, 48.419921875, 49.8193359375, 51.21875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 8.0, 3.0, 5.0, 9.0, 8.0, 14.0, 10.0, 17.0, 14.0, 11.0, 23.0, 24.0, 23.0, 24.0, 28.0, 41.0, 33.0, 40.0, 40.0, 33.0, 30.0, 39.0, 31.0, 45.0, 52.0, 33.0, 31.0, 33.0, 26.0, 36.0, 30.0, 23.0, 31.0, 32.0, 17.0, 18.0, 14.0, 13.0, 6.0, 11.0, 11.0, 7.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.15625, -37.95361328125, -36.7509765625, -35.54833984375, -34.345703125, -33.14306640625, -31.9404296875, -30.73779296875, -29.53515625, -28.33251953125, -27.1298828125, -25.92724609375, -24.724609375, -23.52197265625, -22.3193359375, -21.11669921875, -19.9140625, -18.71142578125, -17.5087890625, -16.30615234375, -15.103515625, -13.90087890625, -12.6982421875, -11.49560546875, -10.29296875, -9.09033203125, -7.8876953125, -6.68505859375, -5.482421875, -4.27978515625, -3.0771484375, -1.87451171875, -0.671875, 0.53076171875, 1.7333984375, 2.93603515625, 4.138671875, 5.34130859375, 6.5439453125, 7.74658203125, 8.94921875, 10.15185546875, 11.3544921875, 12.55712890625, 13.759765625, 14.96240234375, 16.1650390625, 17.36767578125, 18.5703125, 19.77294921875, 20.9755859375, 22.17822265625, 23.380859375, 24.58349609375, 25.7861328125, 26.98876953125, 28.19140625, 29.39404296875, 30.5966796875, 31.79931640625, 33.001953125, 34.20458984375, 35.4072265625, 36.60986328125, 37.8125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 7.0, 9.0, 15.0, 16.0, 28.0, 40.0, 63.0, 83.0, 112.0, 171.0, 281.0, 409.0, 635.0, 965.0, 1399.0, 2245.0, 3617.0, 5312.0, 8165.0, 12283.0, 17880.0, 26066.0, 36264.0, 49083.0, 62972.0, 77076.0, 89514.0, 97786.0, 99381.0, 95072.0, 85738.0, 72287.0, 57817.0, 44470.0, 32111.0, 22807.0, 15819.0, 10431.0, 6795.0, 4734.0, 2943.0, 1986.0, 1300.0, 824.0, 539.0, 323.0, 233.0, 148.0, 86.0, 76.0, 56.0, 29.0, 27.0, 15.0, 9.0, 8.0, 6.0, 1.0, 2.0, 2.0], "bins": [-15.8359375, -15.345947265625, -14.85595703125, -14.365966796875, -13.8759765625, -13.385986328125, -12.89599609375, -12.406005859375, -11.916015625, -11.426025390625, -10.93603515625, -10.446044921875, -9.9560546875, -9.466064453125, -8.97607421875, -8.486083984375, -7.99609375, -7.506103515625, -7.01611328125, -6.526123046875, -6.0361328125, -5.546142578125, -5.05615234375, -4.566162109375, -4.076171875, -3.586181640625, -3.09619140625, -2.606201171875, -2.1162109375, -1.626220703125, -1.13623046875, -0.646240234375, -0.15625, 0.333740234375, 0.82373046875, 1.313720703125, 1.8037109375, 2.293701171875, 2.78369140625, 3.273681640625, 3.763671875, 4.253662109375, 4.74365234375, 5.233642578125, 5.7236328125, 6.213623046875, 6.70361328125, 7.193603515625, 7.68359375, 8.173583984375, 8.66357421875, 9.153564453125, 9.6435546875, 10.133544921875, 10.62353515625, 11.113525390625, 11.603515625, 12.093505859375, 12.58349609375, 13.073486328125, 13.5634765625, 14.053466796875, 14.54345703125, 15.033447265625, 15.5234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 17.0, 15.0, 18.0, 19.0, 26.0, 39.0, 36.0, 37.0, 51.0, 31.0, 60.0, 44.0, 61.0, 63.0, 59.0, 51.0, 43.0, 43.0, 31.0, 43.0, 34.0, 38.0, 26.0, 23.0, 23.0, 13.0, 8.0, 11.0, 4.0, 3.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002838134765625, -0.0027550160884857178, -0.0026718974113464355, -0.0025887787342071533, -0.002505660057067871, -0.002422541379928589, -0.0023394227027893066, -0.0022563040256500244, -0.002173185348510742, -0.00209006667137146, -0.0020069479942321777, -0.0019238293170928955, -0.0018407106399536133, -0.001757591962814331, -0.0016744732856750488, -0.0015913546085357666, -0.0015082359313964844, -0.0014251172542572021, -0.00134199857711792, -0.0012588798999786377, -0.0011757612228393555, -0.0010926425457000732, -0.001009523868560791, -0.0009264051914215088, -0.0008432865142822266, -0.0007601678371429443, -0.0006770491600036621, -0.0005939304828643799, -0.0005108118057250977, -0.00042769312858581543, -0.0003445744514465332, -0.000261455774307251, -0.00017833709716796875, -9.521842002868652e-05, -1.2099742889404297e-05, 7.101893424987793e-05, 0.00015413761138916016, 0.00023725628852844238, 0.0003203749656677246, 0.00040349364280700684, 0.00048661231994628906, 0.0005697309970855713, 0.0006528496742248535, 0.0007359683513641357, 0.000819087028503418, 0.0009022057056427002, 0.0009853243827819824, 0.0010684430599212646, 0.0011515617370605469, 0.001234680414199829, 0.0013177990913391113, 0.0014009177684783936, 0.0014840364456176758, 0.001567155122756958, 0.0016502737998962402, 0.0017333924770355225, 0.0018165111541748047, 0.001899629831314087, 0.001982748508453369, 0.0020658671855926514, 0.0021489858627319336, 0.002232104539871216, 0.002315223217010498, 0.0023983418941497803, 0.0024814605712890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 17.0, 24.0, 27.0, 30.0, 61.0, 108.0, 164.0, 246.0, 413.0, 645.0, 1092.0, 1808.0, 2903.0, 4750.0, 7764.0, 12540.0, 20049.0, 30420.0, 44945.0, 63377.0, 83710.0, 102572.0, 115229.0, 118124.0, 110168.0, 94337.0, 74417.0, 54443.0, 37555.0, 24931.0, 16044.0, 9984.0, 6040.0, 3722.0, 2251.0, 1362.0, 903.0, 517.0, 304.0, 210.0, 135.0, 68.0, 40.0, 41.0, 23.0, 16.0, 14.0, 3.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.453125, -18.788330078125, -18.12353515625, -17.458740234375, -16.7939453125, -16.129150390625, -15.46435546875, -14.799560546875, -14.134765625, -13.469970703125, -12.80517578125, -12.140380859375, -11.4755859375, -10.810791015625, -10.14599609375, -9.481201171875, -8.81640625, -8.151611328125, -7.48681640625, -6.822021484375, -6.1572265625, -5.492431640625, -4.82763671875, -4.162841796875, -3.498046875, -2.833251953125, -2.16845703125, -1.503662109375, -0.8388671875, -0.174072265625, 0.49072265625, 1.155517578125, 1.8203125, 2.485107421875, 3.14990234375, 3.814697265625, 4.4794921875, 5.144287109375, 5.80908203125, 6.473876953125, 7.138671875, 7.803466796875, 8.46826171875, 9.133056640625, 9.7978515625, 10.462646484375, 11.12744140625, 11.792236328125, 12.45703125, 13.121826171875, 13.78662109375, 14.451416015625, 15.1162109375, 15.781005859375, 16.44580078125, 17.110595703125, 17.775390625, 18.440185546875, 19.10498046875, 19.769775390625, 20.4345703125, 21.099365234375, 21.76416015625, 22.428955078125, 23.09375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 12.0, 5.0, 14.0, 4.0, 12.0, 12.0, 17.0, 20.0, 21.0, 21.0, 28.0, 17.0, 27.0, 39.0, 48.0, 33.0, 33.0, 33.0, 45.0, 51.0, 48.0, 30.0, 41.0, 34.0, 43.0, 40.0, 25.0, 28.0, 21.0, 21.0, 20.0, 20.0, 14.0, 23.0, 27.0, 9.0, 9.0, 9.0, 9.0, 4.0, 5.0, 6.0, 1.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.96484375, -7.69805908203125, -7.4312744140625, -7.16448974609375, -6.897705078125, -6.63092041015625, -6.3641357421875, -6.09735107421875, -5.83056640625, -5.56378173828125, -5.2969970703125, -5.03021240234375, -4.763427734375, -4.49664306640625, -4.2298583984375, -3.96307373046875, -3.6962890625, -3.42950439453125, -3.1627197265625, -2.89593505859375, -2.629150390625, -2.36236572265625, -2.0955810546875, -1.82879638671875, -1.56201171875, -1.29522705078125, -1.0284423828125, -0.76165771484375, -0.494873046875, -0.22808837890625, 0.0386962890625, 0.30548095703125, 0.572265625, 0.83905029296875, 1.1058349609375, 1.37261962890625, 1.639404296875, 1.90618896484375, 2.1729736328125, 2.43975830078125, 2.70654296875, 2.97332763671875, 3.2401123046875, 3.50689697265625, 3.773681640625, 4.04046630859375, 4.3072509765625, 4.57403564453125, 4.8408203125, 5.10760498046875, 5.3743896484375, 5.64117431640625, 5.907958984375, 6.17474365234375, 6.4415283203125, 6.70831298828125, 6.97509765625, 7.24188232421875, 7.5086669921875, 7.77545166015625, 8.042236328125, 8.30902099609375, 8.5758056640625, 8.84259033203125, 9.109375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 10.0, 2.0, 10.0, 9.0, 11.0, 8.0, 8.0, 11.0, 16.0, 22.0, 16.0, 13.0, 27.0, 34.0, 32.0, 33.0, 41.0, 40.0, 37.0, 28.0, 31.0, 46.0, 32.0, 44.0, 40.0, 32.0, 29.0, 30.0, 28.0, 26.0, 26.0, 23.0, 28.0, 26.0, 27.0, 18.0, 25.0, 9.0, 9.0, 9.0, 9.0, 8.0, 9.0, 5.0, 6.0, 2.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-56.527687072753906, -54.86153030395508, -53.19537353515625, -51.52921676635742, -49.863059997558594, -48.19690704345703, -46.53074645996094, -44.864593505859375, -43.19843673706055, -41.53227996826172, -39.86612319946289, -38.19996643066406, -36.533809661865234, -34.867652893066406, -33.201499938964844, -31.535343170166016, -29.869184494018555, -28.203027725219727, -26.5368709564209, -24.870716094970703, -23.204559326171875, -21.538402557373047, -19.87224578857422, -18.20608901977539, -16.539932250976562, -14.873775482177734, -13.207619667053223, -11.541462898254395, -9.875307083129883, -8.209150314331055, -6.542993545532227, -4.876837730407715, -3.210681915283203, -1.5445255041122437, 0.12163090705871582, 1.7877874374389648, 3.4539437294006348, 5.120100021362305, 6.786256790161133, 8.452412605285645, 10.118569374084473, 11.7847261428833, 13.450881958007812, 15.11703872680664, 16.78319549560547, 18.449352264404297, 20.115509033203125, 21.78166389465332, 23.44782066345215, 25.113977432250977, 26.780134201049805, 28.4462890625, 30.112445831298828, 31.778602600097656, 33.444759368896484, 35.11091613769531, 36.77707290649414, 38.44322967529297, 40.1093864440918, 41.775543212890625, 43.44169998168945, 45.10785675048828, 46.774009704589844, 48.44016647338867, 50.1063232421875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 15.0, 14.0, 8.0, 20.0, 10.0, 17.0, 20.0, 28.0, 23.0, 25.0, 34.0, 37.0, 38.0, 29.0, 38.0, 52.0, 34.0, 47.0, 45.0, 46.0, 43.0, 40.0, 39.0, 39.0, 30.0, 42.0, 25.0, 26.0, 16.0, 22.0, 20.0, 16.0, 13.0, 9.0, 9.0, 7.0, 3.0, 5.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.81147384643555, -55.67109680175781, -53.53071594238281, -51.39033889770508, -49.249961853027344, -47.109580993652344, -44.96920394897461, -42.828826904296875, -40.688446044921875, -38.54806900024414, -36.40768814086914, -34.267311096191406, -32.12693405151367, -29.986555099487305, -27.846176147460938, -25.705799102783203, -23.56542205810547, -21.4250431060791, -19.284666061401367, -17.144287109375, -15.00390911102295, -12.863531112670898, -10.723152160644531, -8.58277416229248, -6.44239616394043, -4.302018165588379, -2.16163969039917, -0.021261215209960938, 2.11911678314209, 4.259494781494141, 6.399873733520508, 8.540251731872559, 10.680633544921875, 12.821011543273926, 14.961389541625977, 17.101768493652344, 19.242145538330078, 21.382524490356445, 23.522903442382812, 25.663280487060547, 27.803659439086914, 29.94403839111328, 32.084415435791016, 34.22479248046875, 36.36517333984375, 38.505550384521484, 40.64592742919922, 42.78630828857422, 44.92668533325195, 47.06706237792969, 49.20744323730469, 51.34782028198242, 53.488197326660156, 55.628578186035156, 57.76895523071289, 59.909332275390625, 62.049713134765625, 64.19009399414062, 66.3304672241211, 68.4708480834961, 70.6112289428711, 72.75160217285156, 74.89198303222656, 77.03236389160156, 79.17273712158203]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 24.0, 28.0, 47.0, 82.0, 129.0, 243.0, 456.0, 780.0, 1201.0, 2057.0, 3362.0, 5304.0, 8751.0, 13824.0, 22019.0, 34292.0, 52399.0, 78231.0, 114713.0, 160931.0, 217855.0, 277919.0, 339984.0, 388691.0, 414729.0, 409730.0, 381396.0, 329633.0, 267333.0, 206089.0, 149846.0, 106846.0, 72593.0, 47944.0, 31307.0, 20228.0, 12459.0, 7981.0, 4838.0, 3064.0, 1999.0, 1133.0, 712.0, 421.0, 230.0, 164.0, 113.0, 71.0, 43.0, 27.0, 10.0, 11.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-41.8125, -40.45947265625, -39.1064453125, -37.75341796875, -36.400390625, -35.04736328125, -33.6943359375, -32.34130859375, -30.98828125, -29.63525390625, -28.2822265625, -26.92919921875, -25.576171875, -24.22314453125, -22.8701171875, -21.51708984375, -20.1640625, -18.81103515625, -17.4580078125, -16.10498046875, -14.751953125, -13.39892578125, -12.0458984375, -10.69287109375, -9.33984375, -7.98681640625, -6.6337890625, -5.28076171875, -3.927734375, -2.57470703125, -1.2216796875, 0.13134765625, 1.484375, 2.83740234375, 4.1904296875, 5.54345703125, 6.896484375, 8.24951171875, 9.6025390625, 10.95556640625, 12.30859375, 13.66162109375, 15.0146484375, 16.36767578125, 17.720703125, 19.07373046875, 20.4267578125, 21.77978515625, 23.1328125, 24.48583984375, 25.8388671875, 27.19189453125, 28.544921875, 29.89794921875, 31.2509765625, 32.60400390625, 33.95703125, 35.31005859375, 36.6630859375, 38.01611328125, 39.369140625, 40.72216796875, 42.0751953125, 43.42822265625, 44.78125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 16.0, 11.0, 8.0, 15.0, 16.0, 19.0, 18.0, 30.0, 19.0, 21.0, 37.0, 42.0, 26.0, 37.0, 37.0, 44.0, 39.0, 42.0, 52.0, 41.0, 39.0, 42.0, 38.0, 40.0, 37.0, 36.0, 29.0, 20.0, 22.0, 19.0, 18.0, 20.0, 15.0, 9.0, 10.0, 7.0, 4.0, 5.0, 4.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.03125, -49.15478515625, -47.2783203125, -45.40185546875, -43.525390625, -41.64892578125, -39.7724609375, -37.89599609375, -36.01953125, -34.14306640625, -32.2666015625, -30.39013671875, -28.513671875, -26.63720703125, -24.7607421875, -22.88427734375, -21.0078125, -19.13134765625, -17.2548828125, -15.37841796875, -13.501953125, -11.62548828125, -9.7490234375, -7.87255859375, -5.99609375, -4.11962890625, -2.2431640625, -0.36669921875, 1.509765625, 3.38623046875, 5.2626953125, 7.13916015625, 9.015625, 10.89208984375, 12.7685546875, 14.64501953125, 16.521484375, 18.39794921875, 20.2744140625, 22.15087890625, 24.02734375, 25.90380859375, 27.7802734375, 29.65673828125, 31.533203125, 33.40966796875, 35.2861328125, 37.16259765625, 39.0390625, 40.91552734375, 42.7919921875, 44.66845703125, 46.544921875, 48.42138671875, 50.2978515625, 52.17431640625, 54.05078125, 55.92724609375, 57.8037109375, 59.68017578125, 61.556640625, 63.43310546875, 65.3095703125, 67.18603515625, 69.0625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 5.0, 15.0, 27.0, 46.0, 93.0, 190.0, 295.0, 500.0, 884.0, 1591.0, 2477.0, 4332.0, 7086.0, 11487.0, 18468.0, 29606.0, 45764.0, 68623.0, 101308.0, 140926.0, 191202.0, 248418.0, 304618.0, 354182.0, 387647.0, 398152.0, 384156.0, 348207.0, 299060.0, 242316.0, 185788.0, 137275.0, 95939.0, 66231.0, 44127.0, 28019.0, 17582.0, 11051.0, 6751.0, 4085.0, 2358.0, 1403.0, 824.0, 485.0, 284.0, 170.0, 92.0, 71.0, 35.0, 16.0, 12.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-46.46875, -45.03662109375, -43.6044921875, -42.17236328125, -40.740234375, -39.30810546875, -37.8759765625, -36.44384765625, -35.01171875, -33.57958984375, -32.1474609375, -30.71533203125, -29.283203125, -27.85107421875, -26.4189453125, -24.98681640625, -23.5546875, -22.12255859375, -20.6904296875, -19.25830078125, -17.826171875, -16.39404296875, -14.9619140625, -13.52978515625, -12.09765625, -10.66552734375, -9.2333984375, -7.80126953125, -6.369140625, -4.93701171875, -3.5048828125, -2.07275390625, -0.640625, 0.79150390625, 2.2236328125, 3.65576171875, 5.087890625, 6.52001953125, 7.9521484375, 9.38427734375, 10.81640625, 12.24853515625, 13.6806640625, 15.11279296875, 16.544921875, 17.97705078125, 19.4091796875, 20.84130859375, 22.2734375, 23.70556640625, 25.1376953125, 26.56982421875, 28.001953125, 29.43408203125, 30.8662109375, 32.29833984375, 33.73046875, 35.16259765625, 36.5947265625, 38.02685546875, 39.458984375, 40.89111328125, 42.3232421875, 43.75537109375, 45.1875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 11.0, 8.0, 9.0, 7.0, 16.0, 22.0, 24.0, 35.0, 53.0, 60.0, 64.0, 81.0, 86.0, 108.0, 107.0, 138.0, 113.0, 156.0, 155.0, 188.0, 223.0, 166.0, 198.0, 195.0, 191.0, 196.0, 157.0, 168.0, 149.0, 156.0, 117.0, 102.0, 92.0, 82.0, 79.0, 71.0, 48.0, 54.0, 44.0, 29.0, 23.0, 31.0, 10.0, 19.0, 14.0, 4.0, 3.0, 5.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0], "bins": [-25.15625, -24.398681640625, -23.64111328125, -22.883544921875, -22.1259765625, -21.368408203125, -20.61083984375, -19.853271484375, -19.095703125, -18.338134765625, -17.58056640625, -16.822998046875, -16.0654296875, -15.307861328125, -14.55029296875, -13.792724609375, -13.03515625, -12.277587890625, -11.52001953125, -10.762451171875, -10.0048828125, -9.247314453125, -8.48974609375, -7.732177734375, -6.974609375, -6.217041015625, -5.45947265625, -4.701904296875, -3.9443359375, -3.186767578125, -2.42919921875, -1.671630859375, -0.9140625, -0.156494140625, 0.60107421875, 1.358642578125, 2.1162109375, 2.873779296875, 3.63134765625, 4.388916015625, 5.146484375, 5.904052734375, 6.66162109375, 7.419189453125, 8.1767578125, 8.934326171875, 9.69189453125, 10.449462890625, 11.20703125, 11.964599609375, 12.72216796875, 13.479736328125, 14.2373046875, 14.994873046875, 15.75244140625, 16.510009765625, 17.267578125, 18.025146484375, 18.78271484375, 19.540283203125, 20.2978515625, 21.055419921875, 21.81298828125, 22.570556640625, 23.328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 10.0, 6.0, 11.0, 15.0, 12.0, 9.0, 16.0, 20.0, 22.0, 26.0, 24.0, 27.0, 36.0, 39.0, 28.0, 38.0, 37.0, 42.0, 45.0, 50.0, 44.0, 43.0, 35.0, 38.0, 26.0, 37.0, 27.0, 26.0, 26.0, 24.0, 27.0, 12.0, 24.0, 12.0, 16.0, 9.0, 11.0, 3.0, 8.0, 8.0, 7.0, 7.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.483909606933594, -53.61665725708008, -51.74940872192383, -49.88215637207031, -48.01490783691406, -46.14765548706055, -44.28040313720703, -42.41315460205078, -40.545902252197266, -38.67864990234375, -36.8114013671875, -34.944149017333984, -33.076900482177734, -31.20964813232422, -29.342397689819336, -27.475147247314453, -25.60789680480957, -23.740646362304688, -21.873395919799805, -20.006145477294922, -18.138893127441406, -16.271642684936523, -14.40439224243164, -12.537140846252441, -10.669890403747559, -8.802639961242676, -6.935388565063477, -5.068138122558594, -3.2008872032165527, -1.3336362838745117, 0.5336141586303711, 2.4008655548095703, 4.268115997314453, 6.135366916656494, 8.002617835998535, 9.869868278503418, 11.737119674682617, 13.6043701171875, 15.471620559692383, 17.338871002197266, 19.20612335205078, 21.073373794555664, 22.940624237060547, 24.807876586914062, 26.675127029418945, 28.542377471923828, 30.40962791442871, 32.276878356933594, 34.144126892089844, 36.01137924194336, 37.87862777709961, 39.745880126953125, 41.613128662109375, 43.48038101196289, 45.347633361816406, 47.214881896972656, 49.08213424682617, 50.94938659667969, 52.81663513183594, 54.68388748168945, 56.5511360168457, 58.41838836669922, 60.28563690185547, 62.152889251708984, 64.0201416015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [6.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 1.0, 9.0, 7.0, 11.0, 12.0, 11.0, 22.0, 25.0, 15.0, 27.0, 26.0, 21.0, 17.0, 24.0, 30.0, 36.0, 26.0, 37.0, 40.0, 31.0, 29.0, 40.0, 40.0, 31.0, 38.0, 45.0, 33.0, 36.0, 31.0, 29.0, 32.0, 20.0, 25.0, 19.0, 16.0, 15.0, 17.0, 12.0, 6.0, 7.0, 10.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-50.905338287353516, -49.10744857788086, -47.30955505371094, -45.51166534423828, -43.71377182006836, -41.9158821105957, -40.11798858642578, -38.320098876953125, -36.52220916748047, -34.72431945800781, -32.92642593383789, -31.128536224365234, -29.330642700195312, -27.532752990722656, -25.734861373901367, -23.936969757080078, -22.139076232910156, -20.341184616088867, -18.543292999267578, -16.745403289794922, -14.947510719299316, -13.149619102478027, -11.351728439331055, -9.553836822509766, -7.755945205688477, -5.9580535888671875, -4.160162448883057, -2.362271308898926, -0.5643796920776367, 1.2335119247436523, 3.031402587890625, 4.829294204711914, 6.627189636230469, 8.425081253051758, 10.222972869873047, 12.02086353302002, 13.818755149841309, 15.616646766662598, 17.41453742980957, 19.21242904663086, 21.01032066345215, 22.808212280273438, 24.606103897094727, 26.403995513916016, 28.201885223388672, 29.999778747558594, 31.79766845703125, 33.595558166503906, 35.39345169067383, 37.191341400146484, 38.989234924316406, 40.78712463378906, 42.585018157958984, 44.38290786743164, 46.18080139160156, 47.97869110107422, 49.776580810546875, 51.57447052001953, 53.37236404418945, 55.17025375366211, 56.96814727783203, 58.76603698730469, 60.563926696777344, 62.361820220947266, 64.15971374511719]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 10.0, 14.0, 19.0, 30.0, 41.0, 67.0, 99.0, 157.0, 214.0, 303.0, 477.0, 690.0, 1068.0, 1575.0, 2380.0, 3621.0, 5432.0, 7967.0, 11607.0, 17099.0, 24088.0, 34120.0, 46662.0, 59974.0, 75804.0, 90004.0, 99220.0, 102146.0, 97896.0, 87647.0, 72903.0, 57617.0, 43967.0, 31704.0, 22688.0, 15950.0, 10989.0, 7450.0, 4882.0, 3232.0, 2244.0, 1514.0, 974.0, 692.0, 415.0, 293.0, 213.0, 142.0, 65.0, 74.0, 33.0, 33.0, 15.0, 13.0, 10.0, 7.0, 4.0, 5.0, 0.0, 3.0, 3.0], "bins": [-9.015625, -8.7191162109375, -8.422607421875, -8.1260986328125, -7.82958984375, -7.5330810546875, -7.236572265625, -6.9400634765625, -6.6435546875, -6.3470458984375, -6.050537109375, -5.7540283203125, -5.45751953125, -5.1610107421875, -4.864501953125, -4.5679931640625, -4.271484375, -3.9749755859375, -3.678466796875, -3.3819580078125, -3.08544921875, -2.7889404296875, -2.492431640625, -2.1959228515625, -1.8994140625, -1.6029052734375, -1.306396484375, -1.0098876953125, -0.71337890625, -0.4168701171875, -0.120361328125, 0.1761474609375, 0.47265625, 0.7691650390625, 1.065673828125, 1.3621826171875, 1.65869140625, 1.9552001953125, 2.251708984375, 2.5482177734375, 2.8447265625, 3.1412353515625, 3.437744140625, 3.7342529296875, 4.03076171875, 4.3272705078125, 4.623779296875, 4.9202880859375, 5.216796875, 5.5133056640625, 5.809814453125, 6.1063232421875, 6.40283203125, 6.6993408203125, 6.995849609375, 7.2923583984375, 7.5888671875, 7.8853759765625, 8.181884765625, 8.4783935546875, 8.77490234375, 9.0714111328125, 9.367919921875, 9.6644287109375, 9.9609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 0.0, 9.0, 7.0, 12.0, 11.0, 13.0, 22.0, 24.0, 15.0, 28.0, 25.0, 20.0, 17.0, 25.0, 33.0, 33.0, 31.0, 32.0, 40.0, 31.0, 32.0, 42.0, 34.0, 31.0, 43.0, 42.0, 34.0, 33.0, 31.0, 29.0, 32.0, 23.0, 23.0, 19.0, 16.0, 19.0, 13.0, 12.0, 5.0, 9.0, 9.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.125, -49.3232421875, -47.521484375, -45.7197265625, -43.91796875, -42.1162109375, -40.314453125, -38.5126953125, -36.7109375, -34.9091796875, -33.107421875, -31.3056640625, -29.50390625, -27.7021484375, -25.900390625, -24.0986328125, -22.296875, -20.4951171875, -18.693359375, -16.8916015625, -15.08984375, -13.2880859375, -11.486328125, -9.6845703125, -7.8828125, -6.0810546875, -4.279296875, -2.4775390625, -0.67578125, 1.1259765625, 2.927734375, 4.7294921875, 6.53125, 8.3330078125, 10.134765625, 11.9365234375, 13.73828125, 15.5400390625, 17.341796875, 19.1435546875, 20.9453125, 22.7470703125, 24.548828125, 26.3505859375, 28.15234375, 29.9541015625, 31.755859375, 33.5576171875, 35.359375, 37.1611328125, 38.962890625, 40.7646484375, 42.56640625, 44.3681640625, 46.169921875, 47.9716796875, 49.7734375, 51.5751953125, 53.376953125, 55.1787109375, 56.98046875, 58.7822265625, 60.583984375, 62.3857421875, 64.1875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 3.0, 8.0, 5.0, 6.0, 8.0, 26.0, 22.0, 31.0, 72.0, 82.0, 149.0, 260.0, 422.0, 788.0, 1370.0, 2519.0, 4758.0, 8775.0, 17684.0, 38253.0, 832646.0, 89846.0, 24415.0, 12210.0, 6457.0, 3443.0, 1853.0, 1018.0, 597.0, 319.0, 189.0, 110.0, 85.0, 41.0, 32.0, 20.0, 9.0, 12.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.5, -41.07080078125, -39.6416015625, -38.21240234375, -36.783203125, -35.35400390625, -33.9248046875, -32.49560546875, -31.06640625, -29.63720703125, -28.2080078125, -26.77880859375, -25.349609375, -23.92041015625, -22.4912109375, -21.06201171875, -19.6328125, -18.20361328125, -16.7744140625, -15.34521484375, -13.916015625, -12.48681640625, -11.0576171875, -9.62841796875, -8.19921875, -6.77001953125, -5.3408203125, -3.91162109375, -2.482421875, -1.05322265625, 0.3759765625, 1.80517578125, 3.234375, 4.66357421875, 6.0927734375, 7.52197265625, 8.951171875, 10.38037109375, 11.8095703125, 13.23876953125, 14.66796875, 16.09716796875, 17.5263671875, 18.95556640625, 20.384765625, 21.81396484375, 23.2431640625, 24.67236328125, 26.1015625, 27.53076171875, 28.9599609375, 30.38916015625, 31.818359375, 33.24755859375, 34.6767578125, 36.10595703125, 37.53515625, 38.96435546875, 40.3935546875, 41.82275390625, 43.251953125, 44.68115234375, 46.1103515625, 47.53955078125, 48.96875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 11.0, 12.0, 9.0, 16.0, 14.0, 21.0, 28.0, 16.0, 19.0, 29.0, 35.0, 36.0, 40.0, 46.0, 36.0, 59.0, 46.0, 43.0, 31.0, 48.0, 47.0, 27.0, 26.0, 35.0, 38.0, 35.0, 23.0, 17.0, 19.0, 17.0, 13.0, 16.0, 13.0, 19.0, 10.0, 8.0, 9.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-44.75, -43.41455078125, -42.0791015625, -40.74365234375, -39.408203125, -38.07275390625, -36.7373046875, -35.40185546875, -34.06640625, -32.73095703125, -31.3955078125, -30.06005859375, -28.724609375, -27.38916015625, -26.0537109375, -24.71826171875, -23.3828125, -22.04736328125, -20.7119140625, -19.37646484375, -18.041015625, -16.70556640625, -15.3701171875, -14.03466796875, -12.69921875, -11.36376953125, -10.0283203125, -8.69287109375, -7.357421875, -6.02197265625, -4.6865234375, -3.35107421875, -2.015625, -0.68017578125, 0.6552734375, 1.99072265625, 3.326171875, 4.66162109375, 5.9970703125, 7.33251953125, 8.66796875, 10.00341796875, 11.3388671875, 12.67431640625, 14.009765625, 15.34521484375, 16.6806640625, 18.01611328125, 19.3515625, 20.68701171875, 22.0224609375, 23.35791015625, 24.693359375, 26.02880859375, 27.3642578125, 28.69970703125, 30.03515625, 31.37060546875, 32.7060546875, 34.04150390625, 35.376953125, 36.71240234375, 38.0478515625, 39.38330078125, 40.71875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 9.0, 8.0, 6.0, 10.0, 22.0, 17.0, 21.0, 37.0, 34.0, 41.0, 75.0, 93.0, 152.0, 218.0, 370.0, 568.0, 1047.0, 1792.0, 3351.0, 6776.0, 13705.0, 29719.0, 336975.0, 590908.0, 32016.0, 14821.0, 7268.0, 3591.0, 1941.0, 1134.0, 636.0, 348.0, 240.0, 189.0, 110.0, 78.0, 57.0, 37.0, 27.0, 21.0, 19.0, 17.0, 11.0, 13.0, 11.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.50390625, -3.39105224609375, -3.2781982421875, -3.16534423828125, -3.052490234375, -2.93963623046875, -2.8267822265625, -2.71392822265625, -2.60107421875, -2.48822021484375, -2.3753662109375, -2.26251220703125, -2.149658203125, -2.03680419921875, -1.9239501953125, -1.81109619140625, -1.6982421875, -1.58538818359375, -1.4725341796875, -1.35968017578125, -1.246826171875, -1.13397216796875, -1.0211181640625, -0.90826416015625, -0.79541015625, -0.68255615234375, -0.5697021484375, -0.45684814453125, -0.343994140625, -0.23114013671875, -0.1182861328125, -0.00543212890625, 0.107421875, 0.22027587890625, 0.3331298828125, 0.44598388671875, 0.558837890625, 0.67169189453125, 0.7845458984375, 0.89739990234375, 1.01025390625, 1.12310791015625, 1.2359619140625, 1.34881591796875, 1.461669921875, 1.57452392578125, 1.6873779296875, 1.80023193359375, 1.9130859375, 2.02593994140625, 2.1387939453125, 2.25164794921875, 2.364501953125, 2.47735595703125, 2.5902099609375, 2.70306396484375, 2.81591796875, 2.92877197265625, 3.0416259765625, 3.15447998046875, 3.267333984375, 3.38018798828125, 3.4930419921875, 3.60589599609375, 3.71875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 11.0, 7.0, 13.0, 12.0, 20.0, 26.0, 24.0, 28.0, 33.0, 48.0, 40.0, 50.0, 49.0, 61.0, 56.0, 64.0, 53.0, 52.0, 65.0, 41.0, 42.0, 29.0, 30.0, 20.0, 31.0, 23.0, 16.0, 6.0, 9.0, 9.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.733438491821289e-05, -9.372550994157791e-05, -9.011663496494293e-05, -8.650775998830795e-05, -8.289888501167297e-05, -7.9290010035038e-05, -7.568113505840302e-05, -7.207226008176804e-05, -6.846338510513306e-05, -6.485451012849808e-05, -6.12456351518631e-05, -5.763676017522812e-05, -5.402788519859314e-05, -5.041901022195816e-05, -4.681013524532318e-05, -4.32012602686882e-05, -3.959238529205322e-05, -3.5983510315418243e-05, -3.2374635338783264e-05, -2.8765760362148285e-05, -2.5156885385513306e-05, -2.1548010408878326e-05, -1.7939135432243347e-05, -1.4330260455608368e-05, -1.0721385478973389e-05, -7.1125105023384094e-06, -3.50363552570343e-06, 1.0523945093154907e-07, 3.7141144275665283e-06, 7.3229894042015076e-06, 1.0931864380836487e-05, 1.4540739357471466e-05, 1.8149614334106445e-05, 2.1758489310741425e-05, 2.5367364287376404e-05, 2.8976239264011383e-05, 3.258511424064636e-05, 3.619398921728134e-05, 3.980286419391632e-05, 4.34117391705513e-05, 4.702061414718628e-05, 5.062948912382126e-05, 5.423836410045624e-05, 5.784723907709122e-05, 6.14561140537262e-05, 6.506498903036118e-05, 6.867386400699615e-05, 7.228273898363113e-05, 7.589161396026611e-05, 7.950048893690109e-05, 8.310936391353607e-05, 8.671823889017105e-05, 9.032711386680603e-05, 9.393598884344101e-05, 9.754486382007599e-05, 0.00010115373879671097, 0.00010476261377334595, 0.00010837148874998093, 0.0001119803637266159, 0.00011558923870325089, 0.00011919811367988586, 0.00012280698865652084, 0.00012641586363315582, 0.0001300247386097908, 0.00013363361358642578]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 9.0, 8.0, 23.0, 26.0, 45.0, 84.0, 112.0, 188.0, 271.0, 469.0, 770.0, 1248.0, 2037.0, 3429.0, 5589.0, 9637.0, 15776.0, 26149.0, 42204.0, 65599.0, 96704.0, 132374.0, 155431.0, 147817.0, 117184.0, 83415.0, 54491.0, 34401.0, 21200.0, 12784.0, 7580.0, 4629.0, 2674.0, 1599.0, 955.0, 615.0, 400.0, 229.0, 120.0, 95.0, 68.0, 47.0, 26.0, 11.0, 12.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.900390625, -2.80914306640625, -2.7178955078125, -2.62664794921875, -2.535400390625, -2.44415283203125, -2.3529052734375, -2.26165771484375, -2.17041015625, -2.07916259765625, -1.9879150390625, -1.89666748046875, -1.805419921875, -1.71417236328125, -1.6229248046875, -1.53167724609375, -1.4404296875, -1.34918212890625, -1.2579345703125, -1.16668701171875, -1.075439453125, -0.98419189453125, -0.8929443359375, -0.80169677734375, -0.71044921875, -0.61920166015625, -0.5279541015625, -0.43670654296875, -0.345458984375, -0.25421142578125, -0.1629638671875, -0.07171630859375, 0.01953125, 0.11077880859375, 0.2020263671875, 0.29327392578125, 0.384521484375, 0.47576904296875, 0.5670166015625, 0.65826416015625, 0.74951171875, 0.84075927734375, 0.9320068359375, 1.02325439453125, 1.114501953125, 1.20574951171875, 1.2969970703125, 1.38824462890625, 1.4794921875, 1.57073974609375, 1.6619873046875, 1.75323486328125, 1.844482421875, 1.93572998046875, 2.0269775390625, 2.11822509765625, 2.20947265625, 2.30072021484375, 2.3919677734375, 2.48321533203125, 2.574462890625, 2.66571044921875, 2.7569580078125, 2.84820556640625, 2.939453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 3.0, 7.0, 20.0, 10.0, 22.0, 23.0, 21.0, 25.0, 28.0, 31.0, 28.0, 34.0, 36.0, 31.0, 38.0, 33.0, 32.0, 63.0, 50.0, 51.0, 42.0, 49.0, 31.0, 33.0, 41.0, 24.0, 28.0, 34.0, 21.0, 23.0, 17.0, 19.0, 11.0, 9.0, 7.0, 7.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2119140625, -1.1786270141601562, -1.1453399658203125, -1.1120529174804688, -1.078765869140625, -1.0454788208007812, -1.0121917724609375, -0.9789047241210938, -0.94561767578125, -0.9123306274414062, -0.8790435791015625, -0.8457565307617188, -0.812469482421875, -0.7791824340820312, -0.7458953857421875, -0.7126083374023438, -0.6793212890625, -0.6460342407226562, -0.6127471923828125, -0.5794601440429688, -0.546173095703125, -0.5128860473632812, -0.4795989990234375, -0.44631195068359375, -0.41302490234375, -0.37973785400390625, -0.3464508056640625, -0.31316375732421875, -0.279876708984375, -0.24658966064453125, -0.2133026123046875, -0.18001556396484375, -0.146728515625, -0.11344146728515625, -0.0801544189453125, -0.04686737060546875, -0.013580322265625, 0.01970672607421875, 0.0529937744140625, 0.08628082275390625, 0.11956787109375, 0.15285491943359375, 0.1861419677734375, 0.21942901611328125, 0.252716064453125, 0.28600311279296875, 0.3192901611328125, 0.35257720947265625, 0.3858642578125, 0.41915130615234375, 0.4524383544921875, 0.48572540283203125, 0.519012451171875, 0.5522994995117188, 0.5855865478515625, 0.6188735961914062, 0.65216064453125, 0.6854476928710938, 0.7187347412109375, 0.7520217895507812, 0.785308837890625, 0.8185958862304688, 0.8518829345703125, 0.8851699829101562, 0.91845703125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 6.0, 5.0, 7.0, 5.0, 6.0, 15.0, 12.0, 13.0, 9.0, 19.0, 16.0, 30.0, 23.0, 17.0, 34.0, 40.0, 31.0, 35.0, 37.0, 44.0, 44.0, 45.0, 43.0, 43.0, 34.0, 36.0, 37.0, 36.0, 30.0, 30.0, 32.0, 18.0, 26.0, 23.0, 13.0, 21.0, 19.0, 10.0, 8.0, 7.0, 10.0, 6.0, 9.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.912818908691406, -53.04204177856445, -51.1712646484375, -49.30048751831055, -47.429710388183594, -45.55893325805664, -43.68815612792969, -41.8173828125, -39.94660186767578, -38.07582473754883, -36.205047607421875, -34.33427047729492, -32.46349334716797, -30.592716217041016, -28.721940994262695, -26.851163864135742, -24.980388641357422, -23.10961151123047, -21.238834381103516, -19.368057250976562, -17.49728012084961, -15.626503944396973, -13.755727767944336, -11.884950637817383, -10.01417350769043, -8.143396377563477, -6.272619724273682, -4.401843070983887, -2.5310659408569336, -0.6602888107299805, 1.2104873657226562, 3.0812644958496094, 4.9520416259765625, 6.822818756103516, 8.693595886230469, 10.564372062683105, 12.435149192810059, 14.305926322937012, 16.17670249938965, 18.0474796295166, 19.918256759643555, 21.789033889770508, 23.65981101989746, 25.53058624267578, 27.401363372802734, 29.272140502929688, 31.14291763305664, 33.013694763183594, 34.88447189331055, 36.7552490234375, 38.62602615356445, 40.496803283691406, 42.36758041381836, 44.23835754394531, 46.109130859375, 47.97991180419922, 49.850685119628906, 51.72146224975586, 53.59223937988281, 55.463016510009766, 57.33379364013672, 59.20457077026367, 61.075347900390625, 62.94612121582031, 64.81690216064453]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 3.0, 6.0, 5.0, 4.0, 6.0, 9.0, 12.0, 9.0, 16.0, 24.0, 20.0, 20.0, 25.0, 23.0, 22.0, 24.0, 23.0, 33.0, 31.0, 35.0, 36.0, 37.0, 24.0, 37.0, 41.0, 35.0, 34.0, 34.0, 47.0, 34.0, 31.0, 33.0, 30.0, 30.0, 21.0, 22.0, 21.0, 15.0, 17.0, 18.0, 7.0, 3.0, 12.0, 9.0, 10.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.96181106567383, -49.15064239501953, -47.33946990966797, -45.52830123901367, -43.717132568359375, -41.90596008300781, -40.094791412353516, -38.28362274169922, -36.472450256347656, -34.66128158569336, -32.8501091003418, -31.0389404296875, -29.22776985168457, -27.41659927368164, -25.605430603027344, -23.794260025024414, -21.983089447021484, -20.171918869018555, -18.360748291015625, -16.549579620361328, -14.738409042358398, -12.927238464355469, -11.116068840026855, -9.304899215698242, -7.4937286376953125, -5.682558536529541, -3.8713884353637695, -2.060218334197998, -0.24904823303222656, 1.5621223449707031, 3.3732919692993164, 5.18446159362793, 6.995635986328125, 8.806806564331055, 10.617976188659668, 12.429145812988281, 14.240316390991211, 16.05148696899414, 17.862655639648438, 19.673826217651367, 21.484996795654297, 23.296167373657227, 25.107337951660156, 26.918506622314453, 28.729677200317383, 30.540847778320312, 32.35201644897461, 34.163185119628906, 35.97435760498047, 37.785526275634766, 39.59669876098633, 41.407867431640625, 43.21903991699219, 45.030208587646484, 46.84137725830078, 48.652549743652344, 50.46371841430664, 52.27488708496094, 54.0860595703125, 55.8972282409668, 57.708396911621094, 59.519569396972656, 61.33073806762695, 63.14190673828125, 64.95307922363281]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 12.0, 25.0, 40.0, 71.0, 89.0, 168.0, 263.0, 448.0, 739.0, 1193.0, 1930.0, 3152.0, 4795.0, 7269.0, 10550.0, 15717.0, 22293.0, 30518.0, 40658.0, 52069.0, 63835.0, 75542.0, 83509.0, 89533.0, 90778.0, 86503.0, 79057.0, 68847.0, 57659.0, 45140.0, 35299.0, 25929.0, 18239.0, 12830.0, 8514.0, 5449.0, 3705.0, 2335.0, 1444.0, 958.0, 547.0, 369.0, 197.0, 126.0, 94.0, 55.0, 23.0, 13.0, 12.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-37.25, -36.09375, -34.9375, -33.78125, -32.625, -31.46875, -30.3125, -29.15625, -28.0, -26.84375, -25.6875, -24.53125, -23.375, -22.21875, -21.0625, -19.90625, -18.75, -17.59375, -16.4375, -15.28125, -14.125, -12.96875, -11.8125, -10.65625, -9.5, -8.34375, -7.1875, -6.03125, -4.875, -3.71875, -2.5625, -1.40625, -0.25, 0.90625, 2.0625, 3.21875, 4.375, 5.53125, 6.6875, 7.84375, 9.0, 10.15625, 11.3125, 12.46875, 13.625, 14.78125, 15.9375, 17.09375, 18.25, 19.40625, 20.5625, 21.71875, 22.875, 24.03125, 25.1875, 26.34375, 27.5, 28.65625, 29.8125, 30.96875, 32.125, 33.28125, 34.4375, 35.59375, 36.75]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 7.0, 9.0, 9.0, 12.0, 11.0, 25.0, 22.0, 17.0, 28.0, 21.0, 24.0, 22.0, 26.0, 33.0, 28.0, 30.0, 39.0, 37.0, 30.0, 28.0, 42.0, 36.0, 30.0, 41.0, 43.0, 37.0, 30.0, 34.0, 34.0, 25.0, 24.0, 20.0, 22.0, 17.0, 17.0, 17.0, 8.0, 5.0, 11.0, 6.0, 8.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-49.65625, -47.90234375, -46.1484375, -44.39453125, -42.640625, -40.88671875, -39.1328125, -37.37890625, -35.625, -33.87109375, -32.1171875, -30.36328125, -28.609375, -26.85546875, -25.1015625, -23.34765625, -21.59375, -19.83984375, -18.0859375, -16.33203125, -14.578125, -12.82421875, -11.0703125, -9.31640625, -7.5625, -5.80859375, -4.0546875, -2.30078125, -0.546875, 1.20703125, 2.9609375, 4.71484375, 6.46875, 8.22265625, 9.9765625, 11.73046875, 13.484375, 15.23828125, 16.9921875, 18.74609375, 20.5, 22.25390625, 24.0078125, 25.76171875, 27.515625, 29.26953125, 31.0234375, 32.77734375, 34.53125, 36.28515625, 38.0390625, 39.79296875, 41.546875, 43.30078125, 45.0546875, 46.80859375, 48.5625, 50.31640625, 52.0703125, 53.82421875, 55.578125, 57.33203125, 59.0859375, 60.83984375, 62.59375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 8.0, 9.0, 23.0, 32.0, 43.0, 72.0, 117.0, 166.0, 246.0, 432.0, 628.0, 1004.0, 1526.0, 2285.0, 3433.0, 4993.0, 7187.0, 10428.0, 14558.0, 20210.0, 26655.0, 34445.0, 44101.0, 53701.0, 63620.0, 72353.0, 78222.0, 81872.0, 82336.0, 78863.0, 72505.0, 64138.0, 54054.0, 44333.0, 34699.0, 27237.0, 20022.0, 14824.0, 10568.0, 7432.0, 5169.0, 3269.0, 2332.0, 1549.0, 1013.0, 649.0, 422.0, 287.0, 181.0, 121.0, 68.0, 51.0, 24.0, 27.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0], "bins": [-31.125, -30.12158203125, -29.1181640625, -28.11474609375, -27.111328125, -26.10791015625, -25.1044921875, -24.10107421875, -23.09765625, -22.09423828125, -21.0908203125, -20.08740234375, -19.083984375, -18.08056640625, -17.0771484375, -16.07373046875, -15.0703125, -14.06689453125, -13.0634765625, -12.06005859375, -11.056640625, -10.05322265625, -9.0498046875, -8.04638671875, -7.04296875, -6.03955078125, -5.0361328125, -4.03271484375, -3.029296875, -2.02587890625, -1.0224609375, -0.01904296875, 0.984375, 1.98779296875, 2.9912109375, 3.99462890625, 4.998046875, 6.00146484375, 7.0048828125, 8.00830078125, 9.01171875, 10.01513671875, 11.0185546875, 12.02197265625, 13.025390625, 14.02880859375, 15.0322265625, 16.03564453125, 17.0390625, 18.04248046875, 19.0458984375, 20.04931640625, 21.052734375, 22.05615234375, 23.0595703125, 24.06298828125, 25.06640625, 26.06982421875, 27.0732421875, 28.07666015625, 29.080078125, 30.08349609375, 31.0869140625, 32.09033203125, 33.09375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 9.0, 8.0, 6.0, 9.0, 3.0, 12.0, 12.0, 10.0, 15.0, 18.0, 24.0, 31.0, 36.0, 22.0, 36.0, 25.0, 46.0, 36.0, 24.0, 31.0, 49.0, 41.0, 45.0, 46.0, 35.0, 35.0, 42.0, 37.0, 35.0, 32.0, 41.0, 22.0, 18.0, 14.0, 13.0, 18.0, 16.0, 9.0, 6.0, 8.0, 6.0, 9.0, 7.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.5625, -39.32861328125, -38.0947265625, -36.86083984375, -35.626953125, -34.39306640625, -33.1591796875, -31.92529296875, -30.69140625, -29.45751953125, -28.2236328125, -26.98974609375, -25.755859375, -24.52197265625, -23.2880859375, -22.05419921875, -20.8203125, -19.58642578125, -18.3525390625, -17.11865234375, -15.884765625, -14.65087890625, -13.4169921875, -12.18310546875, -10.94921875, -9.71533203125, -8.4814453125, -7.24755859375, -6.013671875, -4.77978515625, -3.5458984375, -2.31201171875, -1.078125, 0.15576171875, 1.3896484375, 2.62353515625, 3.857421875, 5.09130859375, 6.3251953125, 7.55908203125, 8.79296875, 10.02685546875, 11.2607421875, 12.49462890625, 13.728515625, 14.96240234375, 16.1962890625, 17.43017578125, 18.6640625, 19.89794921875, 21.1318359375, 22.36572265625, 23.599609375, 24.83349609375, 26.0673828125, 27.30126953125, 28.53515625, 29.76904296875, 31.0029296875, 32.23681640625, 33.470703125, 34.70458984375, 35.9384765625, 37.17236328125, 38.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 12.0, 22.0, 21.0, 44.0, 89.0, 129.0, 197.0, 319.0, 462.0, 800.0, 1206.0, 1957.0, 2969.0, 4681.0, 7477.0, 11325.0, 16883.0, 25114.0, 35107.0, 47775.0, 62118.0, 76535.0, 88967.0, 97963.0, 100552.0, 96898.0, 87565.0, 74443.0, 59414.0, 45460.0, 33374.0, 23403.0, 15913.0, 10544.0, 6800.0, 4335.0, 2758.0, 1802.0, 1187.0, 685.0, 398.0, 289.0, 202.0, 126.0, 79.0, 50.0, 39.0, 27.0, 16.0, 11.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.546875, -15.052001953125, -14.55712890625, -14.062255859375, -13.5673828125, -13.072509765625, -12.57763671875, -12.082763671875, -11.587890625, -11.093017578125, -10.59814453125, -10.103271484375, -9.6083984375, -9.113525390625, -8.61865234375, -8.123779296875, -7.62890625, -7.134033203125, -6.63916015625, -6.144287109375, -5.6494140625, -5.154541015625, -4.65966796875, -4.164794921875, -3.669921875, -3.175048828125, -2.68017578125, -2.185302734375, -1.6904296875, -1.195556640625, -0.70068359375, -0.205810546875, 0.2890625, 0.783935546875, 1.27880859375, 1.773681640625, 2.2685546875, 2.763427734375, 3.25830078125, 3.753173828125, 4.248046875, 4.742919921875, 5.23779296875, 5.732666015625, 6.2275390625, 6.722412109375, 7.21728515625, 7.712158203125, 8.20703125, 8.701904296875, 9.19677734375, 9.691650390625, 10.1865234375, 10.681396484375, 11.17626953125, 11.671142578125, 12.166015625, 12.660888671875, 13.15576171875, 13.650634765625, 14.1455078125, 14.640380859375, 15.13525390625, 15.630126953125, 16.125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 10.0, 3.0, 7.0, 3.0, 13.0, 10.0, 11.0, 10.0, 22.0, 21.0, 22.0, 26.0, 33.0, 33.0, 37.0, 44.0, 37.0, 34.0, 44.0, 37.0, 39.0, 49.0, 38.0, 42.0, 50.0, 39.0, 45.0, 28.0, 34.0, 28.0, 23.0, 22.0, 23.0, 13.0, 6.0, 14.0, 16.0, 11.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0020885467529296875, -0.002025127410888672, -0.0019617080688476562, -0.0018982887268066406, -0.001834869384765625, -0.0017714500427246094, -0.0017080307006835938, -0.0016446113586425781, -0.0015811920166015625, -0.0015177726745605469, -0.0014543533325195312, -0.0013909339904785156, -0.0013275146484375, -0.0012640953063964844, -0.0012006759643554688, -0.0011372566223144531, -0.0010738372802734375, -0.0010104179382324219, -0.0009469985961914062, -0.0008835792541503906, -0.000820159912109375, -0.0007567405700683594, -0.0006933212280273438, -0.0006299018859863281, -0.0005664825439453125, -0.0005030632019042969, -0.00043964385986328125, -0.0003762245178222656, -0.00031280517578125, -0.0002493858337402344, -0.00018596649169921875, -0.00012254714965820312, -5.91278076171875e-05, 4.291534423828125e-06, 6.771087646484375e-05, 0.00013113021850585938, 0.000194549560546875, 0.0002579689025878906, 0.00032138824462890625, 0.0003848075866699219, 0.0004482269287109375, 0.0005116462707519531, 0.0005750656127929688, 0.0006384849548339844, 0.000701904296875, 0.0007653236389160156, 0.0008287429809570312, 0.0008921623229980469, 0.0009555816650390625, 0.0010190010070800781, 0.0010824203491210938, 0.0011458396911621094, 0.001209259033203125, 0.0012726783752441406, 0.0013360977172851562, 0.0013995170593261719, 0.0014629364013671875, 0.0015263557434082031, 0.0015897750854492188, 0.0016531944274902344, 0.00171661376953125, 0.0017800331115722656, 0.0018434524536132812, 0.0019068717956542969, 0.0019702911376953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 8.0, 25.0, 43.0, 58.0, 84.0, 156.0, 269.0, 397.0, 692.0, 1048.0, 1642.0, 2656.0, 4294.0, 6642.0, 10369.0, 15784.0, 23907.0, 35077.0, 48876.0, 65059.0, 81997.0, 97103.0, 106551.0, 108292.0, 101046.0, 88325.0, 72140.0, 55019.0, 40034.0, 28203.0, 18901.0, 12270.0, 8023.0, 5202.0, 3163.0, 1971.0, 1233.0, 734.0, 496.0, 306.0, 168.0, 94.0, 76.0, 46.0, 30.0, 19.0, 8.0, 3.0, 8.0, 2.0, 1.0, 0.0, 2.0], "bins": [-20.65625, -20.05224609375, -19.4482421875, -18.84423828125, -18.240234375, -17.63623046875, -17.0322265625, -16.42822265625, -15.82421875, -15.22021484375, -14.6162109375, -14.01220703125, -13.408203125, -12.80419921875, -12.2001953125, -11.59619140625, -10.9921875, -10.38818359375, -9.7841796875, -9.18017578125, -8.576171875, -7.97216796875, -7.3681640625, -6.76416015625, -6.16015625, -5.55615234375, -4.9521484375, -4.34814453125, -3.744140625, -3.14013671875, -2.5361328125, -1.93212890625, -1.328125, -0.72412109375, -0.1201171875, 0.48388671875, 1.087890625, 1.69189453125, 2.2958984375, 2.89990234375, 3.50390625, 4.10791015625, 4.7119140625, 5.31591796875, 5.919921875, 6.52392578125, 7.1279296875, 7.73193359375, 8.3359375, 8.93994140625, 9.5439453125, 10.14794921875, 10.751953125, 11.35595703125, 11.9599609375, 12.56396484375, 13.16796875, 13.77197265625, 14.3759765625, 14.97998046875, 15.583984375, 16.18798828125, 16.7919921875, 17.39599609375, 18.0]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 8.0, 2.0, 6.0, 12.0, 7.0, 10.0, 14.0, 12.0, 22.0, 16.0, 31.0, 27.0, 18.0, 20.0, 36.0, 29.0, 37.0, 37.0, 40.0, 50.0, 47.0, 51.0, 40.0, 27.0, 39.0, 47.0, 42.0, 34.0, 37.0, 28.0, 22.0, 23.0, 20.0, 22.0, 14.0, 19.0, 15.0, 9.0, 8.0, 6.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.8671875, -7.6195068359375, -7.371826171875, -7.1241455078125, -6.87646484375, -6.6287841796875, -6.381103515625, -6.1334228515625, -5.8857421875, -5.6380615234375, -5.390380859375, -5.1427001953125, -4.89501953125, -4.6473388671875, -4.399658203125, -4.1519775390625, -3.904296875, -3.6566162109375, -3.408935546875, -3.1612548828125, -2.91357421875, -2.6658935546875, -2.418212890625, -2.1705322265625, -1.9228515625, -1.6751708984375, -1.427490234375, -1.1798095703125, -0.93212890625, -0.6844482421875, -0.436767578125, -0.1890869140625, 0.05859375, 0.3062744140625, 0.553955078125, 0.8016357421875, 1.04931640625, 1.2969970703125, 1.544677734375, 1.7923583984375, 2.0400390625, 2.2877197265625, 2.535400390625, 2.7830810546875, 3.03076171875, 3.2784423828125, 3.526123046875, 3.7738037109375, 4.021484375, 4.2691650390625, 4.516845703125, 4.7645263671875, 5.01220703125, 5.2598876953125, 5.507568359375, 5.7552490234375, 6.0029296875, 6.2506103515625, 6.498291015625, 6.7459716796875, 6.99365234375, 7.2413330078125, 7.489013671875, 7.7366943359375, 7.984375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 5.0, 14.0, 6.0, 11.0, 12.0, 16.0, 22.0, 12.0, 18.0, 24.0, 31.0, 25.0, 27.0, 35.0, 38.0, 30.0, 49.0, 42.0, 43.0, 53.0, 47.0, 35.0, 35.0, 42.0, 31.0, 33.0, 30.0, 27.0, 24.0, 29.0, 27.0, 22.0, 15.0, 14.0, 19.0, 3.0, 13.0, 8.0, 4.0, 8.0, 6.0, 7.0, 3.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.916141510009766, -59.020442962646484, -57.12474060058594, -55.229042053222656, -53.333343505859375, -51.437644958496094, -49.54194259643555, -47.646244049072266, -45.75054168701172, -43.85484313964844, -41.95914077758789, -40.06344223022461, -38.16774368286133, -36.27204132080078, -34.3763427734375, -32.48064422607422, -30.584945678710938, -28.689245223999023, -26.793546676635742, -24.897846221923828, -23.002147674560547, -21.106447219848633, -19.21074676513672, -17.315048217773438, -15.419347763061523, -13.523648262023926, -11.627948760986328, -9.732248306274414, -7.836548805236816, -5.940849304199219, -4.045148849487305, -2.149449348449707, -0.25374603271484375, 1.641953706741333, 3.5376534461975098, 5.433353424072266, 7.329052925109863, 9.224752426147461, 11.120452880859375, 13.016152381896973, 14.91185188293457, 16.807552337646484, 18.703250885009766, 20.59895133972168, 22.494651794433594, 24.390350341796875, 26.28605079650879, 28.181751251220703, 30.077449798583984, 31.9731502532959, 33.86885070800781, 35.764549255371094, 37.660247802734375, 39.555946350097656, 41.4516487121582, 43.347347259521484, 45.24304962158203, 47.13874816894531, 49.03445053100586, 50.93014907836914, 52.82584762573242, 54.72154998779297, 56.61724853515625, 58.51294708251953, 60.40864562988281]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 9.0, 2.0, 5.0, 3.0, 7.0, 15.0, 10.0, 12.0, 18.0, 23.0, 21.0, 24.0, 28.0, 22.0, 29.0, 29.0, 27.0, 27.0, 30.0, 32.0, 36.0, 40.0, 45.0, 29.0, 32.0, 40.0, 28.0, 33.0, 42.0, 30.0, 38.0, 21.0, 27.0, 31.0, 29.0, 20.0, 24.0, 12.0, 14.0, 10.0, 6.0, 10.0, 6.0, 7.0, 7.0, 9.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.048343658447266, -52.148345947265625, -50.24835205078125, -48.34835433959961, -46.44835662841797, -44.548362731933594, -42.64836502075195, -40.74836730957031, -38.84837341308594, -36.9483757019043, -35.04838180541992, -33.14838409423828, -31.248388290405273, -29.348392486572266, -27.448394775390625, -25.548398971557617, -23.64840316772461, -21.7484073638916, -19.848411560058594, -17.948413848876953, -16.048418045043945, -14.148422241210938, -12.248425483703613, -10.348428726196289, -8.448432922363281, -6.548436641693115, -4.648440361022949, -2.748444080352783, -0.8484477996826172, 1.0515480041503906, 2.951544761657715, 4.851541519165039, 6.751533508300781, 8.651529312133789, 10.551526069641113, 12.451522827148438, 14.351518630981445, 16.251514434814453, 18.151512145996094, 20.0515079498291, 21.95150375366211, 23.851499557495117, 25.751495361328125, 27.651493072509766, 29.551488876342773, 31.45148468017578, 33.35148239135742, 35.25148010253906, 37.15147399902344, 39.05147171020508, 40.95146560668945, 42.851463317871094, 44.75145721435547, 46.65145492553711, 48.55145263671875, 50.451446533203125, 52.351444244384766, 54.251441955566406, 56.15143585205078, 58.05143356323242, 59.95143127441406, 61.85142517089844, 63.75142288208008, 65.65142059326172, 67.5514144897461]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [4.0, 5.0, 4.0, 9.0, 17.0, 24.0, 33.0, 73.0, 118.0, 201.0, 353.0, 614.0, 970.0, 1711.0, 2653.0, 4267.0, 6951.0, 11057.0, 16992.0, 26008.0, 39481.0, 58360.0, 84901.0, 118129.0, 160822.0, 211544.0, 263590.0, 316971.0, 357499.0, 382161.0, 383733.0, 363903.0, 323348.0, 272912.0, 218901.0, 168699.0, 125246.0, 89028.0, 62778.0, 42033.0, 28081.0, 18458.0, 11850.0, 7437.0, 4745.0, 2932.0, 1778.0, 1114.0, 719.0, 422.0, 261.0, 147.0, 103.0, 62.0, 35.0, 25.0, 14.0, 5.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.75, -37.4619140625, -36.173828125, -34.8857421875, -33.59765625, -32.3095703125, -31.021484375, -29.7333984375, -28.4453125, -27.1572265625, -25.869140625, -24.5810546875, -23.29296875, -22.0048828125, -20.716796875, -19.4287109375, -18.140625, -16.8525390625, -15.564453125, -14.2763671875, -12.98828125, -11.7001953125, -10.412109375, -9.1240234375, -7.8359375, -6.5478515625, -5.259765625, -3.9716796875, -2.68359375, -1.3955078125, -0.107421875, 1.1806640625, 2.46875, 3.7568359375, 5.044921875, 6.3330078125, 7.62109375, 8.9091796875, 10.197265625, 11.4853515625, 12.7734375, 14.0615234375, 15.349609375, 16.6376953125, 17.92578125, 19.2138671875, 20.501953125, 21.7900390625, 23.078125, 24.3662109375, 25.654296875, 26.9423828125, 28.23046875, 29.5185546875, 30.806640625, 32.0947265625, 33.3828125, 34.6708984375, 35.958984375, 37.2470703125, 38.53515625, 39.8232421875, 41.111328125, 42.3994140625, 43.6875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 3.0, 9.0, 15.0, 9.0, 18.0, 17.0, 24.0, 20.0, 31.0, 25.0, 21.0, 30.0, 36.0, 24.0, 25.0, 34.0, 39.0, 32.0, 41.0, 42.0, 32.0, 40.0, 29.0, 31.0, 45.0, 29.0, 34.0, 33.0, 24.0, 25.0, 37.0, 19.0, 26.0, 11.0, 15.0, 11.0, 7.0, 9.0, 7.0, 8.0, 6.0, 6.0, 6.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.46875, -46.72705078125, -44.9853515625, -43.24365234375, -41.501953125, -39.76025390625, -38.0185546875, -36.27685546875, -34.53515625, -32.79345703125, -31.0517578125, -29.31005859375, -27.568359375, -25.82666015625, -24.0849609375, -22.34326171875, -20.6015625, -18.85986328125, -17.1181640625, -15.37646484375, -13.634765625, -11.89306640625, -10.1513671875, -8.40966796875, -6.66796875, -4.92626953125, -3.1845703125, -1.44287109375, 0.298828125, 2.04052734375, 3.7822265625, 5.52392578125, 7.265625, 9.00732421875, 10.7490234375, 12.49072265625, 14.232421875, 15.97412109375, 17.7158203125, 19.45751953125, 21.19921875, 22.94091796875, 24.6826171875, 26.42431640625, 28.166015625, 29.90771484375, 31.6494140625, 33.39111328125, 35.1328125, 36.87451171875, 38.6162109375, 40.35791015625, 42.099609375, 43.84130859375, 45.5830078125, 47.32470703125, 49.06640625, 50.80810546875, 52.5498046875, 54.29150390625, 56.033203125, 57.77490234375, 59.5166015625, 61.25830078125, 63.0]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 8.0, 11.0, 28.0, 46.0, 84.0, 148.0, 252.0, 369.0, 622.0, 1061.0, 1709.0, 2756.0, 4360.0, 6850.0, 10948.0, 16603.0, 24801.0, 37314.0, 53669.0, 75767.0, 104097.0, 139289.0, 179036.0, 222311.0, 265658.0, 303367.0, 332588.0, 347208.0, 345121.0, 327577.0, 297288.0, 258002.0, 214419.0, 171073.0, 131602.0, 97494.0, 70836.0, 50413.0, 34444.0, 22847.0, 15467.0, 9894.0, 6457.0, 3948.0, 2520.0, 1557.0, 961.0, 572.0, 360.0, 192.0, 128.0, 70.0, 42.0, 27.0, 7.0, 10.0, 2.0, 1.0, 1.0, 1.0], "bins": [-40.8125, -39.533203125, -38.25390625, -36.974609375, -35.6953125, -34.416015625, -33.13671875, -31.857421875, -30.578125, -29.298828125, -28.01953125, -26.740234375, -25.4609375, -24.181640625, -22.90234375, -21.623046875, -20.34375, -19.064453125, -17.78515625, -16.505859375, -15.2265625, -13.947265625, -12.66796875, -11.388671875, -10.109375, -8.830078125, -7.55078125, -6.271484375, -4.9921875, -3.712890625, -2.43359375, -1.154296875, 0.125, 1.404296875, 2.68359375, 3.962890625, 5.2421875, 6.521484375, 7.80078125, 9.080078125, 10.359375, 11.638671875, 12.91796875, 14.197265625, 15.4765625, 16.755859375, 18.03515625, 19.314453125, 20.59375, 21.873046875, 23.15234375, 24.431640625, 25.7109375, 26.990234375, 28.26953125, 29.548828125, 30.828125, 32.107421875, 33.38671875, 34.666015625, 35.9453125, 37.224609375, 38.50390625, 39.783203125, 41.0625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 12.0, 12.0, 11.0, 17.0, 26.0, 23.0, 33.0, 56.0, 48.0, 74.0, 77.0, 85.0, 110.0, 113.0, 125.0, 146.0, 139.0, 153.0, 152.0, 186.0, 182.0, 193.0, 180.0, 176.0, 162.0, 164.0, 178.0, 152.0, 133.0, 129.0, 115.0, 114.0, 96.0, 74.0, 82.0, 59.0, 44.0, 53.0, 41.0, 32.0, 35.0, 16.0, 15.0, 7.0, 7.0, 13.0, 7.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-24.59375, -23.836669921875, -23.07958984375, -22.322509765625, -21.5654296875, -20.808349609375, -20.05126953125, -19.294189453125, -18.537109375, -17.780029296875, -17.02294921875, -16.265869140625, -15.5087890625, -14.751708984375, -13.99462890625, -13.237548828125, -12.48046875, -11.723388671875, -10.96630859375, -10.209228515625, -9.4521484375, -8.695068359375, -7.93798828125, -7.180908203125, -6.423828125, -5.666748046875, -4.90966796875, -4.152587890625, -3.3955078125, -2.638427734375, -1.88134765625, -1.124267578125, -0.3671875, 0.389892578125, 1.14697265625, 1.904052734375, 2.6611328125, 3.418212890625, 4.17529296875, 4.932373046875, 5.689453125, 6.446533203125, 7.20361328125, 7.960693359375, 8.7177734375, 9.474853515625, 10.23193359375, 10.989013671875, 11.74609375, 12.503173828125, 13.26025390625, 14.017333984375, 14.7744140625, 15.531494140625, 16.28857421875, 17.045654296875, 17.802734375, 18.559814453125, 19.31689453125, 20.073974609375, 20.8310546875, 21.588134765625, 22.34521484375, 23.102294921875, 23.859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 10.0, 7.0, 8.0, 17.0, 14.0, 16.0, 22.0, 21.0, 22.0, 31.0, 30.0, 36.0, 30.0, 30.0, 43.0, 43.0, 56.0, 48.0, 45.0, 35.0, 27.0, 38.0, 40.0, 32.0, 27.0, 37.0, 28.0, 23.0, 22.0, 25.0, 20.0, 14.0, 8.0, 10.0, 14.0, 12.0, 8.0, 12.0, 5.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.678443908691406, -55.83201599121094, -53.98558807373047, -52.13916015625, -50.29273223876953, -48.44630432128906, -46.599876403808594, -44.753448486328125, -42.907020568847656, -41.06059265136719, -39.21416473388672, -37.36773681640625, -35.52130889892578, -33.67488098144531, -31.828453063964844, -29.982025146484375, -28.135595321655273, -26.289167404174805, -24.442739486694336, -22.596311569213867, -20.7498836517334, -18.903453826904297, -17.057025909423828, -15.210598945617676, -13.364171028137207, -11.517743110656738, -9.67131519317627, -7.824886798858643, -5.978458881378174, -4.132030487060547, -2.285602569580078, -0.4391746520996094, 1.4072532653808594, 3.253681182861328, 5.100109100341797, 6.946537494659424, 8.792964935302734, 10.63939380645752, 12.485821723937988, 14.332249641418457, 16.17867660522461, 18.025104522705078, 19.871532440185547, 21.717960357666016, 23.564388275146484, 25.410816192626953, 27.257244110107422, 29.10367202758789, 30.950101852416992, 32.796531677246094, 34.64295959472656, 36.48938751220703, 38.3358154296875, 40.18224334716797, 42.02867126464844, 43.875099182128906, 45.721527099609375, 47.567955017089844, 49.41438293457031, 51.26081085205078, 53.10723876953125, 54.95366668701172, 56.80009460449219, 58.646522521972656, 60.492950439453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 8.0, 4.0, 13.0, 10.0, 13.0, 7.0, 16.0, 20.0, 13.0, 23.0, 22.0, 20.0, 22.0, 25.0, 24.0, 32.0, 26.0, 41.0, 35.0, 42.0, 32.0, 35.0, 41.0, 38.0, 43.0, 42.0, 32.0, 25.0, 32.0, 29.0, 20.0, 26.0, 23.0, 27.0, 21.0, 17.0, 11.0, 10.0, 13.0, 10.0, 11.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-55.211090087890625, -53.36396789550781, -51.516849517822266, -49.66972732543945, -47.822608947753906, -45.975486755371094, -44.12836456298828, -42.281246185302734, -40.43412780761719, -38.587005615234375, -36.73988723754883, -34.892765045166016, -33.04564666748047, -31.198524475097656, -29.351404190063477, -27.504283905029297, -25.657161712646484, -23.810041427612305, -21.962921142578125, -20.115798950195312, -18.268680572509766, -16.421558380126953, -14.574438095092773, -12.727317810058594, -10.880197525024414, -9.033077239990234, -7.1859564781188965, -5.338835716247559, -3.491715431213379, -1.6445951461791992, 0.20252609252929688, 2.0496463775634766, 3.8967628479003906, 5.74388313293457, 7.591003894805908, 9.438124656677246, 11.285244941711426, 13.132365226745605, 14.979486465454102, 16.82660675048828, 18.67372703552246, 20.52084732055664, 22.36796760559082, 24.215087890625, 26.062210083007812, 27.90932846069336, 29.756450653076172, 31.60357093811035, 33.45069122314453, 35.297813415527344, 37.14493179321289, 38.9920539855957, 40.83917236328125, 42.68629455566406, 44.533416748046875, 46.38053512573242, 48.22765350341797, 50.07477569580078, 51.92189407348633, 53.76901626586914, 55.61613464355469, 57.4632568359375, 59.31037902832031, 61.15749740600586, 63.00461959838867]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 8.0, 21.0, 26.0, 34.0, 57.0, 84.0, 158.0, 224.0, 367.0, 575.0, 908.0, 1398.0, 2225.0, 3475.0, 5626.0, 8444.0, 13188.0, 19503.0, 29327.0, 42111.0, 58614.0, 76939.0, 95321.0, 108730.0, 113762.0, 110012.0, 95378.0, 76982.0, 58046.0, 41855.0, 29095.0, 19587.0, 12955.0, 8494.0, 5497.0, 3491.0, 2183.0, 1426.0, 886.0, 530.0, 321.0, 246.0, 171.0, 97.0, 61.0, 42.0, 25.0, 18.0, 7.0, 12.0, 5.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.41015625, -8.125, -7.83984375, -7.5546875, -7.26953125, -6.984375, -6.69921875, -6.4140625, -6.12890625, -5.84375, -5.55859375, -5.2734375, -4.98828125, -4.703125, -4.41796875, -4.1328125, -3.84765625, -3.5625, -3.27734375, -2.9921875, -2.70703125, -2.421875, -2.13671875, -1.8515625, -1.56640625, -1.28125, -0.99609375, -0.7109375, -0.42578125, -0.140625, 0.14453125, 0.4296875, 0.71484375, 1.0, 1.28515625, 1.5703125, 1.85546875, 2.140625, 2.42578125, 2.7109375, 2.99609375, 3.28125, 3.56640625, 3.8515625, 4.13671875, 4.421875, 4.70703125, 4.9921875, 5.27734375, 5.5625, 5.84765625, 6.1328125, 6.41796875, 6.703125, 6.98828125, 7.2734375, 7.55859375, 7.84375, 8.12890625, 8.4140625, 8.69921875, 8.984375, 9.26953125, 9.5546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 4.0, 13.0, 11.0, 12.0, 8.0, 18.0, 16.0, 15.0, 23.0, 21.0, 21.0, 22.0, 26.0, 22.0, 30.0, 27.0, 41.0, 37.0, 42.0, 32.0, 37.0, 39.0, 38.0, 43.0, 41.0, 31.0, 27.0, 30.0, 29.0, 22.0, 26.0, 23.0, 27.0, 20.0, 16.0, 11.0, 12.0, 13.0, 11.0, 10.0, 7.0, 8.0, 2.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-55.5, -53.64990234375, -51.7998046875, -49.94970703125, -48.099609375, -46.24951171875, -44.3994140625, -42.54931640625, -40.69921875, -38.84912109375, -36.9990234375, -35.14892578125, -33.298828125, -31.44873046875, -29.5986328125, -27.74853515625, -25.8984375, -24.04833984375, -22.1982421875, -20.34814453125, -18.498046875, -16.64794921875, -14.7978515625, -12.94775390625, -11.09765625, -9.24755859375, -7.3974609375, -5.54736328125, -3.697265625, -1.84716796875, 0.0029296875, 1.85302734375, 3.703125, 5.55322265625, 7.4033203125, 9.25341796875, 11.103515625, 12.95361328125, 14.8037109375, 16.65380859375, 18.50390625, 20.35400390625, 22.2041015625, 24.05419921875, 25.904296875, 27.75439453125, 29.6044921875, 31.45458984375, 33.3046875, 35.15478515625, 37.0048828125, 38.85498046875, 40.705078125, 42.55517578125, 44.4052734375, 46.25537109375, 48.10546875, 49.95556640625, 51.8056640625, 53.65576171875, 55.505859375, 57.35595703125, 59.2060546875, 61.05615234375, 62.90625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 12.0, 18.0, 26.0, 47.0, 72.0, 123.0, 184.0, 308.0, 486.0, 825.0, 1305.0, 2129.0, 3541.0, 5729.0, 9385.0, 15718.0, 28512.0, 188235.0, 705318.0, 38353.0, 19296.0, 11278.0, 6842.0, 4320.0, 2490.0, 1583.0, 906.0, 611.0, 346.0, 208.0, 124.0, 90.0, 40.0, 36.0, 17.0, 10.0, 11.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.3125, -25.46875, -24.625, -23.78125, -22.9375, -22.09375, -21.25, -20.40625, -19.5625, -18.71875, -17.875, -17.03125, -16.1875, -15.34375, -14.5, -13.65625, -12.8125, -11.96875, -11.125, -10.28125, -9.4375, -8.59375, -7.75, -6.90625, -6.0625, -5.21875, -4.375, -3.53125, -2.6875, -1.84375, -1.0, -0.15625, 0.6875, 1.53125, 2.375, 3.21875, 4.0625, 4.90625, 5.75, 6.59375, 7.4375, 8.28125, 9.125, 9.96875, 10.8125, 11.65625, 12.5, 13.34375, 14.1875, 15.03125, 15.875, 16.71875, 17.5625, 18.40625, 19.25, 20.09375, 20.9375, 21.78125, 22.625, 23.46875, 24.3125, 25.15625, 26.0, 26.84375, 27.6875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 15.0, 16.0, 8.0, 15.0, 20.0, 17.0, 27.0, 27.0, 28.0, 16.0, 28.0, 29.0, 37.0, 33.0, 42.0, 52.0, 35.0, 37.0, 48.0, 42.0, 38.0, 38.0, 32.0, 24.0, 27.0, 30.0, 34.0, 29.0, 16.0, 28.0, 12.0, 19.0, 22.0, 12.0, 12.0, 6.0, 7.0, 7.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.5, -41.146484375, -39.79296875, -38.439453125, -37.0859375, -35.732421875, -34.37890625, -33.025390625, -31.671875, -30.318359375, -28.96484375, -27.611328125, -26.2578125, -24.904296875, -23.55078125, -22.197265625, -20.84375, -19.490234375, -18.13671875, -16.783203125, -15.4296875, -14.076171875, -12.72265625, -11.369140625, -10.015625, -8.662109375, -7.30859375, -5.955078125, -4.6015625, -3.248046875, -1.89453125, -0.541015625, 0.8125, 2.166015625, 3.51953125, 4.873046875, 6.2265625, 7.580078125, 8.93359375, 10.287109375, 11.640625, 12.994140625, 14.34765625, 15.701171875, 17.0546875, 18.408203125, 19.76171875, 21.115234375, 22.46875, 23.822265625, 25.17578125, 26.529296875, 27.8828125, 29.236328125, 30.58984375, 31.943359375, 33.296875, 34.650390625, 36.00390625, 37.357421875, 38.7109375, 40.064453125, 41.41796875, 42.771484375, 44.125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 10.0, 7.0, 14.0, 20.0, 20.0, 41.0, 52.0, 83.0, 143.0, 242.0, 376.0, 639.0, 1045.0, 1909.0, 3189.0, 5542.0, 10340.0, 19016.0, 38119.0, 810029.0, 99065.0, 26876.0, 14119.0, 7556.0, 4256.0, 2315.0, 1404.0, 823.0, 481.0, 306.0, 197.0, 102.0, 70.0, 43.0, 32.0, 29.0, 7.0, 7.0, 15.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.09765625, -3.003082275390625, -2.90850830078125, -2.813934326171875, -2.7193603515625, -2.624786376953125, -2.53021240234375, -2.435638427734375, -2.341064453125, -2.246490478515625, -2.15191650390625, -2.057342529296875, -1.9627685546875, -1.868194580078125, -1.77362060546875, -1.679046630859375, -1.58447265625, -1.489898681640625, -1.39532470703125, -1.300750732421875, -1.2061767578125, -1.111602783203125, -1.01702880859375, -0.922454833984375, -0.827880859375, -0.733306884765625, -0.63873291015625, -0.544158935546875, -0.4495849609375, -0.355010986328125, -0.26043701171875, -0.165863037109375, -0.0712890625, 0.023284912109375, 0.11785888671875, 0.212432861328125, 0.3070068359375, 0.401580810546875, 0.49615478515625, 0.590728759765625, 0.685302734375, 0.779876708984375, 0.87445068359375, 0.969024658203125, 1.0635986328125, 1.158172607421875, 1.25274658203125, 1.347320556640625, 1.44189453125, 1.536468505859375, 1.63104248046875, 1.725616455078125, 1.8201904296875, 1.914764404296875, 2.00933837890625, 2.103912353515625, 2.198486328125, 2.293060302734375, 2.38763427734375, 2.482208251953125, 2.5767822265625, 2.671356201171875, 2.76593017578125, 2.860504150390625, 2.955078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 13.0, 13.0, 10.0, 17.0, 24.0, 28.0, 27.0, 35.0, 28.0, 53.0, 39.0, 44.0, 53.0, 38.0, 50.0, 46.0, 57.0, 49.0, 56.0, 42.0, 31.0, 43.0, 16.0, 35.0, 27.0, 19.0, 23.0, 18.0, 14.0, 11.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.18832015991211e-05, -6.942730396986008e-05, -6.697140634059906e-05, -6.451550871133804e-05, -6.205961108207703e-05, -5.960371345281601e-05, -5.714781582355499e-05, -5.4691918194293976e-05, -5.223602056503296e-05, -4.978012293577194e-05, -4.7324225306510925e-05, -4.486832767724991e-05, -4.241243004798889e-05, -3.9956532418727875e-05, -3.750063478946686e-05, -3.504473716020584e-05, -3.2588839530944824e-05, -3.0132941901683807e-05, -2.767704427242279e-05, -2.5221146643161774e-05, -2.2765249013900757e-05, -2.030935138463974e-05, -1.7853453755378723e-05, -1.5397556126117706e-05, -1.294165849685669e-05, -1.0485760867595673e-05, -8.029863238334656e-06, -5.573965609073639e-06, -3.118067979812622e-06, -6.621703505516052e-07, 1.7937272787094116e-06, 4.2496249079704285e-06, 6.705522537231445e-06, 9.161420166492462e-06, 1.1617317795753479e-05, 1.4073215425014496e-05, 1.6529113054275513e-05, 1.898501068353653e-05, 2.1440908312797546e-05, 2.3896805942058563e-05, 2.635270357131958e-05, 2.8808601200580597e-05, 3.1264498829841614e-05, 3.372039645910263e-05, 3.617629408836365e-05, 3.8632191717624664e-05, 4.108808934688568e-05, 4.35439869761467e-05, 4.5999884605407715e-05, 4.845578223466873e-05, 5.091167986392975e-05, 5.3367577493190765e-05, 5.582347512245178e-05, 5.82793727517128e-05, 6.0735270380973816e-05, 6.319116801023483e-05, 6.564706563949585e-05, 6.810296326875687e-05, 7.055886089801788e-05, 7.30147585272789e-05, 7.547065615653992e-05, 7.792655378580093e-05, 8.038245141506195e-05, 8.283834904432297e-05, 8.529424667358398e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 13.0, 13.0, 13.0, 18.0, 33.0, 54.0, 77.0, 104.0, 150.0, 253.0, 367.0, 536.0, 858.0, 1191.0, 1768.0, 2835.0, 4035.0, 5958.0, 8636.0, 12688.0, 18162.0, 26145.0, 36278.0, 49491.0, 66957.0, 87508.0, 107380.0, 120014.0, 116103.0, 98612.0, 77811.0, 59087.0, 42981.0, 31210.0, 22032.0, 15446.0, 10753.0, 7575.0, 5203.0, 3440.0, 2262.0, 1436.0, 1032.0, 702.0, 441.0, 294.0, 216.0, 142.0, 86.0, 57.0, 30.0, 24.0, 15.0, 19.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.9775390625, -1.9132843017578125, -1.849029541015625, -1.7847747802734375, -1.72052001953125, -1.6562652587890625, -1.592010498046875, -1.5277557373046875, -1.4635009765625, -1.3992462158203125, -1.334991455078125, -1.2707366943359375, -1.20648193359375, -1.1422271728515625, -1.077972412109375, -1.0137176513671875, -0.949462890625, -0.8852081298828125, -0.820953369140625, -0.7566986083984375, -0.69244384765625, -0.6281890869140625, -0.563934326171875, -0.4996795654296875, -0.4354248046875, -0.3711700439453125, -0.306915283203125, -0.2426605224609375, -0.17840576171875, -0.1141510009765625, -0.049896240234375, 0.0143585205078125, 0.07861328125, 0.1428680419921875, 0.207122802734375, 0.2713775634765625, 0.33563232421875, 0.3998870849609375, 0.464141845703125, 0.5283966064453125, 0.5926513671875, 0.6569061279296875, 0.721160888671875, 0.7854156494140625, 0.84967041015625, 0.9139251708984375, 0.978179931640625, 1.0424346923828125, 1.106689453125, 1.1709442138671875, 1.235198974609375, 1.2994537353515625, 1.36370849609375, 1.4279632568359375, 1.492218017578125, 1.5564727783203125, 1.6207275390625, 1.6849822998046875, 1.749237060546875, 1.8134918212890625, 1.87774658203125, 1.9420013427734375, 2.006256103515625, 2.0705108642578125, 2.134765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 9.0, 14.0, 21.0, 16.0, 16.0, 22.0, 30.0, 29.0, 32.0, 41.0, 55.0, 53.0, 55.0, 66.0, 73.0, 70.0, 47.0, 50.0, 42.0, 38.0, 38.0, 18.0, 25.0, 18.0, 11.0, 15.0, 15.0, 14.0, 5.0, 13.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.2724609375, -1.2373580932617188, -1.2022552490234375, -1.1671524047851562, -1.132049560546875, -1.0969467163085938, -1.0618438720703125, -1.0267410278320312, -0.99163818359375, -0.9565353393554688, -0.9214324951171875, -0.8863296508789062, -0.851226806640625, -0.8161239624023438, -0.7810211181640625, -0.7459182739257812, -0.7108154296875, -0.6757125854492188, -0.6406097412109375, -0.6055068969726562, -0.570404052734375, -0.5353012084960938, -0.5001983642578125, -0.46509552001953125, -0.42999267578125, -0.39488983154296875, -0.3597869873046875, -0.32468414306640625, -0.289581298828125, -0.25447845458984375, -0.2193756103515625, -0.18427276611328125, -0.149169921875, -0.11406707763671875, -0.0789642333984375, -0.04386138916015625, -0.008758544921875, 0.02634429931640625, 0.0614471435546875, 0.09654998779296875, 0.13165283203125, 0.16675567626953125, 0.2018585205078125, 0.23696136474609375, 0.272064208984375, 0.30716705322265625, 0.3422698974609375, 0.37737274169921875, 0.4124755859375, 0.44757843017578125, 0.4826812744140625, 0.5177841186523438, 0.552886962890625, 0.5879898071289062, 0.6230926513671875, 0.6581954956054688, 0.69329833984375, 0.7284011840820312, 0.7635040283203125, 0.7986068725585938, 0.833709716796875, 0.8688125610351562, 0.9039154052734375, 0.9390182495117188, 0.97412109375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 11.0, 5.0, 14.0, 14.0, 14.0, 16.0, 32.0, 17.0, 22.0, 39.0, 21.0, 33.0, 28.0, 36.0, 44.0, 46.0, 53.0, 44.0, 40.0, 40.0, 23.0, 33.0, 46.0, 31.0, 34.0, 28.0, 26.0, 20.0, 27.0, 21.0, 20.0, 14.0, 11.0, 12.0, 12.0, 9.0, 11.0, 10.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.98395538330078, -54.17173767089844, -52.359519958496094, -50.54730224609375, -48.73508834838867, -46.92287063598633, -45.110652923583984, -43.29843521118164, -41.48622131347656, -39.67400360107422, -37.861785888671875, -36.04956817626953, -34.23735427856445, -32.42513656616211, -30.612918853759766, -28.800701141357422, -26.988483428955078, -25.176265716552734, -23.364049911499023, -21.55183219909668, -19.73961639404297, -17.927398681640625, -16.11518096923828, -14.302964210510254, -12.490747451782227, -10.6785306930542, -8.866313934326172, -7.054096221923828, -5.241879463195801, -3.4296627044677734, -1.6174449920654297, 0.19477176666259766, 2.0069847106933594, 3.819201707839966, 5.631418704986572, 7.443635940551758, 9.255852699279785, 11.068069458007812, 12.880287170410156, 14.692503929138184, 16.50472068786621, 18.316938400268555, 20.129154205322266, 21.94137191772461, 23.753589630126953, 25.565805435180664, 27.378023147583008, 29.19023895263672, 31.002456665039062, 32.814674377441406, 34.62689208984375, 36.439109802246094, 38.25132369995117, 40.063541412353516, 41.87575912475586, 43.6879768371582, 45.50019073486328, 47.312408447265625, 49.12462615966797, 50.93684387207031, 52.74905776977539, 54.561275482177734, 56.37349319458008, 58.18571090698242, 59.997928619384766]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 4.0, 14.0, 13.0, 10.0, 11.0, 18.0, 13.0, 18.0, 22.0, 20.0, 21.0, 21.0, 26.0, 25.0, 31.0, 29.0, 38.0, 36.0, 47.0, 31.0, 33.0, 43.0, 39.0, 42.0, 38.0, 30.0, 28.0, 30.0, 32.0, 17.0, 28.0, 21.0, 28.0, 20.0, 14.0, 10.0, 10.0, 17.0, 12.0, 7.0, 9.0, 7.0, 2.0, 5.0, 6.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-55.297603607177734, -53.44639205932617, -51.59518051147461, -49.74396896362305, -47.892757415771484, -46.04154586791992, -44.19033432006836, -42.3391227722168, -40.487911224365234, -38.63669967651367, -36.78548812866211, -34.93427658081055, -33.083065032958984, -31.231853485107422, -29.38064193725586, -27.529430389404297, -25.6782169342041, -23.82700538635254, -21.975793838500977, -20.124582290649414, -18.27337074279785, -16.422157287597656, -14.57094669342041, -12.719735145568848, -10.868523597717285, -9.017312049865723, -7.16610050201416, -5.3148884773254395, -3.463676929473877, -1.6124649047851562, 0.23874664306640625, 2.0899581909179688, 3.9411697387695312, 5.792381286621094, 7.643592834472656, 9.494804382324219, 11.346015930175781, 13.19722843170166, 15.048439979553223, 16.89965057373047, 18.75086212158203, 20.602073669433594, 22.453285217285156, 24.30449676513672, 26.15570831298828, 28.006919860839844, 29.858131408691406, 31.70934295654297, 33.56055450439453, 35.411766052246094, 37.262977600097656, 39.11418914794922, 40.96540069580078, 42.816612243652344, 44.667823791503906, 46.51903533935547, 48.3702507019043, 50.22146224975586, 52.07267379760742, 53.923885345458984, 55.77509689331055, 57.62630844116211, 59.47751998901367, 61.328731536865234, 63.1799430847168]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 8.0, 13.0, 27.0, 32.0, 55.0, 93.0, 219.0, 285.0, 472.0, 765.0, 1171.0, 1894.0, 3047.0, 4525.0, 6671.0, 9830.0, 14092.0, 19649.0, 26839.0, 35505.0, 45629.0, 55900.0, 66583.0, 75422.0, 82225.0, 85696.0, 85174.0, 80537.0, 73010.0, 62959.0, 53357.0, 42916.0, 32958.0, 24469.0, 17951.0, 12818.0, 8650.0, 5938.0, 4074.0, 2626.0, 1605.0, 1089.0, 690.0, 436.0, 251.0, 163.0, 103.0, 56.0, 35.0, 20.0, 12.0, 8.0, 5.0, 5.0, 0.0, 1.0], "bins": [-36.75, -35.66455078125, -34.5791015625, -33.49365234375, -32.408203125, -31.32275390625, -30.2373046875, -29.15185546875, -28.06640625, -26.98095703125, -25.8955078125, -24.81005859375, -23.724609375, -22.63916015625, -21.5537109375, -20.46826171875, -19.3828125, -18.29736328125, -17.2119140625, -16.12646484375, -15.041015625, -13.95556640625, -12.8701171875, -11.78466796875, -10.69921875, -9.61376953125, -8.5283203125, -7.44287109375, -6.357421875, -5.27197265625, -4.1865234375, -3.10107421875, -2.015625, -0.93017578125, 0.1552734375, 1.24072265625, 2.326171875, 3.41162109375, 4.4970703125, 5.58251953125, 6.66796875, 7.75341796875, 8.8388671875, 9.92431640625, 11.009765625, 12.09521484375, 13.1806640625, 14.26611328125, 15.3515625, 16.43701171875, 17.5224609375, 18.60791015625, 19.693359375, 20.77880859375, 21.8642578125, 22.94970703125, 24.03515625, 25.12060546875, 26.2060546875, 27.29150390625, 28.376953125, 29.46240234375, 30.5478515625, 31.63330078125, 32.71875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 5.0, 11.0, 12.0, 12.0, 11.0, 16.0, 18.0, 15.0, 23.0, 21.0, 18.0, 22.0, 29.0, 23.0, 33.0, 29.0, 42.0, 37.0, 45.0, 32.0, 29.0, 52.0, 40.0, 40.0, 38.0, 27.0, 28.0, 33.0, 25.0, 19.0, 30.0, 22.0, 28.0, 15.0, 19.0, 5.0, 14.0, 14.0, 11.0, 6.0, 10.0, 3.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-54.0, -52.18017578125, -50.3603515625, -48.54052734375, -46.720703125, -44.90087890625, -43.0810546875, -41.26123046875, -39.44140625, -37.62158203125, -35.8017578125, -33.98193359375, -32.162109375, -30.34228515625, -28.5224609375, -26.70263671875, -24.8828125, -23.06298828125, -21.2431640625, -19.42333984375, -17.603515625, -15.78369140625, -13.9638671875, -12.14404296875, -10.32421875, -8.50439453125, -6.6845703125, -4.86474609375, -3.044921875, -1.22509765625, 0.5947265625, 2.41455078125, 4.234375, 6.05419921875, 7.8740234375, 9.69384765625, 11.513671875, 13.33349609375, 15.1533203125, 16.97314453125, 18.79296875, 20.61279296875, 22.4326171875, 24.25244140625, 26.072265625, 27.89208984375, 29.7119140625, 31.53173828125, 33.3515625, 35.17138671875, 36.9912109375, 38.81103515625, 40.630859375, 42.45068359375, 44.2705078125, 46.09033203125, 47.91015625, 49.72998046875, 51.5498046875, 53.36962890625, 55.189453125, 57.00927734375, 58.8291015625, 60.64892578125, 62.46875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 14.0, 35.0, 47.0, 81.0, 135.0, 224.0, 350.0, 651.0, 1031.0, 1714.0, 2573.0, 4155.0, 6501.0, 9964.0, 14671.0, 21252.0, 29661.0, 39735.0, 51688.0, 64677.0, 76011.0, 86322.0, 91937.0, 92887.0, 88995.0, 81114.0, 69824.0, 57813.0, 45097.0, 34303.0, 24710.0, 17287.0, 11783.0, 7862.0, 5058.0, 3211.0, 1988.0, 1245.0, 807.0, 464.0, 260.0, 179.0, 104.0, 51.0, 46.0, 23.0, 12.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.0, -32.875, -31.75, -30.625, -29.5, -28.375, -27.25, -26.125, -25.0, -23.875, -22.75, -21.625, -20.5, -19.375, -18.25, -17.125, -16.0, -14.875, -13.75, -12.625, -11.5, -10.375, -9.25, -8.125, -7.0, -5.875, -4.75, -3.625, -2.5, -1.375, -0.25, 0.875, 2.0, 3.125, 4.25, 5.375, 6.5, 7.625, 8.75, 9.875, 11.0, 12.125, 13.25, 14.375, 15.5, 16.625, 17.75, 18.875, 20.0, 21.125, 22.25, 23.375, 24.5, 25.625, 26.75, 27.875, 29.0, 30.125, 31.25, 32.375, 33.5, 34.625, 35.75, 36.875, 38.0]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 3.0, 6.0, 5.0, 5.0, 11.0, 7.0, 16.0, 17.0, 18.0, 18.0, 16.0, 21.0, 27.0, 24.0, 31.0, 34.0, 43.0, 34.0, 35.0, 46.0, 40.0, 41.0, 42.0, 52.0, 51.0, 41.0, 33.0, 29.0, 39.0, 33.0, 22.0, 28.0, 16.0, 19.0, 16.0, 10.0, 5.0, 6.0, 13.0, 10.0, 9.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.6875, -39.34912109375, -38.0107421875, -36.67236328125, -35.333984375, -33.99560546875, -32.6572265625, -31.31884765625, -29.98046875, -28.64208984375, -27.3037109375, -25.96533203125, -24.626953125, -23.28857421875, -21.9501953125, -20.61181640625, -19.2734375, -17.93505859375, -16.5966796875, -15.25830078125, -13.919921875, -12.58154296875, -11.2431640625, -9.90478515625, -8.56640625, -7.22802734375, -5.8896484375, -4.55126953125, -3.212890625, -1.87451171875, -0.5361328125, 0.80224609375, 2.140625, 3.47900390625, 4.8173828125, 6.15576171875, 7.494140625, 8.83251953125, 10.1708984375, 11.50927734375, 12.84765625, 14.18603515625, 15.5244140625, 16.86279296875, 18.201171875, 19.53955078125, 20.8779296875, 22.21630859375, 23.5546875, 24.89306640625, 26.2314453125, 27.56982421875, 28.908203125, 30.24658203125, 31.5849609375, 32.92333984375, 34.26171875, 35.60009765625, 36.9384765625, 38.27685546875, 39.615234375, 40.95361328125, 42.2919921875, 43.63037109375, 44.96875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 14.0, 28.0, 36.0, 67.0, 122.0, 181.0, 338.0, 597.0, 1064.0, 1823.0, 3356.0, 5640.0, 9884.0, 16485.0, 26135.0, 40032.0, 58425.0, 79126.0, 98928.0, 114498.0, 120140.0, 115759.0, 100933.0, 81593.0, 60842.0, 42756.0, 27630.0, 17240.0, 10482.0, 6113.0, 3592.0, 1952.0, 1201.0, 684.0, 362.0, 190.0, 126.0, 75.0, 42.0, 29.0, 16.0, 9.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.139404296875, -18.51318359375, -17.886962890625, -17.2607421875, -16.634521484375, -16.00830078125, -15.382080078125, -14.755859375, -14.129638671875, -13.50341796875, -12.877197265625, -12.2509765625, -11.624755859375, -10.99853515625, -10.372314453125, -9.74609375, -9.119873046875, -8.49365234375, -7.867431640625, -7.2412109375, -6.614990234375, -5.98876953125, -5.362548828125, -4.736328125, -4.110107421875, -3.48388671875, -2.857666015625, -2.2314453125, -1.605224609375, -0.97900390625, -0.352783203125, 0.2734375, 0.899658203125, 1.52587890625, 2.152099609375, 2.7783203125, 3.404541015625, 4.03076171875, 4.656982421875, 5.283203125, 5.909423828125, 6.53564453125, 7.161865234375, 7.7880859375, 8.414306640625, 9.04052734375, 9.666748046875, 10.29296875, 10.919189453125, 11.54541015625, 12.171630859375, 12.7978515625, 13.424072265625, 14.05029296875, 14.676513671875, 15.302734375, 15.928955078125, 16.55517578125, 17.181396484375, 17.8076171875, 18.433837890625, 19.06005859375, 19.686279296875, 20.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 11.0, 18.0, 11.0, 16.0, 23.0, 21.0, 29.0, 32.0, 34.0, 40.0, 40.0, 59.0, 43.0, 60.0, 52.0, 58.0, 45.0, 56.0, 54.0, 44.0, 46.0, 35.0, 28.0, 32.0, 23.0, 12.0, 23.0, 12.0, 14.0, 9.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023040771484375, -0.0022216439247131348, -0.0021392107009887695, -0.0020567774772644043, -0.001974344253540039, -0.0018919110298156738, -0.0018094778060913086, -0.0017270445823669434, -0.0016446113586425781, -0.0015621781349182129, -0.0014797449111938477, -0.0013973116874694824, -0.0013148784637451172, -0.001232445240020752, -0.0011500120162963867, -0.0010675787925720215, -0.0009851455688476562, -0.000902712345123291, -0.0008202791213989258, -0.0007378458976745605, -0.0006554126739501953, -0.0005729794502258301, -0.0004905462265014648, -0.0004081130027770996, -0.0003256797790527344, -0.00024324655532836914, -0.0001608133316040039, -7.838010787963867e-05, 4.0531158447265625e-06, 8.64863395690918e-05, 0.00016891956329345703, 0.00025135278701782227, 0.0003337860107421875, 0.00041621923446655273, 0.000498652458190918, 0.0005810856819152832, 0.0006635189056396484, 0.0007459521293640137, 0.0008283853530883789, 0.0009108185768127441, 0.0009932518005371094, 0.0010756850242614746, 0.0011581182479858398, 0.001240551471710205, 0.0013229846954345703, 0.0014054179191589355, 0.0014878511428833008, 0.001570284366607666, 0.0016527175903320312, 0.0017351508140563965, 0.0018175840377807617, 0.001900017261505127, 0.001982450485229492, 0.0020648837089538574, 0.0021473169326782227, 0.002229750156402588, 0.002312183380126953, 0.0023946166038513184, 0.0024770498275756836, 0.002559483051300049, 0.002641916275024414, 0.0027243494987487793, 0.0028067827224731445, 0.0028892159461975098, 0.002971649169921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 14.0, 12.0, 19.0, 35.0, 73.0, 106.0, 155.0, 297.0, 477.0, 818.0, 1395.0, 2105.0, 3429.0, 5541.0, 8760.0, 13368.0, 20435.0, 29650.0, 41667.0, 56821.0, 71856.0, 87974.0, 99269.0, 105014.0, 102913.0, 94723.0, 80537.0, 64981.0, 49087.0, 35965.0, 24985.0, 16607.0, 10980.0, 6953.0, 4341.0, 2754.0, 1695.0, 1091.0, 649.0, 425.0, 222.0, 144.0, 100.0, 43.0, 28.0, 14.0, 8.0, 8.0, 4.0, 3.0, 7.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.453125, -19.828857421875, -19.20458984375, -18.580322265625, -17.9560546875, -17.331787109375, -16.70751953125, -16.083251953125, -15.458984375, -14.834716796875, -14.21044921875, -13.586181640625, -12.9619140625, -12.337646484375, -11.71337890625, -11.089111328125, -10.46484375, -9.840576171875, -9.21630859375, -8.592041015625, -7.9677734375, -7.343505859375, -6.71923828125, -6.094970703125, -5.470703125, -4.846435546875, -4.22216796875, -3.597900390625, -2.9736328125, -2.349365234375, -1.72509765625, -1.100830078125, -0.4765625, 0.147705078125, 0.77197265625, 1.396240234375, 2.0205078125, 2.644775390625, 3.26904296875, 3.893310546875, 4.517578125, 5.141845703125, 5.76611328125, 6.390380859375, 7.0146484375, 7.638916015625, 8.26318359375, 8.887451171875, 9.51171875, 10.135986328125, 10.76025390625, 11.384521484375, 12.0087890625, 12.633056640625, 13.25732421875, 13.881591796875, 14.505859375, 15.130126953125, 15.75439453125, 16.378662109375, 17.0029296875, 17.627197265625, 18.25146484375, 18.875732421875, 19.5]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 7.0, 10.0, 12.0, 14.0, 10.0, 20.0, 23.0, 16.0, 21.0, 30.0, 29.0, 38.0, 36.0, 30.0, 32.0, 41.0, 59.0, 50.0, 62.0, 53.0, 44.0, 37.0, 38.0, 43.0, 51.0, 30.0, 30.0, 27.0, 11.0, 17.0, 15.0, 10.0, 6.0, 4.0, 8.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.0638427734375, -8.760498046875, -8.4571533203125, -8.15380859375, -7.8504638671875, -7.547119140625, -7.2437744140625, -6.9404296875, -6.6370849609375, -6.333740234375, -6.0303955078125, -5.72705078125, -5.4237060546875, -5.120361328125, -4.8170166015625, -4.513671875, -4.2103271484375, -3.906982421875, -3.6036376953125, -3.30029296875, -2.9969482421875, -2.693603515625, -2.3902587890625, -2.0869140625, -1.7835693359375, -1.480224609375, -1.1768798828125, -0.87353515625, -0.5701904296875, -0.266845703125, 0.0364990234375, 0.33984375, 0.6431884765625, 0.946533203125, 1.2498779296875, 1.55322265625, 1.8565673828125, 2.159912109375, 2.4632568359375, 2.7666015625, 3.0699462890625, 3.373291015625, 3.6766357421875, 3.97998046875, 4.2833251953125, 4.586669921875, 4.8900146484375, 5.193359375, 5.4967041015625, 5.800048828125, 6.1033935546875, 6.40673828125, 6.7100830078125, 7.013427734375, 7.3167724609375, 7.6201171875, 7.9234619140625, 8.226806640625, 8.5301513671875, 8.83349609375, 9.1368408203125, 9.440185546875, 9.7435302734375, 10.046875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 5.0, 8.0, 12.0, 5.0, 13.0, 9.0, 17.0, 15.0, 13.0, 15.0, 22.0, 22.0, 18.0, 36.0, 35.0, 32.0, 33.0, 43.0, 48.0, 41.0, 32.0, 40.0, 38.0, 40.0, 51.0, 34.0, 43.0, 29.0, 25.0, 24.0, 24.0, 25.0, 20.0, 17.0, 16.0, 11.0, 19.0, 7.0, 7.0, 10.0, 6.0, 7.0, 8.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.550498962402344, -51.78920364379883, -50.02790832519531, -48.26660919189453, -46.505313873291016, -44.7440185546875, -42.982723236083984, -41.22142791748047, -39.46012878417969, -37.69883346557617, -35.937538146972656, -34.176239013671875, -32.41494369506836, -30.653648376464844, -28.892353057861328, -27.13105583190918, -25.369760513305664, -23.60846519470215, -21.84716796875, -20.085872650146484, -18.324575424194336, -16.56328010559082, -14.801983833312988, -13.040687561035156, -11.279391288757324, -9.518095016479492, -7.75679874420166, -5.995502948760986, -4.234206676483154, -2.4729108810424805, -0.7116146087646484, 1.0496816635131836, 2.8109779357910156, 4.572274208068848, 6.33357048034668, 8.094865798950195, 9.856163024902344, 11.61745834350586, 13.378754615783691, 15.140050888061523, 16.901348114013672, 18.662643432617188, 20.423940658569336, 22.18523597717285, 23.946533203125, 25.707828521728516, 27.46912384033203, 29.23042106628418, 30.991716384887695, 32.753013610839844, 34.51430892944336, 36.275604248046875, 38.03689956665039, 39.798194885253906, 41.55949401855469, 43.3207893371582, 45.08208465576172, 46.843379974365234, 48.60467529296875, 50.36597442626953, 52.12726974487305, 53.88856506347656, 55.64986038208008, 57.411155700683594, 59.172454833984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 10.0, 7.0, 14.0, 16.0, 13.0, 17.0, 24.0, 16.0, 24.0, 25.0, 29.0, 26.0, 25.0, 29.0, 39.0, 33.0, 50.0, 42.0, 33.0, 35.0, 41.0, 56.0, 37.0, 36.0, 26.0, 34.0, 33.0, 17.0, 25.0, 31.0, 20.0, 24.0, 21.0, 20.0, 8.0, 11.0, 7.0, 6.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-64.747314453125, -62.61769104003906, -60.488067626953125, -58.35844421386719, -56.22882080078125, -54.09919738769531, -51.96957015991211, -49.83994674682617, -47.710323333740234, -45.5806999206543, -43.45107650756836, -41.32145309448242, -39.19182586669922, -37.06220245361328, -34.932579040527344, -32.802955627441406, -30.67333221435547, -28.54370880126953, -26.414085388183594, -24.284460067749023, -22.154836654663086, -20.02521324157715, -17.895587921142578, -15.76596450805664, -13.636341094970703, -11.506717681884766, -9.377093315124512, -7.247469425201416, -5.11784553527832, -2.988222122192383, -0.8585977554321289, 1.271026611328125, 3.4006423950195312, 5.530266284942627, 7.659890174865723, 9.789514541625977, 11.919137954711914, 14.048761367797852, 16.178386688232422, 18.30801010131836, 20.437633514404297, 22.567256927490234, 24.696880340576172, 26.826505661010742, 28.95612907409668, 31.085752487182617, 33.21537780761719, 35.345001220703125, 37.47462463378906, 39.604248046875, 41.73387145996094, 43.863494873046875, 45.99311828613281, 48.12274169921875, 50.25236892700195, 52.38199234008789, 54.51161575317383, 56.641239166259766, 58.7708625793457, 60.90048599243164, 63.030113220214844, 65.15973663330078, 67.28936004638672, 69.41898345947266, 71.5486068725586]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 11.0, 11.0, 26.0, 21.0, 47.0, 95.0, 179.0, 308.0, 493.0, 862.0, 1508.0, 2542.0, 4451.0, 7285.0, 11939.0, 19476.0, 31068.0, 48196.0, 73790.0, 108174.0, 153667.0, 208669.0, 270833.0, 331629.0, 381947.0, 410741.0, 413483.0, 386163.0, 340370.0, 279901.0, 217450.0, 161440.0, 113742.0, 77355.0, 51429.0, 32780.0, 20434.0, 12770.0, 7775.0, 4653.0, 2692.0, 1638.0, 961.0, 545.0, 299.0, 179.0, 128.0, 47.0, 35.0, 21.0, 12.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-43.53125, -42.08349609375, -40.6357421875, -39.18798828125, -37.740234375, -36.29248046875, -34.8447265625, -33.39697265625, -31.94921875, -30.50146484375, -29.0537109375, -27.60595703125, -26.158203125, -24.71044921875, -23.2626953125, -21.81494140625, -20.3671875, -18.91943359375, -17.4716796875, -16.02392578125, -14.576171875, -13.12841796875, -11.6806640625, -10.23291015625, -8.78515625, -7.33740234375, -5.8896484375, -4.44189453125, -2.994140625, -1.54638671875, -0.0986328125, 1.34912109375, 2.796875, 4.24462890625, 5.6923828125, 7.14013671875, 8.587890625, 10.03564453125, 11.4833984375, 12.93115234375, 14.37890625, 15.82666015625, 17.2744140625, 18.72216796875, 20.169921875, 21.61767578125, 23.0654296875, 24.51318359375, 25.9609375, 27.40869140625, 28.8564453125, 30.30419921875, 31.751953125, 33.19970703125, 34.6474609375, 36.09521484375, 37.54296875, 38.99072265625, 40.4384765625, 41.88623046875, 43.333984375, 44.78173828125, 46.2294921875, 47.67724609375, 49.125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 9.0, 6.0, 7.0, 16.0, 15.0, 17.0, 17.0, 22.0, 14.0, 25.0, 24.0, 28.0, 25.0, 25.0, 36.0, 36.0, 38.0, 43.0, 43.0, 29.0, 33.0, 46.0, 52.0, 45.0, 29.0, 25.0, 31.0, 32.0, 26.0, 24.0, 24.0, 24.0, 22.0, 24.0, 16.0, 14.0, 8.0, 7.0, 7.0, 6.0, 9.0, 2.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-58.53125, -56.60009765625, -54.6689453125, -52.73779296875, -50.806640625, -48.87548828125, -46.9443359375, -45.01318359375, -43.08203125, -41.15087890625, -39.2197265625, -37.28857421875, -35.357421875, -33.42626953125, -31.4951171875, -29.56396484375, -27.6328125, -25.70166015625, -23.7705078125, -21.83935546875, -19.908203125, -17.97705078125, -16.0458984375, -14.11474609375, -12.18359375, -10.25244140625, -8.3212890625, -6.39013671875, -4.458984375, -2.52783203125, -0.5966796875, 1.33447265625, 3.265625, 5.19677734375, 7.1279296875, 9.05908203125, 10.990234375, 12.92138671875, 14.8525390625, 16.78369140625, 18.71484375, 20.64599609375, 22.5771484375, 24.50830078125, 26.439453125, 28.37060546875, 30.3017578125, 32.23291015625, 34.1640625, 36.09521484375, 38.0263671875, 39.95751953125, 41.888671875, 43.81982421875, 45.7509765625, 47.68212890625, 49.61328125, 51.54443359375, 53.4755859375, 55.40673828125, 57.337890625, 59.26904296875, 61.2001953125, 63.13134765625, 65.0625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 11.0, 20.0, 41.0, 74.0, 143.0, 225.0, 396.0, 651.0, 1145.0, 1898.0, 3292.0, 5403.0, 8824.0, 13956.0, 22272.0, 34693.0, 51958.0, 76222.0, 107770.0, 147345.0, 193712.0, 245097.0, 294054.0, 336604.0, 365759.0, 376040.0, 364859.0, 336058.0, 293649.0, 244975.0, 193072.0, 147245.0, 106742.0, 75223.0, 51907.0, 34520.0, 22245.0, 14099.0, 8765.0, 5353.0, 3286.0, 1920.0, 1157.0, 656.0, 385.0, 230.0, 132.0, 84.0, 47.0, 32.0, 19.0, 14.0, 3.0, 1.0, 3.0], "bins": [-48.84375, -47.427734375, -46.01171875, -44.595703125, -43.1796875, -41.763671875, -40.34765625, -38.931640625, -37.515625, -36.099609375, -34.68359375, -33.267578125, -31.8515625, -30.435546875, -29.01953125, -27.603515625, -26.1875, -24.771484375, -23.35546875, -21.939453125, -20.5234375, -19.107421875, -17.69140625, -16.275390625, -14.859375, -13.443359375, -12.02734375, -10.611328125, -9.1953125, -7.779296875, -6.36328125, -4.947265625, -3.53125, -2.115234375, -0.69921875, 0.716796875, 2.1328125, 3.548828125, 4.96484375, 6.380859375, 7.796875, 9.212890625, 10.62890625, 12.044921875, 13.4609375, 14.876953125, 16.29296875, 17.708984375, 19.125, 20.541015625, 21.95703125, 23.373046875, 24.7890625, 26.205078125, 27.62109375, 29.037109375, 30.453125, 31.869140625, 33.28515625, 34.701171875, 36.1171875, 37.533203125, 38.94921875, 40.365234375, 41.78125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 3.0, 2.0, 5.0, 10.0, 5.0, 16.0, 9.0, 15.0, 17.0, 30.0, 29.0, 32.0, 39.0, 55.0, 64.0, 80.0, 84.0, 119.0, 117.0, 126.0, 130.0, 157.0, 158.0, 178.0, 170.0, 199.0, 200.0, 178.0, 153.0, 178.0, 159.0, 184.0, 145.0, 153.0, 114.0, 130.0, 98.0, 73.0, 69.0, 76.0, 65.0, 43.0, 42.0, 32.0, 29.0, 34.0, 24.0, 21.0, 9.0, 4.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.96875, -24.1494140625, -23.330078125, -22.5107421875, -21.69140625, -20.8720703125, -20.052734375, -19.2333984375, -18.4140625, -17.5947265625, -16.775390625, -15.9560546875, -15.13671875, -14.3173828125, -13.498046875, -12.6787109375, -11.859375, -11.0400390625, -10.220703125, -9.4013671875, -8.58203125, -7.7626953125, -6.943359375, -6.1240234375, -5.3046875, -4.4853515625, -3.666015625, -2.8466796875, -2.02734375, -1.2080078125, -0.388671875, 0.4306640625, 1.25, 2.0693359375, 2.888671875, 3.7080078125, 4.52734375, 5.3466796875, 6.166015625, 6.9853515625, 7.8046875, 8.6240234375, 9.443359375, 10.2626953125, 11.08203125, 11.9013671875, 12.720703125, 13.5400390625, 14.359375, 15.1787109375, 15.998046875, 16.8173828125, 17.63671875, 18.4560546875, 19.275390625, 20.0947265625, 20.9140625, 21.7333984375, 22.552734375, 23.3720703125, 24.19140625, 25.0107421875, 25.830078125, 26.6494140625, 27.46875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 11.0, 9.0, 11.0, 18.0, 18.0, 20.0, 16.0, 21.0, 20.0, 28.0, 27.0, 36.0, 38.0, 41.0, 44.0, 54.0, 63.0, 44.0, 42.0, 44.0, 58.0, 33.0, 40.0, 28.0, 27.0, 31.0, 30.0, 22.0, 19.0, 22.0, 14.0, 9.0, 8.0, 7.0, 6.0, 8.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-78.44146728515625, -76.33866882324219, -74.23587036132812, -72.1330795288086, -70.03028106689453, -67.92748260498047, -65.8246841430664, -63.721885681152344, -61.61909103393555, -59.516292572021484, -57.41349792480469, -55.310699462890625, -53.20790100097656, -51.105106353759766, -49.0023078918457, -46.899513244628906, -44.796714782714844, -42.69391632080078, -40.591121673583984, -38.48832321166992, -36.385528564453125, -34.28273010253906, -32.179931640625, -30.07713508605957, -27.97433853149414, -25.87154197692871, -23.76874542236328, -21.66594696044922, -19.56315040588379, -17.46035385131836, -15.357556343078613, -13.254758834838867, -11.151966094970703, -9.049169540405273, -6.946372032165527, -4.8435750007629395, -2.7407779693603516, -0.6379814147949219, 1.4648160934448242, 3.5676136016845703, 5.67041015625, 7.773207187652588, 9.876004219055176, 11.978801727294922, 14.081598281860352, 16.18439483642578, 18.287193298339844, 20.389989852905273, 22.492786407470703, 24.595582962036133, 26.698379516601562, 28.801177978515625, 30.903974533081055, 33.006771087646484, 35.10956954956055, 37.212364196777344, 39.315162658691406, 41.41796112060547, 43.520755767822266, 45.62355422973633, 47.726348876953125, 49.82914733886719, 51.93194580078125, 54.03474426269531, 56.13753890991211]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 10.0, 8.0, 7.0, 5.0, 13.0, 17.0, 19.0, 16.0, 23.0, 20.0, 32.0, 30.0, 25.0, 41.0, 32.0, 23.0, 48.0, 42.0, 43.0, 44.0, 44.0, 43.0, 47.0, 52.0, 44.0, 34.0, 20.0, 28.0, 40.0, 25.0, 22.0, 19.0, 18.0, 13.0, 13.0, 3.0, 17.0, 4.0, 2.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.32952117919922, -70.92608642578125, -68.52265167236328, -66.11920928955078, -63.71577453613281, -61.312339782714844, -58.908905029296875, -56.505470275878906, -54.10203170776367, -51.6985969543457, -49.29515838623047, -46.8917236328125, -44.48828887939453, -42.0848503112793, -39.68141555786133, -37.277976989746094, -34.874542236328125, -32.471107482910156, -30.067668914794922, -27.664234161376953, -25.26079750061035, -22.85736083984375, -20.45392608642578, -18.05048942565918, -15.647052764892578, -13.243616104125977, -10.840180397033691, -8.436744689941406, -6.033308029174805, -3.629871368408203, -1.226435661315918, 1.1770000457763672, 3.5804367065429688, 5.983872890472412, 8.387309074401855, 10.79074478149414, 13.194181442260742, 15.597618103027344, 18.001052856445312, 20.404489517211914, 22.807926177978516, 25.211362838745117, 27.61479949951172, 30.018234252929688, 32.421669006347656, 34.82510757446289, 37.22854232788086, 39.631980895996094, 42.03541564941406, 44.43885040283203, 46.842288970947266, 49.245723724365234, 51.64916229248047, 54.05259704589844, 56.456031799316406, 58.859466552734375, 61.26290512084961, 63.66633987426758, 66.06977844238281, 68.47321319580078, 70.87664794921875, 73.28009033203125, 75.68352508544922, 78.08695983886719, 80.49039459228516]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 14.0, 9.0, 36.0, 39.0, 70.0, 94.0, 150.0, 238.0, 393.0, 568.0, 933.0, 1389.0, 2162.0, 3399.0, 5161.0, 7729.0, 11879.0, 17476.0, 25554.0, 36840.0, 50749.0, 66423.0, 84545.0, 99853.0, 108293.0, 108470.0, 99757.0, 85001.0, 66995.0, 50568.0, 36464.0, 25627.0, 17374.0, 11874.0, 7808.0, 4899.0, 3364.0, 2227.0, 1462.0, 918.0, 592.0, 364.0, 254.0, 183.0, 114.0, 83.0, 51.0, 32.0, 19.0, 20.0, 12.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-8.390625, -8.12841796875, -7.8662109375, -7.60400390625, -7.341796875, -7.07958984375, -6.8173828125, -6.55517578125, -6.29296875, -6.03076171875, -5.7685546875, -5.50634765625, -5.244140625, -4.98193359375, -4.7197265625, -4.45751953125, -4.1953125, -3.93310546875, -3.6708984375, -3.40869140625, -3.146484375, -2.88427734375, -2.6220703125, -2.35986328125, -2.09765625, -1.83544921875, -1.5732421875, -1.31103515625, -1.048828125, -0.78662109375, -0.5244140625, -0.26220703125, 0.0, 0.26220703125, 0.5244140625, 0.78662109375, 1.048828125, 1.31103515625, 1.5732421875, 1.83544921875, 2.09765625, 2.35986328125, 2.6220703125, 2.88427734375, 3.146484375, 3.40869140625, 3.6708984375, 3.93310546875, 4.1953125, 4.45751953125, 4.7197265625, 4.98193359375, 5.244140625, 5.50634765625, 5.7685546875, 6.03076171875, 6.29296875, 6.55517578125, 6.8173828125, 7.07958984375, 7.341796875, 7.60400390625, 7.8662109375, 8.12841796875, 8.390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 8.0, 8.0, 4.0, 13.0, 19.0, 16.0, 17.0, 22.0, 22.0, 30.0, 30.0, 26.0, 41.0, 32.0, 24.0, 48.0, 40.0, 44.0, 46.0, 43.0, 43.0, 47.0, 49.0, 44.0, 35.0, 22.0, 28.0, 37.0, 28.0, 22.0, 19.0, 18.0, 12.0, 13.0, 5.0, 15.0, 4.0, 3.0, 3.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.8125, -71.40234375, -68.9921875, -66.58203125, -64.171875, -61.76171875, -59.3515625, -56.94140625, -54.53125, -52.12109375, -49.7109375, -47.30078125, -44.890625, -42.48046875, -40.0703125, -37.66015625, -35.25, -32.83984375, -30.4296875, -28.01953125, -25.609375, -23.19921875, -20.7890625, -18.37890625, -15.96875, -13.55859375, -11.1484375, -8.73828125, -6.328125, -3.91796875, -1.5078125, 0.90234375, 3.3125, 5.72265625, 8.1328125, 10.54296875, 12.953125, 15.36328125, 17.7734375, 20.18359375, 22.59375, 25.00390625, 27.4140625, 29.82421875, 32.234375, 34.64453125, 37.0546875, 39.46484375, 41.875, 44.28515625, 46.6953125, 49.10546875, 51.515625, 53.92578125, 56.3359375, 58.74609375, 61.15625, 63.56640625, 65.9765625, 68.38671875, 70.796875, 73.20703125, 75.6171875, 78.02734375, 80.4375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 6.0, 10.0, 5.0, 13.0, 17.0, 26.0, 37.0, 57.0, 82.0, 107.0, 171.0, 242.0, 349.0, 471.0, 650.0, 914.0, 1176.0, 1710.0, 2388.0, 3183.0, 4382.0, 6026.0, 8449.0, 11836.0, 17691.0, 30591.0, 203153.0, 623330.0, 58073.0, 22302.0, 14720.0, 10020.0, 7175.0, 5236.0, 3814.0, 2829.0, 2006.0, 1484.0, 1107.0, 779.0, 495.0, 429.0, 315.0, 218.0, 133.0, 95.0, 83.0, 48.0, 45.0, 25.0, 14.0, 17.0, 9.0, 10.0, 1.0, 3.0, 3.0, 3.0], "bins": [-16.109375, -15.625, -15.140625, -14.65625, -14.171875, -13.6875, -13.203125, -12.71875, -12.234375, -11.75, -11.265625, -10.78125, -10.296875, -9.8125, -9.328125, -8.84375, -8.359375, -7.875, -7.390625, -6.90625, -6.421875, -5.9375, -5.453125, -4.96875, -4.484375, -4.0, -3.515625, -3.03125, -2.546875, -2.0625, -1.578125, -1.09375, -0.609375, -0.125, 0.359375, 0.84375, 1.328125, 1.8125, 2.296875, 2.78125, 3.265625, 3.75, 4.234375, 4.71875, 5.203125, 5.6875, 6.171875, 6.65625, 7.140625, 7.625, 8.109375, 8.59375, 9.078125, 9.5625, 10.046875, 10.53125, 11.015625, 11.5, 11.984375, 12.46875, 12.953125, 13.4375, 13.921875, 14.40625, 14.890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 12.0, 14.0, 14.0, 19.0, 22.0, 23.0, 20.0, 28.0, 26.0, 32.0, 28.0, 34.0, 43.0, 50.0, 58.0, 47.0, 44.0, 39.0, 52.0, 42.0, 37.0, 45.0, 47.0, 25.0, 29.0, 25.0, 21.0, 18.0, 26.0, 12.0, 16.0, 13.0, 14.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.59375, -49.8564453125, -48.119140625, -46.3818359375, -44.64453125, -42.9072265625, -41.169921875, -39.4326171875, -37.6953125, -35.9580078125, -34.220703125, -32.4833984375, -30.74609375, -29.0087890625, -27.271484375, -25.5341796875, -23.796875, -22.0595703125, -20.322265625, -18.5849609375, -16.84765625, -15.1103515625, -13.373046875, -11.6357421875, -9.8984375, -8.1611328125, -6.423828125, -4.6865234375, -2.94921875, -1.2119140625, 0.525390625, 2.2626953125, 4.0, 5.7373046875, 7.474609375, 9.2119140625, 10.94921875, 12.6865234375, 14.423828125, 16.1611328125, 17.8984375, 19.6357421875, 21.373046875, 23.1103515625, 24.84765625, 26.5849609375, 28.322265625, 30.0595703125, 31.796875, 33.5341796875, 35.271484375, 37.0087890625, 38.74609375, 40.4833984375, 42.220703125, 43.9580078125, 45.6953125, 47.4326171875, 49.169921875, 50.9072265625, 52.64453125, 54.3818359375, 56.119140625, 57.8564453125, 59.59375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 11.0, 11.0, 14.0, 17.0, 31.0, 41.0, 47.0, 78.0, 112.0, 135.0, 235.0, 279.0, 433.0, 627.0, 940.0, 1388.0, 2029.0, 3041.0, 4434.0, 6742.0, 10233.0, 15530.0, 24688.0, 81162.0, 790983.0, 42207.0, 21684.0, 13920.0, 9153.0, 6018.0, 4014.0, 2647.0, 1783.0, 1221.0, 825.0, 529.0, 402.0, 268.0, 166.0, 138.0, 102.0, 57.0, 56.0, 33.0, 33.0, 11.0, 8.0, 11.0, 7.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.140625, -2.074493408203125, -2.00836181640625, -1.942230224609375, -1.8760986328125, -1.809967041015625, -1.74383544921875, -1.677703857421875, -1.611572265625, -1.545440673828125, -1.47930908203125, -1.413177490234375, -1.3470458984375, -1.280914306640625, -1.21478271484375, -1.148651123046875, -1.08251953125, -1.016387939453125, -0.95025634765625, -0.884124755859375, -0.8179931640625, -0.751861572265625, -0.68572998046875, -0.619598388671875, -0.553466796875, -0.487335205078125, -0.42120361328125, -0.355072021484375, -0.2889404296875, -0.222808837890625, -0.15667724609375, -0.090545654296875, -0.0244140625, 0.041717529296875, 0.10784912109375, 0.173980712890625, 0.2401123046875, 0.306243896484375, 0.37237548828125, 0.438507080078125, 0.504638671875, 0.570770263671875, 0.63690185546875, 0.703033447265625, 0.7691650390625, 0.835296630859375, 0.90142822265625, 0.967559814453125, 1.03369140625, 1.099822998046875, 1.16595458984375, 1.232086181640625, 1.2982177734375, 1.364349365234375, 1.43048095703125, 1.496612548828125, 1.562744140625, 1.628875732421875, 1.69500732421875, 1.761138916015625, 1.8272705078125, 1.893402099609375, 1.95953369140625, 2.025665283203125, 2.091796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 4.0, 4.0, 10.0, 19.0, 14.0, 20.0, 14.0, 21.0, 28.0, 17.0, 35.0, 31.0, 38.0, 33.0, 51.0, 56.0, 35.0, 40.0, 49.0, 41.0, 54.0, 46.0, 36.0, 35.0, 39.0, 40.0, 31.0, 22.0, 21.0, 17.0, 16.0, 17.0, 10.0, 11.0, 3.0, 9.0, 1.0, 8.0, 4.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 1.0], "bins": [-7.224082946777344e-05, -7.024593651294708e-05, -6.825104355812073e-05, -6.625615060329437e-05, -6.426125764846802e-05, -6.226636469364166e-05, -6.027147173881531e-05, -5.827657878398895e-05, -5.62816858291626e-05, -5.428679287433624e-05, -5.229189991950989e-05, -5.029700696468353e-05, -4.830211400985718e-05, -4.630722105503082e-05, -4.431232810020447e-05, -4.231743514537811e-05, -4.032254219055176e-05, -3.83276492357254e-05, -3.633275628089905e-05, -3.433786332607269e-05, -3.234297037124634e-05, -3.0348077416419983e-05, -2.8353184461593628e-05, -2.6358291506767273e-05, -2.4363398551940918e-05, -2.2368505597114563e-05, -2.0373612642288208e-05, -1.8378719687461853e-05, -1.6383826732635498e-05, -1.4388933777809143e-05, -1.2394040822982788e-05, -1.0399147868156433e-05, -8.404254913330078e-06, -6.409361958503723e-06, -4.414469003677368e-06, -2.419576048851013e-06, -4.246830940246582e-07, 1.5702098608016968e-06, 3.5651028156280518e-06, 5.559995770454407e-06, 7.554888725280762e-06, 9.549781680107117e-06, 1.1544674634933472e-05, 1.3539567589759827e-05, 1.553446054458618e-05, 1.7529353499412537e-05, 1.952424645423889e-05, 2.1519139409065247e-05, 2.35140323638916e-05, 2.5508925318717957e-05, 2.750381827354431e-05, 2.9498711228370667e-05, 3.149360418319702e-05, 3.3488497138023376e-05, 3.548339009284973e-05, 3.7478283047676086e-05, 3.947317600250244e-05, 4.1468068957328796e-05, 4.346296191215515e-05, 4.5457854866981506e-05, 4.745274782180786e-05, 4.9447640776634216e-05, 5.144253373146057e-05, 5.3437426686286926e-05, 5.543231964111328e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 11.0, 12.0, 18.0, 48.0, 45.0, 83.0, 118.0, 161.0, 238.0, 373.0, 526.0, 755.0, 1140.0, 1624.0, 2391.0, 3278.0, 4897.0, 6848.0, 9652.0, 14233.0, 19534.0, 27555.0, 38876.0, 52906.0, 70803.0, 91497.0, 110773.0, 119125.0, 112220.0, 93968.0, 73139.0, 54603.0, 40099.0, 28479.0, 20639.0, 14438.0, 10174.0, 7190.0, 4893.0, 3426.0, 2365.0, 1687.0, 1142.0, 809.0, 569.0, 411.0, 257.0, 198.0, 117.0, 91.0, 45.0, 40.0, 13.0, 19.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.6806640625, -1.6256561279296875, -1.570648193359375, -1.5156402587890625, -1.46063232421875, -1.4056243896484375, -1.350616455078125, -1.2956085205078125, -1.2406005859375, -1.1855926513671875, -1.130584716796875, -1.0755767822265625, -1.02056884765625, -0.9655609130859375, -0.910552978515625, -0.8555450439453125, -0.800537109375, -0.7455291748046875, -0.690521240234375, -0.6355133056640625, -0.58050537109375, -0.5254974365234375, -0.470489501953125, -0.4154815673828125, -0.3604736328125, -0.3054656982421875, -0.250457763671875, -0.1954498291015625, -0.14044189453125, -0.0854339599609375, -0.030426025390625, 0.0245819091796875, 0.07958984375, 0.1345977783203125, 0.189605712890625, 0.2446136474609375, 0.29962158203125, 0.3546295166015625, 0.409637451171875, 0.4646453857421875, 0.5196533203125, 0.5746612548828125, 0.629669189453125, 0.6846771240234375, 0.73968505859375, 0.7946929931640625, 0.849700927734375, 0.9047088623046875, 0.959716796875, 1.0147247314453125, 1.069732666015625, 1.1247406005859375, 1.17974853515625, 1.2347564697265625, 1.289764404296875, 1.3447723388671875, 1.3997802734375, 1.4547882080078125, 1.509796142578125, 1.5648040771484375, 1.61981201171875, 1.6748199462890625, 1.729827880859375, 1.7848358154296875, 1.83984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 6.0, 6.0, 10.0, 3.0, 12.0, 16.0, 10.0, 23.0, 30.0, 27.0, 40.0, 55.0, 32.0, 48.0, 60.0, 89.0, 89.0, 72.0, 46.0, 45.0, 38.0, 40.0, 33.0, 30.0, 24.0, 30.0, 18.0, 11.0, 9.0, 13.0, 5.0, 2.0, 4.0, 5.0, 1.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1591796875, -1.1164093017578125, -1.073638916015625, -1.0308685302734375, -0.98809814453125, -0.9453277587890625, -0.902557373046875, -0.8597869873046875, -0.8170166015625, -0.7742462158203125, -0.731475830078125, -0.6887054443359375, -0.64593505859375, -0.6031646728515625, -0.560394287109375, -0.5176239013671875, -0.474853515625, -0.4320831298828125, -0.389312744140625, -0.3465423583984375, -0.30377197265625, -0.2610015869140625, -0.218231201171875, -0.1754608154296875, -0.1326904296875, -0.0899200439453125, -0.047149658203125, -0.0043792724609375, 0.03839111328125, 0.0811614990234375, 0.123931884765625, 0.1667022705078125, 0.20947265625, 0.2522430419921875, 0.295013427734375, 0.3377838134765625, 0.38055419921875, 0.4233245849609375, 0.466094970703125, 0.5088653564453125, 0.5516357421875, 0.5944061279296875, 0.637176513671875, 0.6799468994140625, 0.72271728515625, 0.7654876708984375, 0.808258056640625, 0.8510284423828125, 0.893798828125, 0.9365692138671875, 0.979339599609375, 1.0221099853515625, 1.06488037109375, 1.1076507568359375, 1.150421142578125, 1.1931915283203125, 1.2359619140625, 1.2787322998046875, 1.321502685546875, 1.3642730712890625, 1.40704345703125, 1.4498138427734375, 1.492584228515625, 1.5353546142578125, 1.578125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 9.0, 12.0, 11.0, 23.0, 17.0, 17.0, 21.0, 19.0, 24.0, 21.0, 34.0, 39.0, 36.0, 43.0, 46.0, 56.0, 55.0, 49.0, 38.0, 50.0, 51.0, 37.0, 37.0, 30.0, 35.0, 25.0, 23.0, 25.0, 22.0, 14.0, 12.0, 11.0, 10.0, 3.0, 6.0, 11.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-79.88013458251953, -77.76766967773438, -75.65519714355469, -73.54273223876953, -71.43026733398438, -69.31780242919922, -67.20533752441406, -65.09286499023438, -62.98040008544922, -60.86793518066406, -58.75546646118164, -56.64299774169922, -54.53053283691406, -52.418067932128906, -50.305599212646484, -48.19313049316406, -46.080665588378906, -43.96820068359375, -41.85573196411133, -39.743263244628906, -37.63079833984375, -35.518333435058594, -33.40586471557617, -31.293397903442383, -29.180931091308594, -27.068464279174805, -24.955997467041016, -22.843530654907227, -20.731063842773438, -18.61859703063965, -16.50613021850586, -14.39366340637207, -12.281192779541016, -10.168725967407227, -8.056259155273438, -5.943792343139648, -3.8313255310058594, -1.7188587188720703, 0.39360809326171875, 2.506074905395508, 4.618541717529297, 6.731008529663086, 8.843475341796875, 10.955942153930664, 13.068408966064453, 15.180875778198242, 17.29334259033203, 19.40580940246582, 21.51827621459961, 23.6307430267334, 25.743209838867188, 27.855676651000977, 29.968143463134766, 32.08061218261719, 34.193077087402344, 36.3055419921875, 38.41801071166992, 40.530479431152344, 42.6429443359375, 44.755409240722656, 46.86787796020508, 48.9803466796875, 51.092811584472656, 53.20527648925781, 55.317745208740234]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 12.0, 7.0, 5.0, 6.0, 12.0, 20.0, 16.0, 16.0, 27.0, 20.0, 36.0, 25.0, 24.0, 42.0, 29.0, 27.0, 45.0, 46.0, 40.0, 49.0, 40.0, 42.0, 48.0, 54.0, 42.0, 32.0, 24.0, 26.0, 37.0, 27.0, 22.0, 17.0, 21.0, 12.0, 11.0, 5.0, 15.0, 4.0, 2.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.3089828491211, -70.90727996826172, -68.50557708740234, -66.10387420654297, -63.70217514038086, -61.300472259521484, -58.89876937866211, -56.4970703125, -54.095367431640625, -51.69366455078125, -49.291961669921875, -46.8902587890625, -44.48855972290039, -42.086856842041016, -39.68515396118164, -37.28345489501953, -34.88174819946289, -32.480045318603516, -30.078344345092773, -27.6766414642334, -25.274940490722656, -22.87323760986328, -20.471534729003906, -18.069833755493164, -15.668130874633789, -13.26642894744873, -10.864727020263672, -8.463024139404297, -6.061322212219238, -3.6596202850341797, -1.2579174041748047, 1.1437835693359375, 3.5454864501953125, 5.947188377380371, 8.34889030456543, 10.750593185424805, 13.152295112609863, 15.553997039794922, 17.955699920654297, 20.35740089416504, 22.759103775024414, 25.16080665588379, 27.56250762939453, 29.964210510253906, 32.36591339111328, 34.767616271972656, 37.16931915283203, 39.57101821899414, 41.972721099853516, 44.37442398071289, 46.776126861572266, 49.177825927734375, 51.57952880859375, 53.981231689453125, 56.3829345703125, 58.784637451171875, 61.18634033203125, 63.588043212890625, 65.98974609375, 68.39144897460938, 70.79315185546875, 73.19485473632812, 75.5965576171875, 77.99825286865234, 80.39995574951172]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 9.0, 11.0, 9.0, 24.0, 55.0, 68.0, 115.0, 183.0, 337.0, 571.0, 952.0, 1479.0, 2392.0, 3854.0, 5967.0, 9128.0, 13696.0, 19649.0, 27743.0, 37418.0, 48445.0, 60860.0, 72988.0, 82096.0, 89519.0, 92336.0, 89942.0, 82454.0, 72746.0, 61235.0, 48627.0, 37195.0, 27898.0, 19510.0, 13666.0, 9235.0, 5798.0, 3930.0, 2392.0, 1568.0, 965.0, 625.0, 345.0, 220.0, 127.0, 67.0, 52.0, 26.0, 14.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-38.71875, -37.48974609375, -36.2607421875, -35.03173828125, -33.802734375, -32.57373046875, -31.3447265625, -30.11572265625, -28.88671875, -27.65771484375, -26.4287109375, -25.19970703125, -23.970703125, -22.74169921875, -21.5126953125, -20.28369140625, -19.0546875, -17.82568359375, -16.5966796875, -15.36767578125, -14.138671875, -12.90966796875, -11.6806640625, -10.45166015625, -9.22265625, -7.99365234375, -6.7646484375, -5.53564453125, -4.306640625, -3.07763671875, -1.8486328125, -0.61962890625, 0.609375, 1.83837890625, 3.0673828125, 4.29638671875, 5.525390625, 6.75439453125, 7.9833984375, 9.21240234375, 10.44140625, 11.67041015625, 12.8994140625, 14.12841796875, 15.357421875, 16.58642578125, 17.8154296875, 19.04443359375, 20.2734375, 21.50244140625, 22.7314453125, 23.96044921875, 25.189453125, 26.41845703125, 27.6474609375, 28.87646484375, 30.10546875, 31.33447265625, 32.5634765625, 33.79248046875, 35.021484375, 36.25048828125, 37.4794921875, 38.70849609375, 39.9375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 7.0, 6.0, 9.0, 9.0, 18.0, 19.0, 18.0, 23.0, 21.0, 33.0, 25.0, 27.0, 40.0, 31.0, 28.0, 43.0, 45.0, 39.0, 52.0, 40.0, 46.0, 45.0, 53.0, 45.0, 29.0, 23.0, 26.0, 36.0, 30.0, 21.0, 19.0, 18.0, 12.0, 11.0, 6.0, 14.0, 5.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.1875, -68.8564453125, -66.525390625, -64.1943359375, -61.86328125, -59.5322265625, -57.201171875, -54.8701171875, -52.5390625, -50.2080078125, -47.876953125, -45.5458984375, -43.21484375, -40.8837890625, -38.552734375, -36.2216796875, -33.890625, -31.5595703125, -29.228515625, -26.8974609375, -24.56640625, -22.2353515625, -19.904296875, -17.5732421875, -15.2421875, -12.9111328125, -10.580078125, -8.2490234375, -5.91796875, -3.5869140625, -1.255859375, 1.0751953125, 3.40625, 5.7373046875, 8.068359375, 10.3994140625, 12.73046875, 15.0615234375, 17.392578125, 19.7236328125, 22.0546875, 24.3857421875, 26.716796875, 29.0478515625, 31.37890625, 33.7099609375, 36.041015625, 38.3720703125, 40.703125, 43.0341796875, 45.365234375, 47.6962890625, 50.02734375, 52.3583984375, 54.689453125, 57.0205078125, 59.3515625, 61.6826171875, 64.013671875, 66.3447265625, 68.67578125, 71.0068359375, 73.337890625, 75.6689453125, 78.0]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 14.0, 15.0, 41.0, 67.0, 91.0, 154.0, 276.0, 423.0, 748.0, 1147.0, 1781.0, 2779.0, 4241.0, 6414.0, 9390.0, 13677.0, 19098.0, 26237.0, 34481.0, 44099.0, 54667.0, 64576.0, 73652.0, 80603.0, 83704.0, 84224.0, 81180.0, 74144.0, 65097.0, 54839.0, 44215.0, 35244.0, 26326.0, 19321.0, 13565.0, 9597.0, 6449.0, 4356.0, 2801.0, 1846.0, 1186.0, 718.0, 436.0, 261.0, 160.0, 88.0, 62.0, 26.0, 27.0, 11.0, 2.0, 7.0, 0.0, 2.0, 1.0], "bins": [-37.96875, -36.8525390625, -35.736328125, -34.6201171875, -33.50390625, -32.3876953125, -31.271484375, -30.1552734375, -29.0390625, -27.9228515625, -26.806640625, -25.6904296875, -24.57421875, -23.4580078125, -22.341796875, -21.2255859375, -20.109375, -18.9931640625, -17.876953125, -16.7607421875, -15.64453125, -14.5283203125, -13.412109375, -12.2958984375, -11.1796875, -10.0634765625, -8.947265625, -7.8310546875, -6.71484375, -5.5986328125, -4.482421875, -3.3662109375, -2.25, -1.1337890625, -0.017578125, 1.0986328125, 2.21484375, 3.3310546875, 4.447265625, 5.5634765625, 6.6796875, 7.7958984375, 8.912109375, 10.0283203125, 11.14453125, 12.2607421875, 13.376953125, 14.4931640625, 15.609375, 16.7255859375, 17.841796875, 18.9580078125, 20.07421875, 21.1904296875, 22.306640625, 23.4228515625, 24.5390625, 25.6552734375, 26.771484375, 27.8876953125, 29.00390625, 30.1201171875, 31.236328125, 32.3525390625, 33.46875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 16.0, 9.0, 8.0, 22.0, 16.0, 17.0, 29.0, 27.0, 28.0, 26.0, 29.0, 31.0, 37.0, 57.0, 41.0, 42.0, 47.0, 50.0, 44.0, 39.0, 53.0, 34.0, 37.0, 31.0, 37.0, 21.0, 33.0, 23.0, 22.0, 13.0, 18.0, 17.0, 7.0, 11.0, 6.0, 7.0, 2.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5, -50.814453125, -49.12890625, -47.443359375, -45.7578125, -44.072265625, -42.38671875, -40.701171875, -39.015625, -37.330078125, -35.64453125, -33.958984375, -32.2734375, -30.587890625, -28.90234375, -27.216796875, -25.53125, -23.845703125, -22.16015625, -20.474609375, -18.7890625, -17.103515625, -15.41796875, -13.732421875, -12.046875, -10.361328125, -8.67578125, -6.990234375, -5.3046875, -3.619140625, -1.93359375, -0.248046875, 1.4375, 3.123046875, 4.80859375, 6.494140625, 8.1796875, 9.865234375, 11.55078125, 13.236328125, 14.921875, 16.607421875, 18.29296875, 19.978515625, 21.6640625, 23.349609375, 25.03515625, 26.720703125, 28.40625, 30.091796875, 31.77734375, 33.462890625, 35.1484375, 36.833984375, 38.51953125, 40.205078125, 41.890625, 43.576171875, 45.26171875, 46.947265625, 48.6328125, 50.318359375, 52.00390625, 53.689453125, 55.375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 6.0, 11.0, 14.0, 23.0, 51.0, 56.0, 82.0, 123.0, 188.0, 318.0, 449.0, 643.0, 969.0, 1493.0, 2151.0, 3158.0, 4590.0, 6668.0, 9513.0, 13259.0, 18157.0, 24046.0, 32623.0, 41651.0, 51072.0, 61334.0, 70438.0, 77668.0, 82003.0, 82957.0, 80404.0, 74972.0, 66021.0, 56546.0, 46274.0, 36882.0, 28336.0, 21183.0, 15552.0, 11294.0, 8034.0, 5517.0, 3831.0, 2558.0, 1781.0, 1224.0, 792.0, 535.0, 379.0, 249.0, 160.0, 132.0, 70.0, 45.0, 33.0, 19.0, 12.0, 9.0, 3.0, 0.0, 4.0], "bins": [-16.6875, -16.170166015625, -15.65283203125, -15.135498046875, -14.6181640625, -14.100830078125, -13.58349609375, -13.066162109375, -12.548828125, -12.031494140625, -11.51416015625, -10.996826171875, -10.4794921875, -9.962158203125, -9.44482421875, -8.927490234375, -8.41015625, -7.892822265625, -7.37548828125, -6.858154296875, -6.3408203125, -5.823486328125, -5.30615234375, -4.788818359375, -4.271484375, -3.754150390625, -3.23681640625, -2.719482421875, -2.2021484375, -1.684814453125, -1.16748046875, -0.650146484375, -0.1328125, 0.384521484375, 0.90185546875, 1.419189453125, 1.9365234375, 2.453857421875, 2.97119140625, 3.488525390625, 4.005859375, 4.523193359375, 5.04052734375, 5.557861328125, 6.0751953125, 6.592529296875, 7.10986328125, 7.627197265625, 8.14453125, 8.661865234375, 9.17919921875, 9.696533203125, 10.2138671875, 10.731201171875, 11.24853515625, 11.765869140625, 12.283203125, 12.800537109375, 13.31787109375, 13.835205078125, 14.3525390625, 14.869873046875, 15.38720703125, 15.904541015625, 16.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 5.0, 14.0, 18.0, 7.0, 9.0, 27.0, 28.0, 31.0, 36.0, 23.0, 63.0, 46.0, 37.0, 46.0, 62.0, 39.0, 51.0, 61.0, 53.0, 42.0, 35.0, 44.0, 32.0, 29.0, 30.0, 21.0, 29.0, 12.0, 11.0, 5.0, 6.0, 9.0, 12.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0032806396484375, -0.0031862258911132812, -0.0030918121337890625, -0.0029973983764648438, -0.002902984619140625, -0.0028085708618164062, -0.0027141571044921875, -0.0026197433471679688, -0.00252532958984375, -0.0024309158325195312, -0.0023365020751953125, -0.0022420883178710938, -0.002147674560546875, -0.0020532608032226562, -0.0019588470458984375, -0.0018644332885742188, -0.00177001953125, -0.0016756057739257812, -0.0015811920166015625, -0.0014867782592773438, -0.001392364501953125, -0.0012979507446289062, -0.0012035369873046875, -0.0011091232299804688, -0.00101470947265625, -0.0009202957153320312, -0.0008258819580078125, -0.0007314682006835938, -0.000637054443359375, -0.0005426406860351562, -0.0004482269287109375, -0.00035381317138671875, -0.0002593994140625, -0.00016498565673828125, -7.05718994140625e-05, 2.384185791015625e-05, 0.000118255615234375, 0.00021266937255859375, 0.0003070831298828125, 0.00040149688720703125, 0.00049591064453125, 0.0005903244018554688, 0.0006847381591796875, 0.0007791519165039062, 0.000873565673828125, 0.0009679794311523438, 0.0010623931884765625, 0.0011568069458007812, 0.001251220703125, 0.0013456344604492188, 0.0014400482177734375, 0.0015344619750976562, 0.001628875732421875, 0.0017232894897460938, 0.0018177032470703125, 0.0019121170043945312, 0.00200653076171875, 0.0021009445190429688, 0.0021953582763671875, 0.0022897720336914062, 0.002384185791015625, 0.0024785995483398438, 0.0025730133056640625, 0.0026674270629882812, 0.0027618408203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 7.0, 9.0, 15.0, 24.0, 31.0, 69.0, 94.0, 128.0, 206.0, 340.0, 541.0, 822.0, 1354.0, 2088.0, 3173.0, 4704.0, 7286.0, 10506.0, 15118.0, 21263.0, 29241.0, 38493.0, 49037.0, 60918.0, 72173.0, 81428.0, 86658.0, 88751.0, 86516.0, 79628.0, 70329.0, 59557.0, 47971.0, 37241.0, 27825.0, 20717.0, 14372.0, 10041.0, 6753.0, 4586.0, 2971.0, 2043.0, 1285.0, 830.0, 500.0, 338.0, 230.0, 140.0, 81.0, 54.0, 29.0, 17.0, 17.0, 5.0, 6.0, 1.0, 6.0, 1.0, 3.0], "bins": [-19.6875, -19.08056640625, -18.4736328125, -17.86669921875, -17.259765625, -16.65283203125, -16.0458984375, -15.43896484375, -14.83203125, -14.22509765625, -13.6181640625, -13.01123046875, -12.404296875, -11.79736328125, -11.1904296875, -10.58349609375, -9.9765625, -9.36962890625, -8.7626953125, -8.15576171875, -7.548828125, -6.94189453125, -6.3349609375, -5.72802734375, -5.12109375, -4.51416015625, -3.9072265625, -3.30029296875, -2.693359375, -2.08642578125, -1.4794921875, -0.87255859375, -0.265625, 0.34130859375, 0.9482421875, 1.55517578125, 2.162109375, 2.76904296875, 3.3759765625, 3.98291015625, 4.58984375, 5.19677734375, 5.8037109375, 6.41064453125, 7.017578125, 7.62451171875, 8.2314453125, 8.83837890625, 9.4453125, 10.05224609375, 10.6591796875, 11.26611328125, 11.873046875, 12.47998046875, 13.0869140625, 13.69384765625, 14.30078125, 14.90771484375, 15.5146484375, 16.12158203125, 16.728515625, 17.33544921875, 17.9423828125, 18.54931640625, 19.15625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 7.0, 7.0, 12.0, 11.0, 14.0, 15.0, 7.0, 28.0, 15.0, 26.0, 31.0, 29.0, 42.0, 36.0, 36.0, 51.0, 42.0, 37.0, 40.0, 55.0, 51.0, 54.0, 37.0, 27.0, 39.0, 33.0, 28.0, 33.0, 24.0, 24.0, 19.0, 15.0, 11.0, 16.0, 8.0, 11.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8515625, -10.503662109375, -10.15576171875, -9.807861328125, -9.4599609375, -9.112060546875, -8.76416015625, -8.416259765625, -8.068359375, -7.720458984375, -7.37255859375, -7.024658203125, -6.6767578125, -6.328857421875, -5.98095703125, -5.633056640625, -5.28515625, -4.937255859375, -4.58935546875, -4.241455078125, -3.8935546875, -3.545654296875, -3.19775390625, -2.849853515625, -2.501953125, -2.154052734375, -1.80615234375, -1.458251953125, -1.1103515625, -0.762451171875, -0.41455078125, -0.066650390625, 0.28125, 0.629150390625, 0.97705078125, 1.324951171875, 1.6728515625, 2.020751953125, 2.36865234375, 2.716552734375, 3.064453125, 3.412353515625, 3.76025390625, 4.108154296875, 4.4560546875, 4.803955078125, 5.15185546875, 5.499755859375, 5.84765625, 6.195556640625, 6.54345703125, 6.891357421875, 7.2392578125, 7.587158203125, 7.93505859375, 8.282958984375, 8.630859375, 8.978759765625, 9.32666015625, 9.674560546875, 10.0224609375, 10.370361328125, 10.71826171875, 11.066162109375, 11.4140625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 4.0, 6.0, 7.0, 10.0, 8.0, 5.0, 9.0, 12.0, 13.0, 21.0, 18.0, 26.0, 26.0, 33.0, 37.0, 31.0, 28.0, 47.0, 35.0, 36.0, 41.0, 45.0, 51.0, 49.0, 33.0, 38.0, 41.0, 38.0, 29.0, 27.0, 32.0, 19.0, 19.0, 27.0, 14.0, 17.0, 16.0, 12.0, 12.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-68.19844055175781, -66.23094940185547, -64.26345825195312, -62.295963287353516, -60.32847213745117, -58.36098098754883, -56.39348602294922, -54.425994873046875, -52.45850372314453, -50.49101257324219, -48.523521423339844, -46.556026458740234, -44.58853530883789, -42.62104415893555, -40.65354919433594, -38.686058044433594, -36.71856689453125, -34.751075744628906, -32.78358459472656, -30.816089630126953, -28.84859848022461, -26.881107330322266, -24.91361427307129, -22.946121215820312, -20.97863006591797, -19.011138916015625, -17.04364585876465, -15.076153755187988, -13.108661651611328, -11.141169548034668, -9.173677444458008, -7.206185340881348, -5.238697052001953, -3.271204948425293, -1.3037128448486328, 0.6637792587280273, 2.6312713623046875, 4.598763465881348, 6.566255569458008, 8.533747673034668, 10.501239776611328, 12.468731880187988, 14.436223983764648, 16.403717041015625, 18.37120819091797, 20.338699340820312, 22.30619239807129, 24.273685455322266, 26.24117660522461, 28.208667755126953, 30.17616081237793, 32.143653869628906, 34.11114501953125, 36.078636169433594, 38.04612731933594, 40.01362228393555, 41.98111343383789, 43.948604583740234, 45.916099548339844, 47.88359069824219, 49.85108184814453, 51.818572998046875, 53.78606414794922, 55.75355911254883, 57.72105026245117]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 6.0, 10.0, 7.0, 5.0, 15.0, 13.0, 13.0, 10.0, 20.0, 23.0, 24.0, 26.0, 30.0, 26.0, 34.0, 27.0, 27.0, 40.0, 31.0, 37.0, 42.0, 42.0, 35.0, 39.0, 44.0, 36.0, 39.0, 35.0, 36.0, 28.0, 27.0, 32.0, 25.0, 16.0, 13.0, 13.0, 13.0, 9.0, 12.0, 7.0, 8.0, 3.0, 1.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.96417236328125, -69.64633178710938, -67.32849884033203, -65.01065826416016, -62.69282150268555, -60.37498474121094, -58.05714416503906, -55.73930740356445, -53.421470642089844, -51.103633880615234, -48.785797119140625, -46.46795654296875, -44.15011978149414, -41.83228302001953, -39.514442443847656, -37.19660568237305, -34.87876892089844, -32.56093215942383, -30.243093490600586, -27.925254821777344, -25.607418060302734, -23.289581298828125, -20.971742630004883, -18.65390396118164, -16.33606719970703, -14.018229484558105, -11.70039176940918, -9.382554054260254, -7.064716339111328, -4.746878623962402, -2.4290409088134766, -0.11120223999023438, 2.2066421508789062, 4.524479866027832, 6.842317581176758, 9.160155296325684, 11.47799301147461, 13.795830726623535, 16.11366844177246, 18.431507110595703, 20.749343872070312, 23.067180633544922, 25.385019302368164, 27.702857971191406, 30.020694732666016, 32.338531494140625, 34.6563720703125, 36.97420883178711, 39.29204559326172, 41.60988235473633, 43.92771911621094, 46.24555969238281, 48.56339645385742, 50.88123321533203, 53.199073791503906, 55.516910552978516, 57.834747314453125, 60.152584075927734, 62.470420837402344, 64.78826141357422, 67.10609436035156, 69.42393493652344, 71.74177551269531, 74.05961608886719, 76.37744903564453]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 6.0, 8.0, 9.0, 14.0, 38.0, 37.0, 83.0, 126.0, 216.0, 372.0, 662.0, 1084.0, 1871.0, 2974.0, 5202.0, 8791.0, 14234.0, 23117.0, 37060.0, 57523.0, 87068.0, 128465.0, 179982.0, 243340.0, 308474.0, 367950.0, 409735.0, 424477.0, 410613.0, 369544.0, 309948.0, 245298.0, 182600.0, 129856.0, 88556.0, 58590.0, 37618.0, 23447.0, 14285.0, 8713.0, 5055.0, 3060.0, 1748.0, 1057.0, 586.0, 340.0, 195.0, 100.0, 62.0, 45.0, 20.0, 10.0, 16.0, 11.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.59375, -46.08349609375, -44.5732421875, -43.06298828125, -41.552734375, -40.04248046875, -38.5322265625, -37.02197265625, -35.51171875, -34.00146484375, -32.4912109375, -30.98095703125, -29.470703125, -27.96044921875, -26.4501953125, -24.93994140625, -23.4296875, -21.91943359375, -20.4091796875, -18.89892578125, -17.388671875, -15.87841796875, -14.3681640625, -12.85791015625, -11.34765625, -9.83740234375, -8.3271484375, -6.81689453125, -5.306640625, -3.79638671875, -2.2861328125, -0.77587890625, 0.734375, 2.24462890625, 3.7548828125, 5.26513671875, 6.775390625, 8.28564453125, 9.7958984375, 11.30615234375, 12.81640625, 14.32666015625, 15.8369140625, 17.34716796875, 18.857421875, 20.36767578125, 21.8779296875, 23.38818359375, 24.8984375, 26.40869140625, 27.9189453125, 29.42919921875, 30.939453125, 32.44970703125, 33.9599609375, 35.47021484375, 36.98046875, 38.49072265625, 40.0009765625, 41.51123046875, 43.021484375, 44.53173828125, 46.0419921875, 47.55224609375, 49.0625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 10.0, 7.0, 6.0, 10.0, 15.0, 16.0, 12.0, 15.0, 20.0, 23.0, 27.0, 31.0, 26.0, 33.0, 27.0, 26.0, 31.0, 47.0, 26.0, 40.0, 49.0, 33.0, 39.0, 46.0, 34.0, 36.0, 39.0, 33.0, 33.0, 28.0, 33.0, 24.0, 19.0, 11.0, 15.0, 13.0, 13.0, 8.0, 9.0, 6.0, 5.0, 1.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.0625, -67.8310546875, -65.599609375, -63.3681640625, -61.13671875, -58.9052734375, -56.673828125, -54.4423828125, -52.2109375, -49.9794921875, -47.748046875, -45.5166015625, -43.28515625, -41.0537109375, -38.822265625, -36.5908203125, -34.359375, -32.1279296875, -29.896484375, -27.6650390625, -25.43359375, -23.2021484375, -20.970703125, -18.7392578125, -16.5078125, -14.2763671875, -12.044921875, -9.8134765625, -7.58203125, -5.3505859375, -3.119140625, -0.8876953125, 1.34375, 3.5751953125, 5.806640625, 8.0380859375, 10.26953125, 12.5009765625, 14.732421875, 16.9638671875, 19.1953125, 21.4267578125, 23.658203125, 25.8896484375, 28.12109375, 30.3525390625, 32.583984375, 34.8154296875, 37.046875, 39.2783203125, 41.509765625, 43.7412109375, 45.97265625, 48.2041015625, 50.435546875, 52.6669921875, 54.8984375, 57.1298828125, 59.361328125, 61.5927734375, 63.82421875, 66.0556640625, 68.287109375, 70.5185546875, 72.75]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 14.0, 23.0, 35.0, 55.0, 114.0, 186.0, 368.0, 542.0, 935.0, 1610.0, 2601.0, 4214.0, 6900.0, 10964.0, 16819.0, 26021.0, 38856.0, 57466.0, 82106.0, 114107.0, 152272.0, 196654.0, 243851.0, 288975.0, 327980.0, 353175.0, 361629.0, 352701.0, 326822.0, 286397.0, 241742.0, 192602.0, 150385.0, 111531.0, 80422.0, 55833.0, 38263.0, 25322.0, 16439.0, 10412.0, 6562.0, 4106.0, 2498.0, 1541.0, 907.0, 565.0, 321.0, 208.0, 108.0, 47.0, 50.0, 19.0, 6.0, 4.0, 4.0, 2.0], "bins": [-49.53125, -48.09423828125, -46.6572265625, -45.22021484375, -43.783203125, -42.34619140625, -40.9091796875, -39.47216796875, -38.03515625, -36.59814453125, -35.1611328125, -33.72412109375, -32.287109375, -30.85009765625, -29.4130859375, -27.97607421875, -26.5390625, -25.10205078125, -23.6650390625, -22.22802734375, -20.791015625, -19.35400390625, -17.9169921875, -16.47998046875, -15.04296875, -13.60595703125, -12.1689453125, -10.73193359375, -9.294921875, -7.85791015625, -6.4208984375, -4.98388671875, -3.546875, -2.10986328125, -0.6728515625, 0.76416015625, 2.201171875, 3.63818359375, 5.0751953125, 6.51220703125, 7.94921875, 9.38623046875, 10.8232421875, 12.26025390625, 13.697265625, 15.13427734375, 16.5712890625, 18.00830078125, 19.4453125, 20.88232421875, 22.3193359375, 23.75634765625, 25.193359375, 26.63037109375, 28.0673828125, 29.50439453125, 30.94140625, 32.37841796875, 33.8154296875, 35.25244140625, 36.689453125, 38.12646484375, 39.5634765625, 41.00048828125, 42.4375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 12.0, 10.0, 21.0, 21.0, 23.0, 28.0, 33.0, 55.0, 68.0, 63.0, 91.0, 92.0, 102.0, 132.0, 141.0, 150.0, 160.0, 155.0, 186.0, 188.0, 190.0, 161.0, 179.0, 185.0, 189.0, 175.0, 189.0, 141.0, 110.0, 136.0, 107.0, 82.0, 91.0, 71.0, 67.0, 55.0, 51.0, 37.0, 28.0, 23.0, 18.0, 8.0, 12.0, 10.0, 1.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-29.796875, -28.88916015625, -27.9814453125, -27.07373046875, -26.166015625, -25.25830078125, -24.3505859375, -23.44287109375, -22.53515625, -21.62744140625, -20.7197265625, -19.81201171875, -18.904296875, -17.99658203125, -17.0888671875, -16.18115234375, -15.2734375, -14.36572265625, -13.4580078125, -12.55029296875, -11.642578125, -10.73486328125, -9.8271484375, -8.91943359375, -8.01171875, -7.10400390625, -6.1962890625, -5.28857421875, -4.380859375, -3.47314453125, -2.5654296875, -1.65771484375, -0.75, 0.15771484375, 1.0654296875, 1.97314453125, 2.880859375, 3.78857421875, 4.6962890625, 5.60400390625, 6.51171875, 7.41943359375, 8.3271484375, 9.23486328125, 10.142578125, 11.05029296875, 11.9580078125, 12.86572265625, 13.7734375, 14.68115234375, 15.5888671875, 16.49658203125, 17.404296875, 18.31201171875, 19.2197265625, 20.12744140625, 21.03515625, 21.94287109375, 22.8505859375, 23.75830078125, 24.666015625, 25.57373046875, 26.4814453125, 27.38916015625, 28.296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 9.0, 6.0, 8.0, 6.0, 4.0, 12.0, 14.0, 12.0, 12.0, 33.0, 16.0, 26.0, 11.0, 27.0, 27.0, 35.0, 30.0, 38.0, 48.0, 40.0, 46.0, 42.0, 41.0, 53.0, 39.0, 29.0, 45.0, 38.0, 40.0, 36.0, 28.0, 23.0, 16.0, 20.0, 20.0, 10.0, 15.0, 11.0, 9.0, 10.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-71.62174987792969, -69.43634796142578, -67.25094604492188, -65.06553649902344, -62.88013458251953, -60.694732666015625, -58.50933074951172, -56.32392883300781, -54.13852310180664, -51.953121185302734, -49.76771545410156, -47.582313537597656, -45.39691162109375, -43.21150588989258, -41.02610397338867, -38.8406982421875, -36.655296325683594, -34.46989440917969, -32.284488677978516, -30.09908676147461, -27.91368293762207, -25.72827911376953, -23.542877197265625, -21.357473373413086, -19.172069549560547, -16.986665725708008, -14.801262855529785, -12.615859985351562, -10.430456161499023, -8.245052337646484, -6.059649467468262, -3.874246597290039, -1.6888351440429688, 0.4965682029724121, 2.681971549987793, 4.867374897003174, 7.052778244018555, 9.238182067871094, 11.423584938049316, 13.608987808227539, 15.794391632080078, 17.979795455932617, 20.165199279785156, 22.350601196289062, 24.5360050201416, 26.72140884399414, 28.906810760498047, 31.092214584350586, 33.277618408203125, 35.46302032470703, 37.6484260559082, 39.83382797241211, 42.01923370361328, 44.20463562011719, 46.390037536621094, 48.575439453125, 50.76084518432617, 52.94624710083008, 55.13165283203125, 57.317054748535156, 59.50245666503906, 61.687862396240234, 63.87326431274414, 66.05867004394531, 68.24407196044922]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 6.0, 7.0, 15.0, 17.0, 10.0, 14.0, 26.0, 21.0, 15.0, 32.0, 31.0, 30.0, 33.0, 39.0, 23.0, 43.0, 37.0, 40.0, 49.0, 42.0, 41.0, 54.0, 34.0, 42.0, 37.0, 28.0, 38.0, 29.0, 20.0, 24.0, 21.0, 13.0, 11.0, 13.0, 13.0, 8.0, 10.0, 5.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-92.8331527709961, -90.14823150634766, -87.46330261230469, -84.77838134765625, -82.09346008300781, -79.40853118896484, -76.7236099243164, -74.03868103027344, -71.353759765625, -68.66883850097656, -65.9839096069336, -63.298988342285156, -60.61406326293945, -57.92913818359375, -55.24421691894531, -52.55929183959961, -49.874366760253906, -47.1894416809082, -44.5045166015625, -41.81959533691406, -39.13467025756836, -36.449745178222656, -33.76482391357422, -31.079898834228516, -28.394973754882812, -25.71004867553711, -23.02512550354004, -20.34020233154297, -17.655277252197266, -14.970353126525879, -12.285429000854492, -9.600505828857422, -6.9155731201171875, -4.230648994445801, -1.545724868774414, 1.1391992568969727, 3.8241233825683594, 6.509047508239746, 9.193971633911133, 11.878894805908203, 14.563819885253906, 17.24874496459961, 19.93366813659668, 22.61859130859375, 25.303516387939453, 27.988441467285156, 30.673364639282227, 33.3582878112793, 36.043212890625, 38.7281379699707, 41.413063049316406, 44.097984313964844, 46.78290939331055, 49.46783447265625, 52.15275573730469, 54.83768081665039, 57.522605895996094, 60.2075309753418, 62.8924560546875, 65.57737731933594, 68.26229858398438, 70.94722747802734, 73.63214874267578, 76.31707763671875, 79.00199890136719]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 2.0, 16.0, 13.0, 21.0, 28.0, 28.0, 64.0, 102.0, 155.0, 258.0, 374.0, 557.0, 847.0, 1395.0, 2158.0, 3431.0, 5278.0, 8209.0, 12581.0, 19029.0, 28774.0, 42122.0, 59198.0, 80196.0, 101198.0, 117153.0, 121476.0, 112464.0, 94320.0, 73283.0, 53352.0, 37194.0, 25552.0, 16873.0, 10972.0, 7217.0, 4376.0, 2974.0, 1915.0, 1230.0, 748.0, 523.0, 310.0, 191.0, 143.0, 85.0, 60.0, 29.0, 36.0, 13.0, 8.0, 10.0, 7.0, 3.0, 4.0, 5.0, 2.0], "bins": [-11.46875, -11.124755859375, -10.78076171875, -10.436767578125, -10.0927734375, -9.748779296875, -9.40478515625, -9.060791015625, -8.716796875, -8.372802734375, -8.02880859375, -7.684814453125, -7.3408203125, -6.996826171875, -6.65283203125, -6.308837890625, -5.96484375, -5.620849609375, -5.27685546875, -4.932861328125, -4.5888671875, -4.244873046875, -3.90087890625, -3.556884765625, -3.212890625, -2.868896484375, -2.52490234375, -2.180908203125, -1.8369140625, -1.492919921875, -1.14892578125, -0.804931640625, -0.4609375, -0.116943359375, 0.22705078125, 0.571044921875, 0.9150390625, 1.259033203125, 1.60302734375, 1.947021484375, 2.291015625, 2.635009765625, 2.97900390625, 3.322998046875, 3.6669921875, 4.010986328125, 4.35498046875, 4.698974609375, 5.04296875, 5.386962890625, 5.73095703125, 6.074951171875, 6.4189453125, 6.762939453125, 7.10693359375, 7.450927734375, 7.794921875, 8.138916015625, 8.48291015625, 8.826904296875, 9.1708984375, 9.514892578125, 9.85888671875, 10.202880859375, 10.546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 6.0, 8.0, 14.0, 17.0, 10.0, 13.0, 24.0, 21.0, 17.0, 32.0, 31.0, 30.0, 32.0, 39.0, 26.0, 41.0, 36.0, 43.0, 43.0, 44.0, 45.0, 53.0, 33.0, 42.0, 37.0, 27.0, 39.0, 29.0, 21.0, 24.0, 22.0, 12.0, 11.0, 13.0, 13.0, 8.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-93.125, -90.431640625, -87.73828125, -85.044921875, -82.3515625, -79.658203125, -76.96484375, -74.271484375, -71.578125, -68.884765625, -66.19140625, -63.498046875, -60.8046875, -58.111328125, -55.41796875, -52.724609375, -50.03125, -47.337890625, -44.64453125, -41.951171875, -39.2578125, -36.564453125, -33.87109375, -31.177734375, -28.484375, -25.791015625, -23.09765625, -20.404296875, -17.7109375, -15.017578125, -12.32421875, -9.630859375, -6.9375, -4.244140625, -1.55078125, 1.142578125, 3.8359375, 6.529296875, 9.22265625, 11.916015625, 14.609375, 17.302734375, 19.99609375, 22.689453125, 25.3828125, 28.076171875, 30.76953125, 33.462890625, 36.15625, 38.849609375, 41.54296875, 44.236328125, 46.9296875, 49.623046875, 52.31640625, 55.009765625, 57.703125, 60.396484375, 63.08984375, 65.783203125, 68.4765625, 71.169921875, 73.86328125, 76.556640625, 79.25]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 9.0, 7.0, 15.0, 27.0, 25.0, 50.0, 59.0, 93.0, 145.0, 186.0, 269.0, 372.0, 547.0, 832.0, 1178.0, 1696.0, 2452.0, 3394.0, 4821.0, 7015.0, 10048.0, 14711.0, 23963.0, 74384.0, 724546.0, 101644.0, 25724.0, 15959.0, 10446.0, 7107.0, 4992.0, 3537.0, 2467.0, 1698.0, 1259.0, 911.0, 585.0, 400.0, 283.0, 209.0, 138.0, 99.0, 78.0, 59.0, 49.0, 19.0, 18.0, 5.0, 11.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0], "bins": [-21.828125, -21.15771484375, -20.4873046875, -19.81689453125, -19.146484375, -18.47607421875, -17.8056640625, -17.13525390625, -16.46484375, -15.79443359375, -15.1240234375, -14.45361328125, -13.783203125, -13.11279296875, -12.4423828125, -11.77197265625, -11.1015625, -10.43115234375, -9.7607421875, -9.09033203125, -8.419921875, -7.74951171875, -7.0791015625, -6.40869140625, -5.73828125, -5.06787109375, -4.3974609375, -3.72705078125, -3.056640625, -2.38623046875, -1.7158203125, -1.04541015625, -0.375, 0.29541015625, 0.9658203125, 1.63623046875, 2.306640625, 2.97705078125, 3.6474609375, 4.31787109375, 4.98828125, 5.65869140625, 6.3291015625, 6.99951171875, 7.669921875, 8.34033203125, 9.0107421875, 9.68115234375, 10.3515625, 11.02197265625, 11.6923828125, 12.36279296875, 13.033203125, 13.70361328125, 14.3740234375, 15.04443359375, 15.71484375, 16.38525390625, 17.0556640625, 17.72607421875, 18.396484375, 19.06689453125, 19.7373046875, 20.40771484375, 21.078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 6.0, 8.0, 18.0, 14.0, 17.0, 20.0, 8.0, 17.0, 25.0, 12.0, 21.0, 29.0, 31.0, 36.0, 27.0, 39.0, 37.0, 37.0, 42.0, 36.0, 35.0, 40.0, 40.0, 36.0, 32.0, 31.0, 33.0, 30.0, 14.0, 30.0, 22.0, 21.0, 16.0, 26.0, 17.0, 18.0, 14.0, 16.0, 8.0, 5.0, 7.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.71875, -47.09619140625, -45.4736328125, -43.85107421875, -42.228515625, -40.60595703125, -38.9833984375, -37.36083984375, -35.73828125, -34.11572265625, -32.4931640625, -30.87060546875, -29.248046875, -27.62548828125, -26.0029296875, -24.38037109375, -22.7578125, -21.13525390625, -19.5126953125, -17.89013671875, -16.267578125, -14.64501953125, -13.0224609375, -11.39990234375, -9.77734375, -8.15478515625, -6.5322265625, -4.90966796875, -3.287109375, -1.66455078125, -0.0419921875, 1.58056640625, 3.203125, 4.82568359375, 6.4482421875, 8.07080078125, 9.693359375, 11.31591796875, 12.9384765625, 14.56103515625, 16.18359375, 17.80615234375, 19.4287109375, 21.05126953125, 22.673828125, 24.29638671875, 25.9189453125, 27.54150390625, 29.1640625, 30.78662109375, 32.4091796875, 34.03173828125, 35.654296875, 37.27685546875, 38.8994140625, 40.52197265625, 42.14453125, 43.76708984375, 45.3896484375, 47.01220703125, 48.634765625, 50.25732421875, 51.8798828125, 53.50244140625, 55.125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 10.0, 4.0, 11.0, 14.0, 30.0, 40.0, 58.0, 80.0, 144.0, 211.0, 331.0, 531.0, 927.0, 1444.0, 2398.0, 4215.0, 6922.0, 11918.0, 20799.0, 40820.0, 817038.0, 79921.0, 25590.0, 14505.0, 8258.0, 4765.0, 2925.0, 1761.0, 1099.0, 625.0, 435.0, 255.0, 166.0, 100.0, 59.0, 42.0, 24.0, 19.0, 21.0, 9.0, 6.0, 2.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.640625, -2.5416259765625, -2.442626953125, -2.3436279296875, -2.24462890625, -2.1456298828125, -2.046630859375, -1.9476318359375, -1.8486328125, -1.7496337890625, -1.650634765625, -1.5516357421875, -1.45263671875, -1.3536376953125, -1.254638671875, -1.1556396484375, -1.056640625, -0.9576416015625, -0.858642578125, -0.7596435546875, -0.66064453125, -0.5616455078125, -0.462646484375, -0.3636474609375, -0.2646484375, -0.1656494140625, -0.066650390625, 0.0323486328125, 0.13134765625, 0.2303466796875, 0.329345703125, 0.4283447265625, 0.52734375, 0.6263427734375, 0.725341796875, 0.8243408203125, 0.92333984375, 1.0223388671875, 1.121337890625, 1.2203369140625, 1.3193359375, 1.4183349609375, 1.517333984375, 1.6163330078125, 1.71533203125, 1.8143310546875, 1.913330078125, 2.0123291015625, 2.111328125, 2.2103271484375, 2.309326171875, 2.4083251953125, 2.50732421875, 2.6063232421875, 2.705322265625, 2.8043212890625, 2.9033203125, 3.0023193359375, 3.101318359375, 3.2003173828125, 3.29931640625, 3.3983154296875, 3.497314453125, 3.5963134765625, 3.6953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 6.0, 6.0, 13.0, 17.0, 13.0, 22.0, 20.0, 21.0, 21.0, 40.0, 37.0, 42.0, 48.0, 44.0, 46.0, 52.0, 53.0, 42.0, 54.0, 45.0, 50.0, 40.0, 41.0, 22.0, 30.0, 30.0, 13.0, 26.0, 22.0, 14.0, 19.0, 10.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.185075759887695e-05, -8.923280984163284e-05, -8.661486208438873e-05, -8.399691432714462e-05, -8.137896656990051e-05, -7.87610188126564e-05, -7.614307105541229e-05, -7.352512329816818e-05, -7.090717554092407e-05, -6.828922778367996e-05, -6.567128002643585e-05, -6.305333226919174e-05, -6.043538451194763e-05, -5.781743675470352e-05, -5.519948899745941e-05, -5.25815412402153e-05, -4.996359348297119e-05, -4.734564572572708e-05, -4.472769796848297e-05, -4.210975021123886e-05, -3.949180245399475e-05, -3.687385469675064e-05, -3.425590693950653e-05, -3.163795918226242e-05, -2.902001142501831e-05, -2.64020636677742e-05, -2.378411591053009e-05, -2.116616815328598e-05, -1.854822039604187e-05, -1.593027263879776e-05, -1.331232488155365e-05, -1.069437712430954e-05, -8.07642936706543e-06, -5.45848160982132e-06, -2.8405338525772095e-06, -2.2258609533309937e-07, 2.3953616619110107e-06, 5.013309419155121e-06, 7.631257176399231e-06, 1.0249204933643341e-05, 1.2867152690887451e-05, 1.548510044813156e-05, 1.810304820537567e-05, 2.072099596261978e-05, 2.333894371986389e-05, 2.5956891477108002e-05, 2.8574839234352112e-05, 3.119278699159622e-05, 3.381073474884033e-05, 3.642868250608444e-05, 3.904663026332855e-05, 4.166457802057266e-05, 4.428252577781677e-05, 4.690047353506088e-05, 4.951842129230499e-05, 5.21363690495491e-05, 5.475431680679321e-05, 5.737226456403732e-05, 5.999021232128143e-05, 6.260816007852554e-05, 6.522610783576965e-05, 6.784405559301376e-05, 7.046200335025787e-05, 7.307995110750198e-05, 7.56978988647461e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 14.0, 12.0, 18.0, 38.0, 64.0, 119.0, 200.0, 303.0, 476.0, 866.0, 1548.0, 2549.0, 4217.0, 7221.0, 12463.0, 21180.0, 34973.0, 57077.0, 91183.0, 134474.0, 171199.0, 166988.0, 125995.0, 83971.0, 52424.0, 32261.0, 19117.0, 11356.0, 6721.0, 3987.0, 2289.0, 1353.0, 751.0, 462.0, 273.0, 144.0, 101.0, 59.0, 44.0, 23.0, 12.0, 11.0, 11.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.78515625, -2.6978759765625, -2.610595703125, -2.5233154296875, -2.43603515625, -2.3487548828125, -2.261474609375, -2.1741943359375, -2.0869140625, -1.9996337890625, -1.912353515625, -1.8250732421875, -1.73779296875, -1.6505126953125, -1.563232421875, -1.4759521484375, -1.388671875, -1.3013916015625, -1.214111328125, -1.1268310546875, -1.03955078125, -0.9522705078125, -0.864990234375, -0.7777099609375, -0.6904296875, -0.6031494140625, -0.515869140625, -0.4285888671875, -0.34130859375, -0.2540283203125, -0.166748046875, -0.0794677734375, 0.0078125, 0.0950927734375, 0.182373046875, 0.2696533203125, 0.35693359375, 0.4442138671875, 0.531494140625, 0.6187744140625, 0.7060546875, 0.7933349609375, 0.880615234375, 0.9678955078125, 1.05517578125, 1.1424560546875, 1.229736328125, 1.3170166015625, 1.404296875, 1.4915771484375, 1.578857421875, 1.6661376953125, 1.75341796875, 1.8406982421875, 1.927978515625, 2.0152587890625, 2.1025390625, 2.1898193359375, 2.277099609375, 2.3643798828125, 2.45166015625, 2.5389404296875, 2.626220703125, 2.7135009765625, 2.80078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 14.0, 10.0, 15.0, 15.0, 14.0, 16.0, 18.0, 25.0, 33.0, 30.0, 36.0, 41.0, 40.0, 57.0, 42.0, 39.0, 47.0, 56.0, 54.0, 53.0, 53.0, 34.0, 34.0, 36.0, 22.0, 25.0, 22.0, 26.0, 15.0, 14.0, 7.0, 7.0, 6.0, 3.0, 12.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3271484375, -1.2866668701171875, -1.246185302734375, -1.2057037353515625, -1.16522216796875, -1.1247406005859375, -1.084259033203125, -1.0437774658203125, -1.0032958984375, -0.9628143310546875, -0.922332763671875, -0.8818511962890625, -0.84136962890625, -0.8008880615234375, -0.760406494140625, -0.7199249267578125, -0.679443359375, -0.6389617919921875, -0.598480224609375, -0.5579986572265625, -0.51751708984375, -0.4770355224609375, -0.436553955078125, -0.3960723876953125, -0.3555908203125, -0.3151092529296875, -0.274627685546875, -0.2341461181640625, -0.19366455078125, -0.1531829833984375, -0.112701416015625, -0.0722198486328125, -0.03173828125, 0.0087432861328125, 0.049224853515625, 0.0897064208984375, 0.13018798828125, 0.1706695556640625, 0.211151123046875, 0.2516326904296875, 0.2921142578125, 0.3325958251953125, 0.373077392578125, 0.4135589599609375, 0.45404052734375, 0.4945220947265625, 0.535003662109375, 0.5754852294921875, 0.615966796875, 0.6564483642578125, 0.696929931640625, 0.7374114990234375, 0.77789306640625, 0.8183746337890625, 0.858856201171875, 0.8993377685546875, 0.9398193359375, 0.9803009033203125, 1.020782470703125, 1.0612640380859375, 1.10174560546875, 1.1422271728515625, 1.182708740234375, 1.2231903076171875, 1.263671875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 11.0, 5.0, 9.0, 5.0, 5.0, 13.0, 9.0, 17.0, 16.0, 27.0, 21.0, 21.0, 18.0, 32.0, 24.0, 35.0, 30.0, 37.0, 53.0, 46.0, 36.0, 43.0, 54.0, 34.0, 47.0, 35.0, 41.0, 38.0, 35.0, 29.0, 34.0, 22.0, 23.0, 16.0, 13.0, 13.0, 11.0, 8.0, 12.0, 9.0, 3.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.83599090576172, -68.6427001953125, -66.44940948486328, -64.25611114501953, -62.06282043457031, -59.869529724121094, -57.676239013671875, -55.482948303222656, -53.28965377807617, -51.09636306762695, -48.90306854248047, -46.70977783203125, -44.51648712158203, -42.32319259643555, -40.12990188598633, -37.936607360839844, -35.743316650390625, -33.550025939941406, -31.356731414794922, -29.163440704345703, -26.97014808654785, -24.77685546875, -22.58356475830078, -20.39027214050293, -18.196979522705078, -16.003686904907227, -13.810395240783691, -11.617103576660156, -9.423810958862305, -7.230518341064453, -5.037226676940918, -2.843935012817383, -0.6506423950195312, 1.542649745941162, 3.7359418869018555, 5.929234027862549, 8.122526168823242, 10.315818786621094, 12.509110450744629, 14.702402114868164, 16.895694732666016, 19.088987350463867, 21.28227996826172, 23.475570678710938, 25.66886329650879, 27.86215591430664, 30.05544662475586, 32.248741149902344, 34.44203186035156, 36.63532257080078, 38.828617095947266, 41.021907806396484, 43.21520233154297, 45.40849304199219, 47.601783752441406, 49.795074462890625, 51.98836898803711, 54.18165969848633, 56.37495422363281, 58.56824493408203, 60.76153564453125, 62.954830169677734, 65.14812469482422, 67.34141540527344, 69.53470611572266]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 10.0, 11.0, 18.0, 12.0, 11.0, 25.0, 21.0, 17.0, 29.0, 29.0, 29.0, 32.0, 45.0, 24.0, 38.0, 37.0, 41.0, 44.0, 41.0, 43.0, 60.0, 34.0, 40.0, 33.0, 32.0, 38.0, 31.0, 21.0, 26.0, 17.0, 18.0, 12.0, 10.0, 12.0, 9.0, 10.0, 7.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-93.45228576660156, -90.76252746582031, -88.07276916503906, -85.38300323486328, -82.69324493408203, -80.00348663330078, -77.313720703125, -74.62396240234375, -71.9342041015625, -69.24444580078125, -66.5546875, -63.86492156982422, -61.17516326904297, -58.48540496826172, -55.7956428527832, -53.10588073730469, -50.41612243652344, -47.72636413574219, -45.03660202026367, -42.346839904785156, -39.657081604003906, -36.967323303222656, -34.27756118774414, -31.587800979614258, -28.898040771484375, -26.208280563354492, -23.51852035522461, -20.828760147094727, -18.138999938964844, -15.449239730834961, -12.759479522705078, -10.069719314575195, -7.3799591064453125, -4.69019889831543, -2.000438690185547, 0.6893215179443359, 3.3790817260742188, 6.068841934204102, 8.758602142333984, 11.448362350463867, 14.13812255859375, 16.827882766723633, 19.517642974853516, 22.2074031829834, 24.89716339111328, 27.586923599243164, 30.276683807373047, 32.96644592285156, 35.65620422363281, 38.34596252441406, 41.03572463989258, 43.725486755371094, 46.415245056152344, 49.105003356933594, 51.79476547241211, 54.484527587890625, 57.174285888671875, 59.864044189453125, 62.55380630493164, 65.24356842041016, 67.9333267211914, 70.62308502197266, 73.31285095214844, 76.00260925292969, 78.69236755371094]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 12.0, 20.0, 34.0, 47.0, 111.0, 140.0, 215.0, 443.0, 662.0, 1145.0, 1737.0, 2901.0, 4831.0, 7677.0, 11948.0, 18496.0, 27974.0, 39692.0, 54878.0, 70863.0, 86648.0, 99660.0, 106413.0, 105433.0, 97258.0, 83167.0, 67487.0, 50953.0, 36527.0, 25468.0, 16766.0, 11006.0, 6938.0, 4235.0, 2617.0, 1585.0, 1020.0, 631.0, 376.0, 207.0, 148.0, 87.0, 39.0, 31.0, 13.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.625, -42.11474609375, -40.6044921875, -39.09423828125, -37.583984375, -36.07373046875, -34.5634765625, -33.05322265625, -31.54296875, -30.03271484375, -28.5224609375, -27.01220703125, -25.501953125, -23.99169921875, -22.4814453125, -20.97119140625, -19.4609375, -17.95068359375, -16.4404296875, -14.93017578125, -13.419921875, -11.90966796875, -10.3994140625, -8.88916015625, -7.37890625, -5.86865234375, -4.3583984375, -2.84814453125, -1.337890625, 0.17236328125, 1.6826171875, 3.19287109375, 4.703125, 6.21337890625, 7.7236328125, 9.23388671875, 10.744140625, 12.25439453125, 13.7646484375, 15.27490234375, 16.78515625, 18.29541015625, 19.8056640625, 21.31591796875, 22.826171875, 24.33642578125, 25.8466796875, 27.35693359375, 28.8671875, 30.37744140625, 31.8876953125, 33.39794921875, 34.908203125, 36.41845703125, 37.9287109375, 39.43896484375, 40.94921875, 42.45947265625, 43.9697265625, 45.47998046875, 46.990234375, 48.50048828125, 50.0107421875, 51.52099609375, 53.03125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 9.0, 13.0, 16.0, 13.0, 10.0, 25.0, 20.0, 20.0, 28.0, 25.0, 31.0, 32.0, 47.0, 23.0, 38.0, 38.0, 40.0, 43.0, 46.0, 43.0, 57.0, 36.0, 37.0, 34.0, 31.0, 43.0, 27.0, 23.0, 24.0, 19.0, 15.0, 15.0, 7.0, 13.0, 9.0, 11.0, 8.0, 2.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-92.6875, -90.01953125, -87.3515625, -84.68359375, -82.015625, -79.34765625, -76.6796875, -74.01171875, -71.34375, -68.67578125, -66.0078125, -63.33984375, -60.671875, -58.00390625, -55.3359375, -52.66796875, -50.0, -47.33203125, -44.6640625, -41.99609375, -39.328125, -36.66015625, -33.9921875, -31.32421875, -28.65625, -25.98828125, -23.3203125, -20.65234375, -17.984375, -15.31640625, -12.6484375, -9.98046875, -7.3125, -4.64453125, -1.9765625, 0.69140625, 3.359375, 6.02734375, 8.6953125, 11.36328125, 14.03125, 16.69921875, 19.3671875, 22.03515625, 24.703125, 27.37109375, 30.0390625, 32.70703125, 35.375, 38.04296875, 40.7109375, 43.37890625, 46.046875, 48.71484375, 51.3828125, 54.05078125, 56.71875, 59.38671875, 62.0546875, 64.72265625, 67.390625, 70.05859375, 72.7265625, 75.39453125, 78.0625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 6.0, 3.0, 9.0, 9.0, 22.0, 32.0, 68.0, 71.0, 103.0, 153.0, 271.0, 414.0, 631.0, 995.0, 1500.0, 2304.0, 3505.0, 5185.0, 7791.0, 11432.0, 16503.0, 23059.0, 31627.0, 42442.0, 54730.0, 66771.0, 78688.0, 88135.0, 91781.0, 91967.0, 86992.0, 77478.0, 66007.0, 53362.0, 41624.0, 31005.0, 22592.0, 15928.0, 11040.0, 7514.0, 5101.0, 3404.0, 2209.0, 1364.0, 961.0, 616.0, 423.0, 274.0, 183.0, 111.0, 58.0, 43.0, 35.0, 15.0, 11.0, 6.0, 3.0, 1.0, 4.0, 2.0], "bins": [-47.28125, -45.8466796875, -44.412109375, -42.9775390625, -41.54296875, -40.1083984375, -38.673828125, -37.2392578125, -35.8046875, -34.3701171875, -32.935546875, -31.5009765625, -30.06640625, -28.6318359375, -27.197265625, -25.7626953125, -24.328125, -22.8935546875, -21.458984375, -20.0244140625, -18.58984375, -17.1552734375, -15.720703125, -14.2861328125, -12.8515625, -11.4169921875, -9.982421875, -8.5478515625, -7.11328125, -5.6787109375, -4.244140625, -2.8095703125, -1.375, 0.0595703125, 1.494140625, 2.9287109375, 4.36328125, 5.7978515625, 7.232421875, 8.6669921875, 10.1015625, 11.5361328125, 12.970703125, 14.4052734375, 15.83984375, 17.2744140625, 18.708984375, 20.1435546875, 21.578125, 23.0126953125, 24.447265625, 25.8818359375, 27.31640625, 28.7509765625, 30.185546875, 31.6201171875, 33.0546875, 34.4892578125, 35.923828125, 37.3583984375, 38.79296875, 40.2275390625, 41.662109375, 43.0966796875, 44.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 8.0, 14.0, 12.0, 15.0, 19.0, 25.0, 20.0, 16.0, 28.0, 28.0, 36.0, 39.0, 36.0, 40.0, 42.0, 37.0, 49.0, 43.0, 38.0, 37.0, 29.0, 35.0, 49.0, 32.0, 34.0, 30.0, 23.0, 17.0, 24.0, 26.0, 16.0, 18.0, 15.0, 10.0, 8.0, 8.0, 9.0, 10.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.03125, -50.24755859375, -48.4638671875, -46.68017578125, -44.896484375, -43.11279296875, -41.3291015625, -39.54541015625, -37.76171875, -35.97802734375, -34.1943359375, -32.41064453125, -30.626953125, -28.84326171875, -27.0595703125, -25.27587890625, -23.4921875, -21.70849609375, -19.9248046875, -18.14111328125, -16.357421875, -14.57373046875, -12.7900390625, -11.00634765625, -9.22265625, -7.43896484375, -5.6552734375, -3.87158203125, -2.087890625, -0.30419921875, 1.4794921875, 3.26318359375, 5.046875, 6.83056640625, 8.6142578125, 10.39794921875, 12.181640625, 13.96533203125, 15.7490234375, 17.53271484375, 19.31640625, 21.10009765625, 22.8837890625, 24.66748046875, 26.451171875, 28.23486328125, 30.0185546875, 31.80224609375, 33.5859375, 35.36962890625, 37.1533203125, 38.93701171875, 40.720703125, 42.50439453125, 44.2880859375, 46.07177734375, 47.85546875, 49.63916015625, 51.4228515625, 53.20654296875, 54.990234375, 56.77392578125, 58.5576171875, 60.34130859375, 62.125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 11.0, 7.0, 18.0, 13.0, 38.0, 61.0, 100.0, 161.0, 280.0, 485.0, 790.0, 1352.0, 2301.0, 4096.0, 6875.0, 11507.0, 19034.0, 30302.0, 45594.0, 65563.0, 87105.0, 107075.0, 119980.0, 122091.0, 112278.0, 94523.0, 72608.0, 52559.0, 35335.0, 22484.0, 13991.0, 8297.0, 4948.0, 2803.0, 1631.0, 925.0, 538.0, 310.0, 186.0, 116.0, 67.0, 43.0, 31.0, 20.0, 11.0, 6.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-23.578125, -22.867431640625, -22.15673828125, -21.446044921875, -20.7353515625, -20.024658203125, -19.31396484375, -18.603271484375, -17.892578125, -17.181884765625, -16.47119140625, -15.760498046875, -15.0498046875, -14.339111328125, -13.62841796875, -12.917724609375, -12.20703125, -11.496337890625, -10.78564453125, -10.074951171875, -9.3642578125, -8.653564453125, -7.94287109375, -7.232177734375, -6.521484375, -5.810791015625, -5.10009765625, -4.389404296875, -3.6787109375, -2.968017578125, -2.25732421875, -1.546630859375, -0.8359375, -0.125244140625, 0.58544921875, 1.296142578125, 2.0068359375, 2.717529296875, 3.42822265625, 4.138916015625, 4.849609375, 5.560302734375, 6.27099609375, 6.981689453125, 7.6923828125, 8.403076171875, 9.11376953125, 9.824462890625, 10.53515625, 11.245849609375, 11.95654296875, 12.667236328125, 13.3779296875, 14.088623046875, 14.79931640625, 15.510009765625, 16.220703125, 16.931396484375, 17.64208984375, 18.352783203125, 19.0634765625, 19.774169921875, 20.48486328125, 21.195556640625, 21.90625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 8.0, 8.0, 11.0, 14.0, 25.0, 19.0, 26.0, 18.0, 38.0, 49.0, 30.0, 46.0, 49.0, 39.0, 47.0, 57.0, 49.0, 48.0, 47.0, 42.0, 45.0, 37.0, 31.0, 34.0, 32.0, 23.0, 21.0, 16.0, 14.0, 18.0, 11.0, 8.0, 8.0, 7.0, 9.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0028400421142578125, -0.0027502477169036865, -0.0026604533195495605, -0.0025706589221954346, -0.0024808645248413086, -0.0023910701274871826, -0.0023012757301330566, -0.0022114813327789307, -0.0021216869354248047, -0.0020318925380706787, -0.0019420981407165527, -0.0018523037433624268, -0.0017625093460083008, -0.0016727149486541748, -0.0015829205513000488, -0.0014931261539459229, -0.0014033317565917969, -0.001313537359237671, -0.001223742961883545, -0.001133948564529419, -0.001044154167175293, -0.000954359769821167, -0.000864565372467041, -0.000774770975112915, -0.0006849765777587891, -0.0005951821804046631, -0.0005053877830505371, -0.00041559338569641113, -0.00032579898834228516, -0.00023600459098815918, -0.0001462101936340332, -5.6415796279907227e-05, 3.337860107421875e-05, 0.00012317299842834473, 0.0002129673957824707, 0.0003027617931365967, 0.00039255619049072266, 0.00048235058784484863, 0.0005721449851989746, 0.0006619393825531006, 0.0007517337799072266, 0.0008415281772613525, 0.0009313225746154785, 0.0010211169719696045, 0.0011109113693237305, 0.0012007057666778564, 0.0012905001640319824, 0.0013802945613861084, 0.0014700889587402344, 0.0015598833560943604, 0.0016496777534484863, 0.0017394721508026123, 0.0018292665481567383, 0.0019190609455108643, 0.0020088553428649902, 0.002098649740219116, 0.002188444137573242, 0.002278238534927368, 0.002368032932281494, 0.00245782732963562, 0.002547621726989746, 0.002637416124343872, 0.002727210521697998, 0.002817004919052124, 0.00290679931640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 10.0, 14.0, 18.0, 31.0, 34.0, 63.0, 101.0, 174.0, 277.0, 415.0, 652.0, 1083.0, 1661.0, 2605.0, 4134.0, 6115.0, 9402.0, 13553.0, 19606.0, 27198.0, 37052.0, 47712.0, 59921.0, 71899.0, 82279.0, 89032.0, 91428.0, 89238.0, 82608.0, 73386.0, 61071.0, 48568.0, 37712.0, 27819.0, 20028.0, 13964.0, 9401.0, 6433.0, 4274.0, 2799.0, 1804.0, 1067.0, 768.0, 412.0, 262.0, 173.0, 110.0, 82.0, 47.0, 30.0, 11.0, 10.0, 7.0, 5.0, 4.0, 0.0, 1.0, 2.0], "bins": [-17.953125, -17.4013671875, -16.849609375, -16.2978515625, -15.74609375, -15.1943359375, -14.642578125, -14.0908203125, -13.5390625, -12.9873046875, -12.435546875, -11.8837890625, -11.33203125, -10.7802734375, -10.228515625, -9.6767578125, -9.125, -8.5732421875, -8.021484375, -7.4697265625, -6.91796875, -6.3662109375, -5.814453125, -5.2626953125, -4.7109375, -4.1591796875, -3.607421875, -3.0556640625, -2.50390625, -1.9521484375, -1.400390625, -0.8486328125, -0.296875, 0.2548828125, 0.806640625, 1.3583984375, 1.91015625, 2.4619140625, 3.013671875, 3.5654296875, 4.1171875, 4.6689453125, 5.220703125, 5.7724609375, 6.32421875, 6.8759765625, 7.427734375, 7.9794921875, 8.53125, 9.0830078125, 9.634765625, 10.1865234375, 10.73828125, 11.2900390625, 11.841796875, 12.3935546875, 12.9453125, 13.4970703125, 14.048828125, 14.6005859375, 15.15234375, 15.7041015625, 16.255859375, 16.8076171875, 17.359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 11.0, 4.0, 12.0, 18.0, 22.0, 18.0, 24.0, 35.0, 36.0, 31.0, 38.0, 39.0, 38.0, 47.0, 41.0, 36.0, 56.0, 44.0, 41.0, 47.0, 33.0, 51.0, 37.0, 34.0, 32.0, 28.0, 27.0, 21.0, 18.0, 13.0, 9.0, 9.0, 8.0, 7.0, 7.0, 8.0, 4.0, 4.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.8963623046875, -9.573974609375, -9.2515869140625, -8.92919921875, -8.6068115234375, -8.284423828125, -7.9620361328125, -7.6396484375, -7.3172607421875, -6.994873046875, -6.6724853515625, -6.35009765625, -6.0277099609375, -5.705322265625, -5.3829345703125, -5.060546875, -4.7381591796875, -4.415771484375, -4.0933837890625, -3.77099609375, -3.4486083984375, -3.126220703125, -2.8038330078125, -2.4814453125, -2.1590576171875, -1.836669921875, -1.5142822265625, -1.19189453125, -0.8695068359375, -0.547119140625, -0.2247314453125, 0.09765625, 0.4200439453125, 0.742431640625, 1.0648193359375, 1.38720703125, 1.7095947265625, 2.031982421875, 2.3543701171875, 2.6767578125, 2.9991455078125, 3.321533203125, 3.6439208984375, 3.96630859375, 4.2886962890625, 4.611083984375, 4.9334716796875, 5.255859375, 5.5782470703125, 5.900634765625, 6.2230224609375, 6.54541015625, 6.8677978515625, 7.190185546875, 7.5125732421875, 7.8349609375, 8.1573486328125, 8.479736328125, 8.8021240234375, 9.12451171875, 9.4468994140625, 9.769287109375, 10.0916748046875, 10.4140625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 7.0, 2.0, 12.0, 6.0, 11.0, 14.0, 16.0, 17.0, 24.0, 17.0, 21.0, 22.0, 29.0, 26.0, 27.0, 29.0, 33.0, 36.0, 51.0, 37.0, 33.0, 45.0, 40.0, 43.0, 39.0, 36.0, 42.0, 36.0, 36.0, 28.0, 23.0, 15.0, 19.0, 18.0, 12.0, 12.0, 19.0, 10.0, 9.0, 11.0, 10.0, 2.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-73.91032409667969, -71.82327270507812, -69.73622131347656, -67.64917755126953, -65.56212615966797, -63.475074768066406, -61.38802719116211, -59.30097961425781, -57.21392822265625, -55.12687683105469, -53.03982925415039, -50.952781677246094, -48.86573028564453, -46.77867889404297, -44.69163131713867, -42.604583740234375, -40.51753234863281, -38.43048095703125, -36.34343338012695, -34.256385803222656, -32.169334411621094, -30.082284927368164, -27.995235443115234, -25.908185958862305, -23.821136474609375, -21.734086990356445, -19.647037506103516, -17.559988021850586, -15.472938537597656, -13.385889053344727, -11.298839569091797, -9.211790084838867, -7.124744415283203, -5.037694931030273, -2.9506454467773438, -0.8635959625244141, 1.2234535217285156, 3.3105030059814453, 5.397552490234375, 7.484601974487305, 9.571651458740234, 11.658700942993164, 13.745750427246094, 15.832799911499023, 17.919849395751953, 20.006898880004883, 22.093948364257812, 24.180997848510742, 26.268047332763672, 28.3550968170166, 30.44214630126953, 32.529197692871094, 34.61624526977539, 36.70329284667969, 38.79034423828125, 40.87739562988281, 42.96444320678711, 45.051490783691406, 47.13854217529297, 49.22559356689453, 51.31264114379883, 53.399688720703125, 55.48674011230469, 57.57379150390625, 59.66083908081055]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 5.0, 2.0, 9.0, 4.0, 15.0, 9.0, 13.0, 21.0, 20.0, 16.0, 19.0, 27.0, 32.0, 30.0, 32.0, 31.0, 45.0, 42.0, 39.0, 36.0, 51.0, 45.0, 48.0, 36.0, 47.0, 42.0, 53.0, 36.0, 23.0, 24.0, 16.0, 13.0, 10.0, 21.0, 16.0, 12.0, 9.0, 9.0, 4.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-97.46207427978516, -94.4552993774414, -91.44853210449219, -88.44175720214844, -85.43498229980469, -82.42821502685547, -79.42144012451172, -76.4146728515625, -73.40789794921875, -70.401123046875, -67.39435577392578, -64.38758087158203, -61.38080978393555, -58.37403869628906, -55.36726379394531, -52.36049270629883, -49.353721618652344, -46.34695053100586, -43.340179443359375, -40.333404541015625, -37.32663345336914, -34.319862365722656, -31.31308937072754, -28.306316375732422, -25.299545288085938, -22.292774200439453, -19.286001205444336, -16.27922821044922, -13.272457122802734, -10.265685081481934, -7.258913040161133, -4.252140045166016, -1.245361328125, 1.7614107131958008, 4.768182754516602, 7.774954795837402, 10.781726837158203, 13.788498878479004, 16.795270919799805, 19.802043914794922, 22.808815002441406, 25.81558609008789, 28.822359085083008, 31.829132080078125, 34.83590316772461, 37.842674255371094, 40.849449157714844, 43.85622024536133, 46.86299133300781, 49.8697624206543, 52.87653350830078, 55.88330841064453, 58.890079498291016, 61.8968505859375, 64.90362548828125, 67.910400390625, 70.91716766357422, 73.92394256591797, 76.93070983886719, 79.93748474121094, 82.94425964355469, 85.9510269165039, 88.95780181884766, 91.96456909179688, 94.97134399414062]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 1.0, 5.0, 9.0, 8.0, 12.0, 18.0, 30.0, 46.0, 45.0, 61.0, 86.0, 133.0, 173.0, 212.0, 318.0, 467.0, 525.0, 647.0, 858.0, 1179.0, 1432.0, 1762.0, 2116.0, 2523.0, 2869.0, 3354.0, 1009523.0, 4180.0, 3228.0, 2842.0, 2398.0, 1986.0, 1670.0, 1310.0, 1052.0, 854.0, 652.0, 509.0, 365.0, 290.0, 251.0, 180.0, 122.0, 89.0, 62.0, 44.0, 26.0, 19.0, 23.0, 15.0, 7.0, 6.0, 6.0, 2.0, 8.0, 3.0], "bins": [-596.8502197265625, -579.7380981445312, -562.6259155273438, -545.5137939453125, -528.4016723632812, -511.2895202636719, -494.1773681640625, -477.06524658203125, -459.9530944824219, -442.8409423828125, -425.72882080078125, -408.6166687011719, -391.5045166015625, -374.39239501953125, -357.2802429199219, -340.1680908203125, -323.05596923828125, -305.9438171386719, -288.8316955566406, -271.71954345703125, -254.60740661621094, -237.49526977539062, -220.38311767578125, -203.27098083496094, -186.15884399414062, -169.0467071533203, -151.9345703125, -134.82241821289062, -117.71028137207031, -100.59814453125, -83.48600006103516, -66.37385559082031, -49.261688232421875, -32.1495475769043, -15.037406921386719, 2.0747337341308594, 19.186874389648438, 36.29901123046875, 53.411155700683594, 70.52330017089844, 87.63543701171875, 104.74757385253906, 121.8597183227539, 138.97186279296875, 156.08399963378906, 173.19613647460938, 190.30828857421875, 207.42042541503906, 224.53256225585938, 241.6446990966797, 258.7568359375, 275.8689880371094, 292.98114013671875, 310.09326171875, 327.2054138183594, 344.31756591796875, 361.4296875, 378.5418395996094, 395.6539611816406, 412.76611328125, 429.87823486328125, 446.9903869628906, 464.1025390625, 481.21466064453125, 498.3268127441406]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 13.0, 16.0, 18.0, 32.0, 47.0, 70.0, 116.0, 170.0, 250.0, 357.0, 509.0, 735.0, 1129.0, 1613.0, 2294.0, 3526.0, 5220.0, 8417.0, 15285.0, 33200.0, 51317824.0, 37883.0, 16696.0, 8907.0, 5475.0, 3691.0, 2394.0, 1714.0, 1191.0, 830.0, 555.0, 411.0, 232.0, 171.0, 119.0, 66.0, 60.0, 37.0, 28.0, 13.0, 9.0, 10.0, 8.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-682.1965942382812, -659.1227416992188, -636.0489501953125, -612.97509765625, -589.9012451171875, -566.8274536132812, -543.7536010742188, -520.6798095703125, -497.60595703125, -474.5321350097656, -451.4582824707031, -428.38446044921875, -405.3106384277344, -382.23681640625, -359.1629638671875, -336.0891418457031, -313.0152893066406, -289.94146728515625, -266.86761474609375, -243.79379272460938, -220.719970703125, -197.64613342285156, -174.57229614257812, -151.49847412109375, -128.4246368408203, -105.3508071899414, -82.2769775390625, -59.20314025878906, -36.129310607910156, -13.05548095703125, 10.018356323242188, 33.09217834472656, 56.166015625, 79.2398452758789, 102.31367492675781, 125.38751220703125, 148.46133422851562, 171.53517150878906, 194.6090087890625, 217.68283081054688, 240.7566680908203, 263.83050537109375, 286.9043273925781, 309.9781494140625, 333.052001953125, 356.1258239746094, 379.19964599609375, 402.27349853515625, 425.3473205566406, 448.421142578125, 471.4949951171875, 494.5688171386719, 517.6426391601562, 540.7164916992188, 563.790283203125, 586.8641357421875, 609.93798828125, 633.0118408203125, 656.0856323242188, 679.1594848632812, 702.2333374023438, 725.30712890625, 748.3809814453125, 771.454833984375, 794.5286254882812]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 5.0, 12.0, 11.0, 12.0, 9.0, 21.0, 29.0, 28.0, 45.0, 47.0, 64.0, 63.0, 89.0, 82.0, 74.0, 84.0, 62.0, 47.0, 51.0, 34.0, 29.0, 23.0, 17.0, 14.0, 11.0, 9.0, 6.0, 4.0, 6.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-522.4603271484375, -500.36871337890625, -478.277099609375, -456.18548583984375, -434.0938720703125, -412.00225830078125, -389.9106140136719, -367.8190002441406, -345.7273864746094, -323.6357727050781, -301.5441589355469, -279.4525146484375, -257.36090087890625, -235.26930236816406, -213.17767333984375, -191.0860595703125, -168.99444580078125, -146.90283203125, -124.81121063232422, -102.71958923339844, -80.62797546386719, -58.53636169433594, -36.444732666015625, -14.353118896484375, 7.738494873046875, 29.83011245727539, 51.921730041503906, 74.01335144042969, 96.10496520996094, 118.19657897949219, 140.2882080078125, 162.37982177734375, 184.471435546875, 206.56304931640625, 228.6546630859375, 250.7462921142578, 272.837890625, 294.92950439453125, 317.0211486816406, 339.1127624511719, 361.2043762207031, 383.2959899902344, 405.3876037597656, 427.479248046875, 449.57086181640625, 471.6624755859375, 493.75408935546875, 515.845703125, 537.9373168945312, 560.0289306640625, 582.1205444335938, 604.212158203125, 626.3037719726562, 648.3953857421875, 670.487060546875, 692.57861328125, 714.6702880859375, 736.7619018554688, 758.853515625, 780.9451293945312, 803.0367431640625, 825.1283569335938, 847.219970703125, 869.3116455078125, 891.4031982421875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 6.0, 10.0, 15.0, 13.0, 17.0, 23.0, 23.0, 30.0, 24.0, 31.0, 36.0, 47.0, 29.0, 55.0, 64.0, 65.0, 56.0, 51.0, 53.0, 43.0, 38.0, 45.0, 32.0, 23.0, 29.0, 15.0, 15.0, 13.0, 19.0, 11.0, 11.0, 4.0, 9.0, 5.0, 13.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-685.2730712890625, -664.1161499023438, -642.959228515625, -621.80224609375, -600.6453247070312, -579.4884033203125, -558.3314208984375, -537.1744995117188, -516.017578125, -494.86065673828125, -473.7037048339844, -452.5467529296875, -431.38983154296875, -410.23291015625, -389.0759582519531, -367.91900634765625, -346.7620849609375, -325.60516357421875, -304.4482116699219, -283.291259765625, -262.13433837890625, -240.97740173339844, -219.82046508789062, -198.6635284423828, -177.506591796875, -156.3496551513672, -135.19271850585938, -114.03578186035156, -92.87884521484375, -71.72190856933594, -50.564971923828125, -29.408035278320312, -8.25115966796875, 12.905776977539062, 34.062713623046875, 55.21965026855469, 76.3765869140625, 97.53352355957031, 118.69046020507812, 139.84739685058594, 161.00433349609375, 182.16127014160156, 203.31820678710938, 224.4751434326172, 245.632080078125, 266.78900146484375, 287.9459533691406, 309.1029052734375, 330.25982666015625, 351.416748046875, 372.5736999511719, 393.73065185546875, 414.8875732421875, 436.04449462890625, 457.2014465332031, 478.3583984375, 499.51531982421875, 520.6722412109375, 541.8292236328125, 562.9861450195312, 584.14306640625, 605.2999877929688, 626.4569091796875, 647.6138916015625, 668.7708129882812]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 3.0, 6.0, 10.0, 9.0, 19.0, 15.0, 26.0, 43.0, 34.0, 71.0, 132.0, 210.0, 231.0, 366.0, 487.0, 806.0, 1212.0, 1887.0, 2929.0, 4771.0, 8133.0, 14753.0, 30545.0, 72491.0, 218260.0, 1744524.0, 1740637.0, 212032.0, 71431.0, 30100.0, 14913.0, 8406.0, 5041.0, 3223.0, 2068.0, 1383.0, 963.0, 647.0, 433.0, 319.0, 237.0, 139.0, 97.0, 81.0, 54.0, 38.0, 21.0, 16.0, 16.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.953125, -21.26708984375, -20.5810546875, -19.89501953125, -19.208984375, -18.52294921875, -17.8369140625, -17.15087890625, -16.46484375, -15.77880859375, -15.0927734375, -14.40673828125, -13.720703125, -13.03466796875, -12.3486328125, -11.66259765625, -10.9765625, -10.29052734375, -9.6044921875, -8.91845703125, -8.232421875, -7.54638671875, -6.8603515625, -6.17431640625, -5.48828125, -4.80224609375, -4.1162109375, -3.43017578125, -2.744140625, -2.05810546875, -1.3720703125, -0.68603515625, 0.0, 0.68603515625, 1.3720703125, 2.05810546875, 2.744140625, 3.43017578125, 4.1162109375, 4.80224609375, 5.48828125, 6.17431640625, 6.8603515625, 7.54638671875, 8.232421875, 8.91845703125, 9.6044921875, 10.29052734375, 10.9765625, 11.66259765625, 12.3486328125, 13.03466796875, 13.720703125, 14.40673828125, 15.0927734375, 15.77880859375, 16.46484375, 17.15087890625, 17.8369140625, 18.52294921875, 19.208984375, 19.89501953125, 20.5810546875, 21.26708984375, 21.953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 8.0, 15.0, 26.0, 28.0, 45.0, 56.0, 71.0, 89.0, 106.0, 103.0, 92.0, 97.0, 49.0, 49.0, 35.0, 29.0, 18.0, 12.0, 8.0, 5.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.345703125, -2.27099609375, -2.1962890625, -2.12158203125, -2.046875, -1.97216796875, -1.8974609375, -1.82275390625, -1.748046875, -1.67333984375, -1.5986328125, -1.52392578125, -1.44921875, -1.37451171875, -1.2998046875, -1.22509765625, -1.150390625, -1.07568359375, -1.0009765625, -0.92626953125, -0.8515625, -0.77685546875, -0.7021484375, -0.62744140625, -0.552734375, -0.47802734375, -0.4033203125, -0.32861328125, -0.25390625, -0.17919921875, -0.1044921875, -0.02978515625, 0.044921875, 0.11962890625, 0.1943359375, 0.26904296875, 0.34375, 0.41845703125, 0.4931640625, 0.56787109375, 0.642578125, 0.71728515625, 0.7919921875, 0.86669921875, 0.94140625, 1.01611328125, 1.0908203125, 1.16552734375, 1.240234375, 1.31494140625, 1.3896484375, 1.46435546875, 1.5390625, 1.61376953125, 1.6884765625, 1.76318359375, 1.837890625, 1.91259765625, 1.9873046875, 2.06201171875, 2.13671875, 2.21142578125, 2.2861328125, 2.36083984375, 2.435546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 7.0, 9.0, 19.0, 13.0, 19.0, 39.0, 47.0, 79.0, 96.0, 165.0, 213.0, 408.0, 640.0, 1160.0, 2180.0, 4869.0, 11423.0, 29105.0, 87300.0, 318323.0, 2193349.0, 1185279.0, 245429.0, 71245.0, 24468.0, 9447.0, 4216.0, 2025.0, 1028.0, 602.0, 369.0, 228.0, 137.0, 103.0, 54.0, 52.0, 36.0, 28.0, 12.0, 19.0, 14.0, 2.0, 4.0, 2.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.7119140625, -18.064453125, -17.4169921875, -16.76953125, -16.1220703125, -15.474609375, -14.8271484375, -14.1796875, -13.5322265625, -12.884765625, -12.2373046875, -11.58984375, -10.9423828125, -10.294921875, -9.6474609375, -9.0, -8.3525390625, -7.705078125, -7.0576171875, -6.41015625, -5.7626953125, -5.115234375, -4.4677734375, -3.8203125, -3.1728515625, -2.525390625, -1.8779296875, -1.23046875, -0.5830078125, 0.064453125, 0.7119140625, 1.359375, 2.0068359375, 2.654296875, 3.3017578125, 3.94921875, 4.5966796875, 5.244140625, 5.8916015625, 6.5390625, 7.1865234375, 7.833984375, 8.4814453125, 9.12890625, 9.7763671875, 10.423828125, 11.0712890625, 11.71875, 12.3662109375, 13.013671875, 13.6611328125, 14.30859375, 14.9560546875, 15.603515625, 16.2509765625, 16.8984375, 17.5458984375, 18.193359375, 18.8408203125, 19.48828125, 20.1357421875, 20.783203125, 21.4306640625, 22.078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 4.0, 7.0, 11.0, 12.0, 11.0, 21.0, 19.0, 38.0, 29.0, 47.0, 47.0, 53.0, 92.0, 109.0, 143.0, 186.0, 240.0, 334.0, 910.0, 463.0, 286.0, 211.0, 164.0, 132.0, 92.0, 92.0, 79.0, 44.0, 42.0, 33.0, 29.0, 19.0, 22.0, 14.0, 7.0, 10.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4765625, -5.2979736328125, -5.119384765625, -4.9407958984375, -4.76220703125, -4.5836181640625, -4.405029296875, -4.2264404296875, -4.0478515625, -3.8692626953125, -3.690673828125, -3.5120849609375, -3.33349609375, -3.1549072265625, -2.976318359375, -2.7977294921875, -2.619140625, -2.4405517578125, -2.261962890625, -2.0833740234375, -1.90478515625, -1.7261962890625, -1.547607421875, -1.3690185546875, -1.1904296875, -1.0118408203125, -0.833251953125, -0.6546630859375, -0.47607421875, -0.2974853515625, -0.118896484375, 0.0596923828125, 0.23828125, 0.4168701171875, 0.595458984375, 0.7740478515625, 0.95263671875, 1.1312255859375, 1.309814453125, 1.4884033203125, 1.6669921875, 1.8455810546875, 2.024169921875, 2.2027587890625, 2.38134765625, 2.5599365234375, 2.738525390625, 2.9171142578125, 3.095703125, 3.2742919921875, 3.452880859375, 3.6314697265625, 3.81005859375, 3.9886474609375, 4.167236328125, 4.3458251953125, 4.5244140625, 4.7030029296875, 4.881591796875, 5.0601806640625, 5.23876953125, 5.4173583984375, 5.595947265625, 5.7745361328125, 5.953125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 13.0, 14.0, 19.0, 25.0, 42.0, 74.0, 91.0, 97.0, 95.0, 106.0, 107.0, 76.0, 64.0, 48.0, 24.0, 31.0, 17.0, 18.0, 10.0, 3.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.60264587402344, -37.04033279418945, -35.4780158996582, -33.91570281982422, -32.35338592529297, -30.791072845458984, -29.228757858276367, -27.66644287109375, -26.104129791259766, -24.54181480407715, -22.97949981689453, -21.417186737060547, -19.85487174987793, -18.292556762695312, -16.730241775512695, -15.167927742004395, -13.605611801147461, -12.043296813964844, -10.480982780456543, -8.918667793273926, -7.356353282928467, -5.794038772583008, -4.231723785400391, -2.66940975189209, -1.1070947647094727, 0.4552198648452759, 2.0175344944000244, 3.5798492431640625, 5.1421637535095215, 6.7044782638549805, 8.266793251037598, 9.829107284545898, 11.391422271728516, 12.953737258911133, 14.516051292419434, 16.078365325927734, 17.64068031311035, 19.20299530029297, 20.765310287475586, 22.327625274658203, 23.889938354492188, 25.452253341674805, 27.014568328857422, 28.576881408691406, 30.139196395874023, 31.70151138305664, 33.263824462890625, 34.826141357421875, 36.388458251953125, 37.95077133178711, 39.51308822631836, 41.075401306152344, 42.637718200683594, 44.20003128051758, 45.76234436035156, 47.32466125488281, 48.8869743347168, 50.44928741455078, 52.01160430908203, 53.573917388916016, 55.136234283447266, 56.69854736328125, 58.2608642578125, 59.823177337646484, 61.38549041748047]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 7.0, 8.0, 11.0, 18.0, 23.0, 26.0, 20.0, 24.0, 23.0, 27.0, 36.0, 37.0, 40.0, 48.0, 30.0, 43.0, 45.0, 41.0, 43.0, 41.0, 36.0, 53.0, 48.0, 41.0, 25.0, 31.0, 31.0, 18.0, 15.0, 15.0, 17.0, 11.0, 9.0, 10.0, 9.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-28.839374542236328, -27.942052841186523, -27.04473114013672, -26.147411346435547, -25.250089645385742, -24.352767944335938, -23.455446243286133, -22.558124542236328, -21.660802841186523, -20.76348114013672, -19.866159439086914, -18.96883773803711, -18.071517944335938, -17.174196243286133, -16.276874542236328, -15.379552841186523, -14.482232093811035, -13.58491039276123, -12.687589645385742, -11.790267944335938, -10.892946243286133, -9.995624542236328, -9.09830379486084, -8.200982093811035, -7.303660869598389, -6.406339645385742, -5.5090179443359375, -4.611696720123291, -3.7143752574920654, -2.81705379486084, -1.9197325706481934, -1.0224108695983887, -0.1250896453857422, 0.7722317576408386, 1.6695531606674194, 2.5668745040893555, 3.464195966720581, 4.361517429351807, 5.258838653564453, 6.156160354614258, 7.053481578826904, 7.950802803039551, 8.848124504089355, 9.745445251464844, 10.642766952514648, 11.540088653564453, 12.437410354614258, 13.334732055664062, 14.23205280303955, 15.129374504089355, 16.026695251464844, 16.92401695251465, 17.821338653564453, 18.718660354614258, 19.615982055664062, 20.513301849365234, 21.41062355041504, 22.307945251464844, 23.20526695251465, 24.102588653564453, 24.999908447265625, 25.89723014831543, 26.794551849365234, 27.69187355041504, 28.589195251464844]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 14.0, 3.0, 13.0, 14.0, 21.0, 21.0, 37.0, 48.0, 74.0, 128.0, 167.0, 282.0, 450.0, 691.0, 1154.0, 2068.0, 3930.0, 8130.0, 19257.0, 51896.0, 172421.0, 447539.0, 229764.0, 66582.0, 23472.0, 9842.0, 4600.0, 2316.0, 1429.0, 795.0, 502.0, 283.0, 210.0, 129.0, 85.0, 69.0, 37.0, 27.0, 23.0, 8.0, 8.0, 6.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-28.296875, -27.42919921875, -26.5615234375, -25.69384765625, -24.826171875, -23.95849609375, -23.0908203125, -22.22314453125, -21.35546875, -20.48779296875, -19.6201171875, -18.75244140625, -17.884765625, -17.01708984375, -16.1494140625, -15.28173828125, -14.4140625, -13.54638671875, -12.6787109375, -11.81103515625, -10.943359375, -10.07568359375, -9.2080078125, -8.34033203125, -7.47265625, -6.60498046875, -5.7373046875, -4.86962890625, -4.001953125, -3.13427734375, -2.2666015625, -1.39892578125, -0.53125, 0.33642578125, 1.2041015625, 2.07177734375, 2.939453125, 3.80712890625, 4.6748046875, 5.54248046875, 6.41015625, 7.27783203125, 8.1455078125, 9.01318359375, 9.880859375, 10.74853515625, 11.6162109375, 12.48388671875, 13.3515625, 14.21923828125, 15.0869140625, 15.95458984375, 16.822265625, 17.68994140625, 18.5576171875, 19.42529296875, 20.29296875, 21.16064453125, 22.0283203125, 22.89599609375, 23.763671875, 24.63134765625, 25.4990234375, 26.36669921875, 27.234375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 6.0, 13.0, 15.0, 14.0, 24.0, 27.0, 40.0, 58.0, 72.0, 74.0, 93.0, 94.0, 90.0, 85.0, 59.0, 53.0, 33.0, 29.0, 24.0, 22.0, 17.0, 10.0, 3.0, 10.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.691131591796875, -2.60882568359375, -2.526519775390625, -2.4442138671875, -2.361907958984375, -2.27960205078125, -2.197296142578125, -2.114990234375, -2.032684326171875, -1.95037841796875, -1.868072509765625, -1.7857666015625, -1.703460693359375, -1.62115478515625, -1.538848876953125, -1.45654296875, -1.374237060546875, -1.29193115234375, -1.209625244140625, -1.1273193359375, -1.045013427734375, -0.96270751953125, -0.880401611328125, -0.798095703125, -0.715789794921875, -0.63348388671875, -0.551177978515625, -0.4688720703125, -0.386566162109375, -0.30426025390625, -0.221954345703125, -0.1396484375, -0.057342529296875, 0.02496337890625, 0.107269287109375, 0.1895751953125, 0.271881103515625, 0.35418701171875, 0.436492919921875, 0.518798828125, 0.601104736328125, 0.68341064453125, 0.765716552734375, 0.8480224609375, 0.930328369140625, 1.01263427734375, 1.094940185546875, 1.17724609375, 1.259552001953125, 1.34185791015625, 1.424163818359375, 1.5064697265625, 1.588775634765625, 1.67108154296875, 1.753387451171875, 1.835693359375, 1.917999267578125, 2.00030517578125, 2.082611083984375, 2.1649169921875, 2.247222900390625, 2.32952880859375, 2.411834716796875, 2.494140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 5.0, 19.0, 23.0, 43.0, 65.0, 110.0, 171.0, 324.0, 553.0, 1061.0, 1866.0, 3534.0, 7058.0, 15404.0, 45879.0, 257878.0, 564194.0, 103980.0, 25249.0, 10286.0, 4982.0, 2546.0, 1390.0, 818.0, 465.0, 253.0, 134.0, 75.0, 54.0, 36.0, 30.0, 14.0, 9.0, 9.0, 7.0, 7.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.296875, -29.295654296875, -28.29443359375, -27.293212890625, -26.2919921875, -25.290771484375, -24.28955078125, -23.288330078125, -22.287109375, -21.285888671875, -20.28466796875, -19.283447265625, -18.2822265625, -17.281005859375, -16.27978515625, -15.278564453125, -14.27734375, -13.276123046875, -12.27490234375, -11.273681640625, -10.2724609375, -9.271240234375, -8.27001953125, -7.268798828125, -6.267578125, -5.266357421875, -4.26513671875, -3.263916015625, -2.2626953125, -1.261474609375, -0.26025390625, 0.740966796875, 1.7421875, 2.743408203125, 3.74462890625, 4.745849609375, 5.7470703125, 6.748291015625, 7.74951171875, 8.750732421875, 9.751953125, 10.753173828125, 11.75439453125, 12.755615234375, 13.7568359375, 14.758056640625, 15.75927734375, 16.760498046875, 17.76171875, 18.762939453125, 19.76416015625, 20.765380859375, 21.7666015625, 22.767822265625, 23.76904296875, 24.770263671875, 25.771484375, 26.772705078125, 27.77392578125, 28.775146484375, 29.7763671875, 30.777587890625, 31.77880859375, 32.780029296875, 33.78125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 6.0, 5.0, 9.0, 16.0, 14.0, 16.0, 16.0, 23.0, 25.0, 41.0, 36.0, 32.0, 43.0, 36.0, 42.0, 49.0, 60.0, 50.0, 28.0, 45.0, 33.0, 48.0, 46.0, 55.0, 32.0, 27.0, 27.0, 30.0, 13.0, 16.0, 14.0, 7.0, 11.0, 7.0, 10.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.2578125, -14.7589111328125, -14.260009765625, -13.7611083984375, -13.26220703125, -12.7633056640625, -12.264404296875, -11.7655029296875, -11.2666015625, -10.7677001953125, -10.268798828125, -9.7698974609375, -9.27099609375, -8.7720947265625, -8.273193359375, -7.7742919921875, -7.275390625, -6.7764892578125, -6.277587890625, -5.7786865234375, -5.27978515625, -4.7808837890625, -4.281982421875, -3.7830810546875, -3.2841796875, -2.7852783203125, -2.286376953125, -1.7874755859375, -1.28857421875, -0.7896728515625, -0.290771484375, 0.2081298828125, 0.70703125, 1.2059326171875, 1.704833984375, 2.2037353515625, 2.70263671875, 3.2015380859375, 3.700439453125, 4.1993408203125, 4.6982421875, 5.1971435546875, 5.696044921875, 6.1949462890625, 6.69384765625, 7.1927490234375, 7.691650390625, 8.1905517578125, 8.689453125, 9.1883544921875, 9.687255859375, 10.1861572265625, 10.68505859375, 11.1839599609375, 11.682861328125, 12.1817626953125, 12.6806640625, 13.1795654296875, 13.678466796875, 14.1773681640625, 14.67626953125, 15.1751708984375, 15.674072265625, 16.1729736328125, 16.671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 6.0, 12.0, 13.0, 17.0, 33.0, 27.0, 66.0, 81.0, 172.0, 258.0, 482.0, 1001.0, 2461.0, 8422.0, 48094.0, 822744.0, 143427.0, 14410.0, 3862.0, 1460.0, 621.0, 337.0, 205.0, 119.0, 60.0, 38.0, 22.0, 25.0, 16.0, 13.0, 7.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0], "bins": [-72.9375, -70.8349609375, -68.732421875, -66.6298828125, -64.52734375, -62.4248046875, -60.322265625, -58.2197265625, -56.1171875, -54.0146484375, -51.912109375, -49.8095703125, -47.70703125, -45.6044921875, -43.501953125, -41.3994140625, -39.296875, -37.1943359375, -35.091796875, -32.9892578125, -30.88671875, -28.7841796875, -26.681640625, -24.5791015625, -22.4765625, -20.3740234375, -18.271484375, -16.1689453125, -14.06640625, -11.9638671875, -9.861328125, -7.7587890625, -5.65625, -3.5537109375, -1.451171875, 0.6513671875, 2.75390625, 4.8564453125, 6.958984375, 9.0615234375, 11.1640625, 13.2666015625, 15.369140625, 17.4716796875, 19.57421875, 21.6767578125, 23.779296875, 25.8818359375, 27.984375, 30.0869140625, 32.189453125, 34.2919921875, 36.39453125, 38.4970703125, 40.599609375, 42.7021484375, 44.8046875, 46.9072265625, 49.009765625, 51.1123046875, 53.21484375, 55.3173828125, 57.419921875, 59.5224609375, 61.625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 11.0, 14.0, 9.0, 13.0, 16.0, 32.0, 58.0, 69.0, 135.0, 192.0, 153.0, 115.0, 65.0, 41.0, 26.0, 18.0, 6.0, 8.0, 5.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00525665283203125, -0.005105137825012207, -0.004953622817993164, -0.004802107810974121, -0.004650592803955078, -0.004499077796936035, -0.004347562789916992, -0.004196047782897949, -0.004044532775878906, -0.0038930177688598633, -0.0037415027618408203, -0.0035899877548217773, -0.0034384727478027344, -0.0032869577407836914, -0.0031354427337646484, -0.0029839277267456055, -0.0028324127197265625, -0.0026808977127075195, -0.0025293827056884766, -0.0023778676986694336, -0.0022263526916503906, -0.0020748376846313477, -0.0019233226776123047, -0.0017718076705932617, -0.0016202926635742188, -0.0014687776565551758, -0.0013172626495361328, -0.0011657476425170898, -0.0010142326354980469, -0.0008627176284790039, -0.0007112026214599609, -0.000559687614440918, -0.000408172607421875, -0.00025665760040283203, -0.00010514259338378906, 4.6372413635253906e-05, 0.00019788742065429688, 0.00034940242767333984, 0.0005009174346923828, 0.0006524324417114258, 0.0008039474487304688, 0.0009554624557495117, 0.0011069774627685547, 0.0012584924697875977, 0.0014100074768066406, 0.0015615224838256836, 0.0017130374908447266, 0.0018645524978637695, 0.0020160675048828125, 0.0021675825119018555, 0.0023190975189208984, 0.0024706125259399414, 0.0026221275329589844, 0.0027736425399780273, 0.0029251575469970703, 0.0030766725540161133, 0.0032281875610351562, 0.0033797025680541992, 0.003531217575073242, 0.003682732582092285, 0.003834247589111328, 0.003985762596130371, 0.004137277603149414, 0.004288792610168457, 0.0044403076171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 8.0, 2.0, 20.0, 14.0, 29.0, 13.0, 51.0, 91.0, 182.0, 327.0, 820.0, 2665.0, 14653.0, 484495.0, 525744.0, 15086.0, 2786.0, 814.0, 351.0, 167.0, 88.0, 47.0, 36.0, 25.0, 14.0, 9.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.15625, -59.93701171875, -57.7177734375, -55.49853515625, -53.279296875, -51.06005859375, -48.8408203125, -46.62158203125, -44.40234375, -42.18310546875, -39.9638671875, -37.74462890625, -35.525390625, -33.30615234375, -31.0869140625, -28.86767578125, -26.6484375, -24.42919921875, -22.2099609375, -19.99072265625, -17.771484375, -15.55224609375, -13.3330078125, -11.11376953125, -8.89453125, -6.67529296875, -4.4560546875, -2.23681640625, -0.017578125, 2.20166015625, 4.4208984375, 6.64013671875, 8.859375, 11.07861328125, 13.2978515625, 15.51708984375, 17.736328125, 19.95556640625, 22.1748046875, 24.39404296875, 26.61328125, 28.83251953125, 31.0517578125, 33.27099609375, 35.490234375, 37.70947265625, 39.9287109375, 42.14794921875, 44.3671875, 46.58642578125, 48.8056640625, 51.02490234375, 53.244140625, 55.46337890625, 57.6826171875, 59.90185546875, 62.12109375, 64.34033203125, 66.5595703125, 68.77880859375, 70.998046875, 73.21728515625, 75.4365234375, 77.65576171875, 79.875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 16.0, 16.0, 39.0, 85.0, 148.0, 195.0, 207.0, 145.0, 75.0, 28.0, 18.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.3125, -31.1923828125, -30.072265625, -28.9521484375, -27.83203125, -26.7119140625, -25.591796875, -24.4716796875, -23.3515625, -22.2314453125, -21.111328125, -19.9912109375, -18.87109375, -17.7509765625, -16.630859375, -15.5107421875, -14.390625, -13.2705078125, -12.150390625, -11.0302734375, -9.91015625, -8.7900390625, -7.669921875, -6.5498046875, -5.4296875, -4.3095703125, -3.189453125, -2.0693359375, -0.94921875, 0.1708984375, 1.291015625, 2.4111328125, 3.53125, 4.6513671875, 5.771484375, 6.8916015625, 8.01171875, 9.1318359375, 10.251953125, 11.3720703125, 12.4921875, 13.6123046875, 14.732421875, 15.8525390625, 16.97265625, 18.0927734375, 19.212890625, 20.3330078125, 21.453125, 22.5732421875, 23.693359375, 24.8134765625, 25.93359375, 27.0537109375, 28.173828125, 29.2939453125, 30.4140625, 31.5341796875, 32.654296875, 33.7744140625, 34.89453125, 36.0146484375, 37.134765625, 38.2548828125, 39.375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 5.0, 4.0, 7.0, 11.0, 13.0, 35.0, 55.0, 103.0, 223.0, 246.0, 149.0, 59.0, 20.0, 17.0, 8.0, 12.0, 3.0, 7.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-394.4444274902344, -383.82470703125, -373.2049560546875, -362.5852355957031, -351.9654846191406, -341.34576416015625, -330.72601318359375, -320.1062927246094, -309.486572265625, -298.8668518066406, -288.2471008300781, -277.62738037109375, -267.00762939453125, -256.3879089355469, -245.76817321777344, -235.1484375, -224.52870178222656, -213.90896606445312, -203.2892303466797, -192.66949462890625, -182.04977416992188, -171.43003845214844, -160.810302734375, -150.19058227539062, -139.57083129882812, -128.9510955810547, -118.33136749267578, -107.71163177490234, -97.09190368652344, -86.47216796875, -75.85243225097656, -65.23270416259766, -54.61297607421875, -43.99324417114258, -33.373512268066406, -22.75377655029297, -12.134044647216797, -1.514312744140625, 9.105422973632812, 19.72515106201172, 30.344886779785156, 40.96461868286133, 51.5843505859375, 62.20408630371094, 72.82382202148438, 83.44355010986328, 94.06328582763672, 104.68301391601562, 115.30274963378906, 125.9224853515625, 136.54222106933594, 147.16195678710938, 157.78167724609375, 168.4014129638672, 179.02114868164062, 189.640869140625, 200.2606201171875, 210.88035583496094, 221.50009155273438, 232.11981201171875, 242.7395477294922, 253.35928344726562, 263.97900390625, 274.5987548828125, 285.2184753417969]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 2.0, 8.0, 7.0, 5.0, 11.0, 9.0, 31.0, 35.0, 59.0, 104.0, 140.0, 171.0, 135.0, 91.0, 70.0, 35.0, 18.0, 11.0, 11.0, 6.0, 9.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.5455627441406, -280.0285339355469, -270.511474609375, -260.99444580078125, -251.4774169921875, -241.96038818359375, -232.44334411621094, -222.92630004882812, -213.40927124023438, -203.89224243164062, -194.3751983642578, -184.858154296875, -175.34112548828125, -165.8240966796875, -156.3070526123047, -146.79000854492188, -137.27297973632812, -127.75594329833984, -118.23890686035156, -108.72187042236328, -99.204833984375, -89.68779754638672, -80.17076110839844, -70.65372467041016, -61.136688232421875, -51.619651794433594, -42.10261535644531, -32.58557891845703, -23.06854248046875, -13.551506042480469, -4.0344696044921875, 5.482566833496094, 14.999603271484375, 24.516639709472656, 34.03367614746094, 43.55071258544922, 53.0677490234375, 62.58478546142578, 72.10182189941406, 81.61885833740234, 91.13589477539062, 100.6529312133789, 110.16996765136719, 119.68700408935547, 129.20404052734375, 138.7210693359375, 148.2381134033203, 157.75515747070312, 167.27218627929688, 176.78921508789062, 186.30625915527344, 195.82330322265625, 205.34033203125, 214.85736083984375, 224.37440490722656, 233.89144897460938, 243.40847778320312, 252.92550659179688, 262.44256591796875, 271.9595947265625, 281.47662353515625, 290.99365234375, 300.51068115234375, 310.0277404785156, 319.5447692871094]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 9.0, 12.0, 17.0, 16.0, 27.0, 29.0, 34.0, 58.0, 66.0, 117.0, 130.0, 231.0, 312.0, 571.0, 1040.0, 1726.0, 3427.0, 7012.0, 17711.0, 55880.0, 322847.0, 3562003.0, 164426.0, 35870.0, 11529.0, 4567.0, 2101.0, 1008.0, 593.0, 333.0, 220.0, 119.0, 76.0, 44.0, 38.0, 23.0, 24.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.4375, -67.1484375, -64.859375, -62.5703125, -60.28125, -57.9921875, -55.703125, -53.4140625, -51.125, -48.8359375, -46.546875, -44.2578125, -41.96875, -39.6796875, -37.390625, -35.1015625, -32.8125, -30.5234375, -28.234375, -25.9453125, -23.65625, -21.3671875, -19.078125, -16.7890625, -14.5, -12.2109375, -9.921875, -7.6328125, -5.34375, -3.0546875, -0.765625, 1.5234375, 3.8125, 6.1015625, 8.390625, 10.6796875, 12.96875, 15.2578125, 17.546875, 19.8359375, 22.125, 24.4140625, 26.703125, 28.9921875, 31.28125, 33.5703125, 35.859375, 38.1484375, 40.4375, 42.7265625, 45.015625, 47.3046875, 49.59375, 51.8828125, 54.171875, 56.4609375, 58.75, 61.0390625, 63.328125, 65.6171875, 67.90625, 70.1953125, 72.484375, 74.7734375, 77.0625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 1.0, 4.0, 5.0, 3.0, 6.0, 7.0, 12.0, 23.0, 22.0, 28.0, 32.0, 59.0, 62.0, 69.0, 87.0, 91.0, 90.0, 68.0, 69.0, 56.0, 52.0, 38.0, 23.0, 18.0, 18.0, 8.0, 6.0, 15.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.32421875, -3.23309326171875, -3.1419677734375, -3.05084228515625, -2.959716796875, -2.86859130859375, -2.7774658203125, -2.68634033203125, -2.59521484375, -2.50408935546875, -2.4129638671875, -2.32183837890625, -2.230712890625, -2.13958740234375, -2.0484619140625, -1.95733642578125, -1.8662109375, -1.77508544921875, -1.6839599609375, -1.59283447265625, -1.501708984375, -1.41058349609375, -1.3194580078125, -1.22833251953125, -1.13720703125, -1.04608154296875, -0.9549560546875, -0.86383056640625, -0.772705078125, -0.68157958984375, -0.5904541015625, -0.49932861328125, -0.408203125, -0.31707763671875, -0.2259521484375, -0.13482666015625, -0.043701171875, 0.04742431640625, 0.1385498046875, 0.22967529296875, 0.32080078125, 0.41192626953125, 0.5030517578125, 0.59417724609375, 0.685302734375, 0.77642822265625, 0.8675537109375, 0.95867919921875, 1.0498046875, 1.14093017578125, 1.2320556640625, 1.32318115234375, 1.414306640625, 1.50543212890625, 1.5965576171875, 1.68768310546875, 1.77880859375, 1.86993408203125, 1.9610595703125, 2.05218505859375, 2.143310546875, 2.23443603515625, 2.3255615234375, 2.41668701171875, 2.5078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 10.0, 12.0, 17.0, 19.0, 44.0, 83.0, 184.0, 305.0, 738.0, 1849.0, 6324.0, 31292.0, 249216.0, 3414587.0, 429314.0, 47003.0, 9105.0, 2504.0, 845.0, 407.0, 178.0, 87.0, 57.0, 48.0, 20.0, 5.0, 11.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.9375, -46.7724609375, -44.607421875, -42.4423828125, -40.27734375, -38.1123046875, -35.947265625, -33.7822265625, -31.6171875, -29.4521484375, -27.287109375, -25.1220703125, -22.95703125, -20.7919921875, -18.626953125, -16.4619140625, -14.296875, -12.1318359375, -9.966796875, -7.8017578125, -5.63671875, -3.4716796875, -1.306640625, 0.8583984375, 3.0234375, 5.1884765625, 7.353515625, 9.5185546875, 11.68359375, 13.8486328125, 16.013671875, 18.1787109375, 20.34375, 22.5087890625, 24.673828125, 26.8388671875, 29.00390625, 31.1689453125, 33.333984375, 35.4990234375, 37.6640625, 39.8291015625, 41.994140625, 44.1591796875, 46.32421875, 48.4892578125, 50.654296875, 52.8193359375, 54.984375, 57.1494140625, 59.314453125, 61.4794921875, 63.64453125, 65.8095703125, 67.974609375, 70.1396484375, 72.3046875, 74.4697265625, 76.634765625, 78.7998046875, 80.96484375, 83.1298828125, 85.294921875, 87.4599609375, 89.625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 12.0, 10.0, 15.0, 21.0, 34.0, 27.0, 60.0, 72.0, 91.0, 169.0, 257.0, 342.0, 791.0, 977.0, 391.0, 211.0, 152.0, 110.0, 84.0, 67.0, 35.0, 27.0, 26.0, 26.0, 14.0, 12.0, 5.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.640625, -6.4266357421875, -6.212646484375, -5.9986572265625, -5.78466796875, -5.5706787109375, -5.356689453125, -5.1427001953125, -4.9287109375, -4.7147216796875, -4.500732421875, -4.2867431640625, -4.07275390625, -3.8587646484375, -3.644775390625, -3.4307861328125, -3.216796875, -3.0028076171875, -2.788818359375, -2.5748291015625, -2.36083984375, -2.1468505859375, -1.932861328125, -1.7188720703125, -1.5048828125, -1.2908935546875, -1.076904296875, -0.8629150390625, -0.64892578125, -0.4349365234375, -0.220947265625, -0.0069580078125, 0.20703125, 0.4210205078125, 0.635009765625, 0.8489990234375, 1.06298828125, 1.2769775390625, 1.490966796875, 1.7049560546875, 1.9189453125, 2.1329345703125, 2.346923828125, 2.5609130859375, 2.77490234375, 2.9888916015625, 3.202880859375, 3.4168701171875, 3.630859375, 3.8448486328125, 4.058837890625, 4.2728271484375, 4.48681640625, 4.7008056640625, 4.914794921875, 5.1287841796875, 5.3427734375, 5.5567626953125, 5.770751953125, 5.9847412109375, 6.19873046875, 6.4127197265625, 6.626708984375, 6.8406982421875, 7.0546875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 3.0, 12.0, 11.0, 20.0, 42.0, 111.0, 139.0, 193.0, 199.0, 108.0, 82.0, 38.0, 13.0, 10.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-89.86197662353516, -87.64466857910156, -85.4273681640625, -83.2100601196289, -80.99275970458984, -78.77545166015625, -76.55815124511719, -74.3408432006836, -72.12353515625, -69.9062271118164, -67.68892669677734, -65.47161865234375, -63.25431823730469, -61.037010192871094, -58.819705963134766, -56.60240173339844, -54.385101318359375, -52.16779708862305, -49.95049285888672, -47.73318862915039, -45.51588439941406, -43.29857635498047, -41.08127212524414, -38.86396789550781, -36.646663665771484, -34.429359436035156, -32.21205520629883, -29.994749069213867, -27.77744483947754, -25.56014060974121, -23.34283447265625, -21.125530242919922, -18.90822982788086, -16.69092559814453, -14.473620414733887, -12.256315231323242, -10.039011001586914, -7.821706771850586, -5.604401588439941, -3.387096405029297, -1.1697921752929688, 1.0475125312805176, 3.264817237854004, 5.48212194442749, 7.699426651000977, 9.916730880737305, 12.13403606414795, 14.351341247558594, 16.568645477294922, 18.78594970703125, 21.003253936767578, 23.22056007385254, 25.437864303588867, 27.655168533325195, 29.872474670410156, 32.089778900146484, 34.30708312988281, 36.52438735961914, 38.74169158935547, 40.9589958190918, 43.176300048828125, 45.39360809326172, 47.61091232299805, 49.828216552734375, 52.0455207824707]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 11.0, 14.0, 18.0, 21.0, 21.0, 35.0, 45.0, 52.0, 47.0, 63.0, 64.0, 70.0, 72.0, 71.0, 68.0, 52.0, 58.0, 39.0, 30.0, 30.0, 13.0, 21.0, 18.0, 12.0, 11.0, 8.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.05409240722656, -38.81858444213867, -37.583072662353516, -36.347564697265625, -35.112056732177734, -33.87654495239258, -32.64103698730469, -31.405527114868164, -30.17001724243164, -28.934507369995117, -27.698999404907227, -26.463489532470703, -25.22797966003418, -23.992469787597656, -22.756961822509766, -21.521451950073242, -20.28594398498535, -19.050434112548828, -17.814926147460938, -16.579416275024414, -15.34390640258789, -14.108397483825684, -12.872888565063477, -11.637378692626953, -10.401869773864746, -9.166360855102539, -7.930850982666016, -6.695342063903809, -5.459832668304443, -4.224323272705078, -2.988814353942871, -1.7533044815063477, -0.5177955627441406, 0.7177137136459351, 1.9532229900360107, 3.188732147216797, 4.424241542816162, 5.659750938415527, 6.895259857177734, 8.130769729614258, 9.366278648376465, 10.601787567138672, 11.837297439575195, 13.072806358337402, 14.30831527709961, 15.543825149536133, 16.779335021972656, 18.014842987060547, 19.25035285949707, 20.485862731933594, 21.721370697021484, 22.956880569458008, 24.19239044189453, 25.427898406982422, 26.663408279418945, 27.89891815185547, 29.13442611694336, 30.369935989379883, 31.605443954467773, 32.8409538269043, 34.07646179199219, 35.311973571777344, 36.547481536865234, 37.782989501953125, 39.01850128173828]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 5.0, 25.0, 40.0, 46.0, 90.0, 120.0, 238.0, 444.0, 757.0, 1428.0, 2633.0, 5027.0, 10306.0, 21847.0, 49668.0, 119740.0, 280112.0, 309627.0, 140089.0, 57074.0, 25276.0, 11755.0, 5737.0, 2960.0, 1543.0, 847.0, 442.0, 294.0, 151.0, 94.0, 46.0, 34.0, 27.0, 6.0, 8.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.359375, -22.693603515625, -22.02783203125, -21.362060546875, -20.6962890625, -20.030517578125, -19.36474609375, -18.698974609375, -18.033203125, -17.367431640625, -16.70166015625, -16.035888671875, -15.3701171875, -14.704345703125, -14.03857421875, -13.372802734375, -12.70703125, -12.041259765625, -11.37548828125, -10.709716796875, -10.0439453125, -9.378173828125, -8.71240234375, -8.046630859375, -7.380859375, -6.715087890625, -6.04931640625, -5.383544921875, -4.7177734375, -4.052001953125, -3.38623046875, -2.720458984375, -2.0546875, -1.388916015625, -0.72314453125, -0.057373046875, 0.6083984375, 1.274169921875, 1.93994140625, 2.605712890625, 3.271484375, 3.937255859375, 4.60302734375, 5.268798828125, 5.9345703125, 6.600341796875, 7.26611328125, 7.931884765625, 8.59765625, 9.263427734375, 9.92919921875, 10.594970703125, 11.2607421875, 11.926513671875, 12.59228515625, 13.258056640625, 13.923828125, 14.589599609375, 15.25537109375, 15.921142578125, 16.5869140625, 17.252685546875, 17.91845703125, 18.584228515625, 19.25]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 2.0, 8.0, 5.0, 11.0, 12.0, 15.0, 21.0, 16.0, 14.0, 18.0, 36.0, 25.0, 41.0, 40.0, 44.0, 46.0, 54.0, 50.0, 42.0, 50.0, 64.0, 45.0, 40.0, 44.0, 37.0, 37.0, 25.0, 17.0, 23.0, 25.0, 13.0, 17.0, 12.0, 10.0, 7.0, 7.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.9013671875, -1.8409271240234375, -1.780487060546875, -1.7200469970703125, -1.65960693359375, -1.5991668701171875, -1.538726806640625, -1.4782867431640625, -1.4178466796875, -1.3574066162109375, -1.296966552734375, -1.2365264892578125, -1.17608642578125, -1.1156463623046875, -1.055206298828125, -0.9947662353515625, -0.934326171875, -0.8738861083984375, -0.813446044921875, -0.7530059814453125, -0.69256591796875, -0.6321258544921875, -0.571685791015625, -0.5112457275390625, -0.4508056640625, -0.3903656005859375, -0.329925537109375, -0.2694854736328125, -0.20904541015625, -0.1486053466796875, -0.088165283203125, -0.0277252197265625, 0.03271484375, 0.0931549072265625, 0.153594970703125, 0.2140350341796875, 0.27447509765625, 0.3349151611328125, 0.395355224609375, 0.4557952880859375, 0.5162353515625, 0.5766754150390625, 0.637115478515625, 0.6975555419921875, 0.75799560546875, 0.8184356689453125, 0.878875732421875, 0.9393157958984375, 0.999755859375, 1.0601959228515625, 1.120635986328125, 1.1810760498046875, 1.24151611328125, 1.3019561767578125, 1.362396240234375, 1.4228363037109375, 1.4832763671875, 1.5437164306640625, 1.604156494140625, 1.6645965576171875, 1.72503662109375, 1.7854766845703125, 1.845916748046875, 1.9063568115234375, 1.966796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 11.0, 15.0, 28.0, 75.0, 157.0, 430.0, 1347.0, 5086.0, 24362.0, 160063.0, 662916.0, 161562.0, 25059.0, 5258.0, 1374.0, 454.0, 164.0, 90.0, 40.0, 22.0, 14.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.03125, -29.90283203125, -28.7744140625, -27.64599609375, -26.517578125, -25.38916015625, -24.2607421875, -23.13232421875, -22.00390625, -20.87548828125, -19.7470703125, -18.61865234375, -17.490234375, -16.36181640625, -15.2333984375, -14.10498046875, -12.9765625, -11.84814453125, -10.7197265625, -9.59130859375, -8.462890625, -7.33447265625, -6.2060546875, -5.07763671875, -3.94921875, -2.82080078125, -1.6923828125, -0.56396484375, 0.564453125, 1.69287109375, 2.8212890625, 3.94970703125, 5.078125, 6.20654296875, 7.3349609375, 8.46337890625, 9.591796875, 10.72021484375, 11.8486328125, 12.97705078125, 14.10546875, 15.23388671875, 16.3623046875, 17.49072265625, 18.619140625, 19.74755859375, 20.8759765625, 22.00439453125, 23.1328125, 24.26123046875, 25.3896484375, 26.51806640625, 27.646484375, 28.77490234375, 29.9033203125, 31.03173828125, 32.16015625, 33.28857421875, 34.4169921875, 35.54541015625, 36.673828125, 37.80224609375, 38.9306640625, 40.05908203125, 41.1875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 9.0, 13.0, 12.0, 13.0, 15.0, 25.0, 18.0, 16.0, 20.0, 29.0, 30.0, 28.0, 27.0, 37.0, 26.0, 34.0, 37.0, 41.0, 54.0, 47.0, 39.0, 44.0, 37.0, 37.0, 38.0, 26.0, 29.0, 24.0, 23.0, 22.0, 23.0, 14.0, 15.0, 18.0, 11.0, 11.0, 8.0, 6.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-10.625, -10.297119140625, -9.96923828125, -9.641357421875, -9.3134765625, -8.985595703125, -8.65771484375, -8.329833984375, -8.001953125, -7.674072265625, -7.34619140625, -7.018310546875, -6.6904296875, -6.362548828125, -6.03466796875, -5.706787109375, -5.37890625, -5.051025390625, -4.72314453125, -4.395263671875, -4.0673828125, -3.739501953125, -3.41162109375, -3.083740234375, -2.755859375, -2.427978515625, -2.10009765625, -1.772216796875, -1.4443359375, -1.116455078125, -0.78857421875, -0.460693359375, -0.1328125, 0.195068359375, 0.52294921875, 0.850830078125, 1.1787109375, 1.506591796875, 1.83447265625, 2.162353515625, 2.490234375, 2.818115234375, 3.14599609375, 3.473876953125, 3.8017578125, 4.129638671875, 4.45751953125, 4.785400390625, 5.11328125, 5.441162109375, 5.76904296875, 6.096923828125, 6.4248046875, 6.752685546875, 7.08056640625, 7.408447265625, 7.736328125, 8.064208984375, 8.39208984375, 8.719970703125, 9.0478515625, 9.375732421875, 9.70361328125, 10.031494140625, 10.359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 11.0, 14.0, 23.0, 32.0, 63.0, 167.0, 395.0, 1006.0, 2956.0, 12642.0, 105324.0, 820626.0, 89522.0, 11428.0, 2785.0, 895.0, 353.0, 138.0, 73.0, 38.0, 22.0, 21.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-87.8125, -85.9228515625, -84.033203125, -82.1435546875, -80.25390625, -78.3642578125, -76.474609375, -74.5849609375, -72.6953125, -70.8056640625, -68.916015625, -67.0263671875, -65.13671875, -63.2470703125, -61.357421875, -59.4677734375, -57.578125, -55.6884765625, -53.798828125, -51.9091796875, -50.01953125, -48.1298828125, -46.240234375, -44.3505859375, -42.4609375, -40.5712890625, -38.681640625, -36.7919921875, -34.90234375, -33.0126953125, -31.123046875, -29.2333984375, -27.34375, -25.4541015625, -23.564453125, -21.6748046875, -19.78515625, -17.8955078125, -16.005859375, -14.1162109375, -12.2265625, -10.3369140625, -8.447265625, -6.5576171875, -4.66796875, -2.7783203125, -0.888671875, 1.0009765625, 2.890625, 4.7802734375, 6.669921875, 8.5595703125, 10.44921875, 12.3388671875, 14.228515625, 16.1181640625, 18.0078125, 19.8974609375, 21.787109375, 23.6767578125, 25.56640625, 27.4560546875, 29.345703125, 31.2353515625, 33.125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 10.0, 11.0, 13.0, 17.0, 36.0, 49.0, 75.0, 124.0, 195.0, 156.0, 123.0, 67.0, 49.0, 26.0, 16.0, 5.0, 4.0, 9.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002899169921875, -0.002813190221786499, -0.002727210521697998, -0.002641230821609497, -0.002555251121520996, -0.002469271421432495, -0.002383291721343994, -0.002297312021255493, -0.002211332321166992, -0.002125352621078491, -0.0020393729209899902, -0.0019533932209014893, -0.0018674135208129883, -0.0017814338207244873, -0.0016954541206359863, -0.0016094744205474854, -0.0015234947204589844, -0.0014375150203704834, -0.0013515353202819824, -0.0012655556201934814, -0.0011795759201049805, -0.0010935962200164795, -0.0010076165199279785, -0.0009216368198394775, -0.0008356571197509766, -0.0007496774196624756, -0.0006636977195739746, -0.0005777180194854736, -0.0004917383193969727, -0.0004057586193084717, -0.0003197789192199707, -0.00023379921913146973, -0.00014781951904296875, -6.183981895446777e-05, 2.4139881134033203e-05, 0.00011011958122253418, 0.00019609928131103516, 0.00028207898139953613, 0.0003680586814880371, 0.0004540383815765381, 0.0005400180816650391, 0.00062599778175354, 0.000711977481842041, 0.000797957181930542, 0.000883936882019043, 0.0009699165821075439, 0.001055896282196045, 0.001141875982284546, 0.0012278556823730469, 0.0013138353824615479, 0.0013998150825500488, 0.0014857947826385498, 0.0015717744827270508, 0.0016577541828155518, 0.0017437338829040527, 0.0018297135829925537, 0.0019156932830810547, 0.0020016729831695557, 0.0020876526832580566, 0.0021736323833465576, 0.0022596120834350586, 0.0023455917835235596, 0.0024315714836120605, 0.0025175511837005615, 0.0026035308837890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 16.0, 14.0, 29.0, 29.0, 44.0, 64.0, 100.0, 145.0, 209.0, 330.0, 489.0, 830.0, 1295.0, 2275.0, 3955.0, 7536.0, 15347.0, 36089.0, 107575.0, 355980.0, 344240.0, 103677.0, 35351.0, 15104.0, 7298.0, 4146.0, 2367.0, 1434.0, 831.0, 552.0, 361.0, 242.0, 171.0, 121.0, 80.0, 59.0, 50.0, 28.0, 22.0, 17.0, 15.0, 11.0, 4.0, 5.0, 6.0, 0.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.015625, -17.347900390625, -16.68017578125, -16.012451171875, -15.3447265625, -14.677001953125, -14.00927734375, -13.341552734375, -12.673828125, -12.006103515625, -11.33837890625, -10.670654296875, -10.0029296875, -9.335205078125, -8.66748046875, -7.999755859375, -7.33203125, -6.664306640625, -5.99658203125, -5.328857421875, -4.6611328125, -3.993408203125, -3.32568359375, -2.657958984375, -1.990234375, -1.322509765625, -0.65478515625, 0.012939453125, 0.6806640625, 1.348388671875, 2.01611328125, 2.683837890625, 3.3515625, 4.019287109375, 4.68701171875, 5.354736328125, 6.0224609375, 6.690185546875, 7.35791015625, 8.025634765625, 8.693359375, 9.361083984375, 10.02880859375, 10.696533203125, 11.3642578125, 12.031982421875, 12.69970703125, 13.367431640625, 14.03515625, 14.702880859375, 15.37060546875, 16.038330078125, 16.7060546875, 17.373779296875, 18.04150390625, 18.709228515625, 19.376953125, 20.044677734375, 20.71240234375, 21.380126953125, 22.0478515625, 22.715576171875, 23.38330078125, 24.051025390625, 24.71875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 4.0, 10.0, 12.0, 13.0, 18.0, 18.0, 27.0, 30.0, 55.0, 76.0, 84.0, 101.0, 106.0, 95.0, 75.0, 68.0, 43.0, 34.0, 30.0, 20.0, 11.0, 8.0, 12.0, 7.0, 6.0, 5.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2109375, -11.6593017578125, -11.107666015625, -10.5560302734375, -10.00439453125, -9.4527587890625, -8.901123046875, -8.3494873046875, -7.7978515625, -7.2462158203125, -6.694580078125, -6.1429443359375, -5.59130859375, -5.0396728515625, -4.488037109375, -3.9364013671875, -3.384765625, -2.8331298828125, -2.281494140625, -1.7298583984375, -1.17822265625, -0.6265869140625, -0.074951171875, 0.4766845703125, 1.0283203125, 1.5799560546875, 2.131591796875, 2.6832275390625, 3.23486328125, 3.7864990234375, 4.338134765625, 4.8897705078125, 5.44140625, 5.9930419921875, 6.544677734375, 7.0963134765625, 7.64794921875, 8.1995849609375, 8.751220703125, 9.3028564453125, 9.8544921875, 10.4061279296875, 10.957763671875, 11.5093994140625, 12.06103515625, 12.6126708984375, 13.164306640625, 13.7159423828125, 14.267578125, 14.8192138671875, 15.370849609375, 15.9224853515625, 16.47412109375, 17.0257568359375, 17.577392578125, 18.1290283203125, 18.6806640625, 19.2322998046875, 19.783935546875, 20.3355712890625, 20.88720703125, 21.4388427734375, 21.990478515625, 22.5421142578125, 23.09375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 14.0, 29.0, 45.0, 88.0, 159.0, 206.0, 191.0, 115.0, 67.0, 33.0, 14.0, 5.0, 7.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.4331817626953, -153.01084899902344, -146.58851623535156, -140.1661834716797, -133.74383544921875, -127.3215103149414, -120.899169921875, -114.47683715820312, -108.05450439453125, -101.63217163085938, -95.2098388671875, -88.7874984741211, -82.36516571044922, -75.94283294677734, -69.52049255371094, -63.09815979003906, -56.67582702636719, -50.25349426269531, -43.83115768432617, -37.40882110595703, -30.986488342285156, -24.56415557861328, -18.14181900024414, -11.719482421875, -5.297149658203125, 1.1251850128173828, 7.547519683837891, 13.969854354858398, 20.392189025878906, 26.81452178955078, 33.23685836791992, 39.65919494628906, 46.081512451171875, 52.50384521484375, 58.92618179321289, 65.34851837158203, 71.7708511352539, 78.19318389892578, 84.61552429199219, 91.03785705566406, 97.46018981933594, 103.88252258300781, 110.30485534667969, 116.7271957397461, 123.14952850341797, 129.57186889648438, 135.99420166015625, 142.41653442382812, 148.8388671875, 155.26119995117188, 161.68353271484375, 168.10586547851562, 174.5281982421875, 180.95053100585938, 187.3728790283203, 193.7952117919922, 200.21754455566406, 206.63987731933594, 213.0622100830078, 219.4845428466797, 225.90689086914062, 232.3292236328125, 238.75155639648438, 245.17388916015625, 251.59622192382812]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 14.0, 13.0, 15.0, 19.0, 29.0, 41.0, 37.0, 50.0, 52.0, 70.0, 77.0, 100.0, 73.0, 82.0, 76.0, 52.0, 41.0, 30.0, 27.0, 19.0, 13.0, 9.0, 10.0, 5.0, 5.0, 4.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-132.16354370117188, -127.71258544921875, -123.26162719726562, -118.8106689453125, -114.35971069335938, -109.90875244140625, -105.45779418945312, -101.0068359375, -96.55587768554688, -92.10491943359375, -87.65396118164062, -83.2030029296875, -78.75204467773438, -74.30108642578125, -69.85012817382812, -65.399169921875, -60.948211669921875, -56.49725341796875, -52.046295166015625, -47.5953369140625, -43.144378662109375, -38.69342041015625, -34.242462158203125, -29.79150390625, -25.340545654296875, -20.88958740234375, -16.438629150390625, -11.9876708984375, -7.536712646484375, -3.08575439453125, 1.365203857421875, 5.816162109375, 10.267135620117188, 14.718093872070312, 19.169052124023438, 23.620010375976562, 28.070968627929688, 32.52192687988281, 36.97288513183594, 41.42384338378906, 45.87480163574219, 50.32575988769531, 54.77671813964844, 59.22767639160156, 63.67863464355469, 68.12959289550781, 72.58055114746094, 77.03150939941406, 81.48246765136719, 85.93342590332031, 90.38438415527344, 94.83534240722656, 99.28630065917969, 103.73725891113281, 108.18821716308594, 112.63917541503906, 117.09013366699219, 121.54109191894531, 125.99205017089844, 130.44300842285156, 134.8939666748047, 139.3449249267578, 143.79588317871094, 148.24684143066406, 152.6977996826172]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 8.0, 21.0, 23.0, 37.0, 66.0, 126.0, 153.0, 316.0, 530.0, 876.0, 1579.0, 2877.0, 5908.0, 12889.0, 34024.0, 137679.0, 3551778.0, 358117.0, 53731.0, 17676.0, 7413.0, 3760.0, 1967.0, 1104.0, 647.0, 368.0, 218.0, 131.0, 72.0, 56.0, 27.0, 25.0, 24.0, 19.0, 14.0, 12.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.125, -54.2353515625, -52.345703125, -50.4560546875, -48.56640625, -46.6767578125, -44.787109375, -42.8974609375, -41.0078125, -39.1181640625, -37.228515625, -35.3388671875, -33.44921875, -31.5595703125, -29.669921875, -27.7802734375, -25.890625, -24.0009765625, -22.111328125, -20.2216796875, -18.33203125, -16.4423828125, -14.552734375, -12.6630859375, -10.7734375, -8.8837890625, -6.994140625, -5.1044921875, -3.21484375, -1.3251953125, 0.564453125, 2.4541015625, 4.34375, 6.2333984375, 8.123046875, 10.0126953125, 11.90234375, 13.7919921875, 15.681640625, 17.5712890625, 19.4609375, 21.3505859375, 23.240234375, 25.1298828125, 27.01953125, 28.9091796875, 30.798828125, 32.6884765625, 34.578125, 36.4677734375, 38.357421875, 40.2470703125, 42.13671875, 44.0263671875, 45.916015625, 47.8056640625, 49.6953125, 51.5849609375, 53.474609375, 55.3642578125, 57.25390625, 59.1435546875, 61.033203125, 62.9228515625, 64.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 7.0, 5.0, 12.0, 12.0, 13.0, 18.0, 22.0, 42.0, 38.0, 34.0, 56.0, 56.0, 59.0, 78.0, 61.0, 84.0, 76.0, 72.0, 55.0, 43.0, 35.0, 27.0, 17.0, 19.0, 17.0, 9.0, 13.0, 4.0, 8.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.640625, -2.550994873046875, -2.46136474609375, -2.371734619140625, -2.2821044921875, -2.192474365234375, -2.10284423828125, -2.013214111328125, -1.923583984375, -1.833953857421875, -1.74432373046875, -1.654693603515625, -1.5650634765625, -1.475433349609375, -1.38580322265625, -1.296173095703125, -1.20654296875, -1.116912841796875, -1.02728271484375, -0.937652587890625, -0.8480224609375, -0.758392333984375, -0.66876220703125, -0.579132080078125, -0.489501953125, -0.399871826171875, -0.31024169921875, -0.220611572265625, -0.1309814453125, -0.041351318359375, 0.04827880859375, 0.137908935546875, 0.2275390625, 0.317169189453125, 0.40679931640625, 0.496429443359375, 0.5860595703125, 0.675689697265625, 0.76531982421875, 0.854949951171875, 0.944580078125, 1.034210205078125, 1.12384033203125, 1.213470458984375, 1.3031005859375, 1.392730712890625, 1.48236083984375, 1.571990966796875, 1.66162109375, 1.751251220703125, 1.84088134765625, 1.930511474609375, 2.0201416015625, 2.109771728515625, 2.19940185546875, 2.289031982421875, 2.378662109375, 2.468292236328125, 2.55792236328125, 2.647552490234375, 2.7371826171875, 2.826812744140625, 2.91644287109375, 3.006072998046875, 3.095703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 5.0, 11.0, 14.0, 26.0, 37.0, 52.0, 74.0, 168.0, 277.0, 624.0, 1575.0, 5280.0, 22629.0, 170816.0, 3611610.0, 335762.0, 34657.0, 7112.0, 2023.0, 774.0, 343.0, 170.0, 88.0, 49.0, 30.0, 27.0, 6.0, 7.0, 7.0, 6.0, 2.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.625, -67.2744140625, -64.923828125, -62.5732421875, -60.22265625, -57.8720703125, -55.521484375, -53.1708984375, -50.8203125, -48.4697265625, -46.119140625, -43.7685546875, -41.41796875, -39.0673828125, -36.716796875, -34.3662109375, -32.015625, -29.6650390625, -27.314453125, -24.9638671875, -22.61328125, -20.2626953125, -17.912109375, -15.5615234375, -13.2109375, -10.8603515625, -8.509765625, -6.1591796875, -3.80859375, -1.4580078125, 0.892578125, 3.2431640625, 5.59375, 7.9443359375, 10.294921875, 12.6455078125, 14.99609375, 17.3466796875, 19.697265625, 22.0478515625, 24.3984375, 26.7490234375, 29.099609375, 31.4501953125, 33.80078125, 36.1513671875, 38.501953125, 40.8525390625, 43.203125, 45.5537109375, 47.904296875, 50.2548828125, 52.60546875, 54.9560546875, 57.306640625, 59.6572265625, 62.0078125, 64.3583984375, 66.708984375, 69.0595703125, 71.41015625, 73.7607421875, 76.111328125, 78.4619140625, 80.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 11.0, 14.0, 31.0, 30.0, 57.0, 82.0, 158.0, 262.0, 650.0, 1669.0, 490.0, 231.0, 135.0, 86.0, 51.0, 23.0, 24.0, 12.0, 17.0, 6.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9820556640625, -9.682861328125, -9.3836669921875, -9.08447265625, -8.7852783203125, -8.486083984375, -8.1868896484375, -7.8876953125, -7.5885009765625, -7.289306640625, -6.9901123046875, -6.69091796875, -6.3917236328125, -6.092529296875, -5.7933349609375, -5.494140625, -5.1949462890625, -4.895751953125, -4.5965576171875, -4.29736328125, -3.9981689453125, -3.698974609375, -3.3997802734375, -3.1005859375, -2.8013916015625, -2.502197265625, -2.2030029296875, -1.90380859375, -1.6046142578125, -1.305419921875, -1.0062255859375, -0.70703125, -0.4078369140625, -0.108642578125, 0.1905517578125, 0.48974609375, 0.7889404296875, 1.088134765625, 1.3873291015625, 1.6865234375, 1.9857177734375, 2.284912109375, 2.5841064453125, 2.88330078125, 3.1824951171875, 3.481689453125, 3.7808837890625, 4.080078125, 4.3792724609375, 4.678466796875, 4.9776611328125, 5.27685546875, 5.5760498046875, 5.875244140625, 6.1744384765625, 6.4736328125, 6.7728271484375, 7.072021484375, 7.3712158203125, 7.67041015625, 7.9696044921875, 8.268798828125, 8.5679931640625, 8.8671875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 10.0, 16.0, 21.0, 31.0, 69.0, 120.0, 176.0, 182.0, 172.0, 93.0, 48.0, 33.0, 18.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.056697845458984, -34.79891586303711, -32.5411376953125, -30.283355712890625, -28.025575637817383, -25.76779556274414, -23.510013580322266, -21.252233505249023, -18.99445343017578, -16.73667335510254, -14.47889232635498, -12.221111297607422, -9.96333122253418, -7.7055511474609375, -5.447770118713379, -3.1899890899658203, -0.9322090148925781, 1.3255715370178223, 3.5833520889282227, 5.841132640838623, 8.098913192749023, 10.356693267822266, 12.614474296569824, 14.872255325317383, 17.130035400390625, 19.387815475463867, 21.64559555053711, 23.903377532958984, 26.161157608032227, 28.41893768310547, 30.676719665527344, 32.93450164794922, 35.192283630371094, 37.45006561279297, 39.70784378051758, 41.96562576293945, 44.22340393066406, 46.48118591308594, 48.73896789550781, 50.99674987792969, 53.2545280456543, 55.51231002807617, 57.77008819580078, 60.027870178222656, 62.28565216064453, 64.54342651367188, 66.80120849609375, 69.05899047851562, 71.3167724609375, 73.57455444335938, 75.83233642578125, 78.0901107788086, 80.34789276123047, 82.60567474365234, 84.86345672607422, 87.1212387084961, 89.37901306152344, 91.63679504394531, 93.89457702636719, 96.15235137939453, 98.4101333618164, 100.66791534423828, 102.92569732666016, 105.18347930908203, 107.4412612915039]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 13.0, 10.0, 13.0, 15.0, 25.0, 20.0, 22.0, 30.0, 41.0, 35.0, 51.0, 47.0, 56.0, 56.0, 46.0, 52.0, 42.0, 46.0, 46.0, 40.0, 38.0, 44.0, 32.0, 38.0, 21.0, 19.0, 24.0, 14.0, 14.0, 10.0, 4.0, 10.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-32.26142120361328, -31.34774398803711, -30.434066772460938, -29.520389556884766, -28.606712341308594, -27.693035125732422, -26.77935791015625, -25.86568260192871, -24.95200538635254, -24.038328170776367, -23.124650955200195, -22.210973739624023, -21.29729652404785, -20.383621215820312, -19.46994400024414, -18.55626678466797, -17.642589569091797, -16.728912353515625, -15.815235137939453, -14.901557922363281, -13.987881660461426, -13.074204444885254, -12.160527229309082, -11.246850967407227, -10.333171844482422, -9.41949462890625, -8.505817413330078, -7.5921406745910645, -6.678463935852051, -5.764786720275879, -4.851109504699707, -3.9374327659606934, -3.0237560272216797, -2.110079050064087, -1.1964019536972046, -0.28272485733032227, 0.6309521198272705, 1.5446290969848633, 2.458306312561035, 3.371983051300049, 4.285660266876221, 5.199337482452393, 6.113014221191406, 7.026691436767578, 7.94036865234375, 8.854045867919922, 9.767723083496094, 10.68139934539795, 11.595076560974121, 12.508753776550293, 13.422430992126465, 14.33610725402832, 15.249784469604492, 16.163461685180664, 17.077138900756836, 17.990816116333008, 18.90449333190918, 19.81817054748535, 20.731847763061523, 21.645524978637695, 22.559202194213867, 23.472877502441406, 24.386554718017578, 25.30023193359375, 26.213909149169922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 6.0, 6.0, 10.0, 17.0, 15.0, 20.0, 38.0, 42.0, 67.0, 109.0, 308.0, 1199.0, 6348.0, 43488.0, 359241.0, 545880.0, 78401.0, 10594.0, 1960.0, 405.0, 143.0, 65.0, 30.0, 32.0, 29.0, 23.0, 13.0, 12.0, 9.0, 7.0, 6.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.5625, -54.90576171875, -53.2490234375, -51.59228515625, -49.935546875, -48.27880859375, -46.6220703125, -44.96533203125, -43.30859375, -41.65185546875, -39.9951171875, -38.33837890625, -36.681640625, -35.02490234375, -33.3681640625, -31.71142578125, -30.0546875, -28.39794921875, -26.7412109375, -25.08447265625, -23.427734375, -21.77099609375, -20.1142578125, -18.45751953125, -16.80078125, -15.14404296875, -13.4873046875, -11.83056640625, -10.173828125, -8.51708984375, -6.8603515625, -5.20361328125, -3.546875, -1.89013671875, -0.2333984375, 1.42333984375, 3.080078125, 4.73681640625, 6.3935546875, 8.05029296875, 9.70703125, 11.36376953125, 13.0205078125, 14.67724609375, 16.333984375, 17.99072265625, 19.6474609375, 21.30419921875, 22.9609375, 24.61767578125, 26.2744140625, 27.93115234375, 29.587890625, 31.24462890625, 32.9013671875, 34.55810546875, 36.21484375, 37.87158203125, 39.5283203125, 41.18505859375, 42.841796875, 44.49853515625, 46.1552734375, 47.81201171875, 49.46875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 11.0, 19.0, 33.0, 52.0, 45.0, 69.0, 75.0, 92.0, 99.0, 97.0, 99.0, 78.0, 65.0, 38.0, 42.0, 26.0, 17.0, 17.0, 5.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6025543212890625, -1.487335205078125, -1.3721160888671875, -1.25689697265625, -1.1416778564453125, -1.026458740234375, -0.9112396240234375, -0.7960205078125, -0.6808013916015625, -0.565582275390625, -0.4503631591796875, -0.33514404296875, -0.2199249267578125, -0.104705810546875, 0.0105133056640625, 0.125732421875, 0.2409515380859375, 0.356170654296875, 0.4713897705078125, 0.58660888671875, 0.7018280029296875, 0.817047119140625, 0.9322662353515625, 1.0474853515625, 1.1627044677734375, 1.277923583984375, 1.3931427001953125, 1.50836181640625, 1.6235809326171875, 1.738800048828125, 1.8540191650390625, 1.96923828125, 2.0844573974609375, 2.199676513671875, 2.3148956298828125, 2.43011474609375, 2.5453338623046875, 2.660552978515625, 2.7757720947265625, 2.8909912109375, 3.0062103271484375, 3.121429443359375, 3.2366485595703125, 3.35186767578125, 3.4670867919921875, 3.582305908203125, 3.6975250244140625, 3.812744140625, 3.9279632568359375, 4.043182373046875, 4.1584014892578125, 4.27362060546875, 4.3888397216796875, 4.504058837890625, 4.6192779541015625, 4.7344970703125, 4.8497161865234375, 4.964935302734375, 5.0801544189453125, 5.19537353515625, 5.3105926513671875, 5.425811767578125, 5.5410308837890625, 5.65625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 14.0, 11.0, 14.0, 17.0, 16.0, 28.0, 31.0, 43.0, 62.0, 99.0, 107.0, 169.0, 249.0, 298.0, 458.0, 718.0, 1270.0, 2468.0, 5914.0, 16521.0, 55698.0, 189123.0, 405187.0, 252774.0, 78923.0, 23462.0, 7773.0, 2993.0, 1467.0, 776.0, 527.0, 368.0, 275.0, 178.0, 137.0, 103.0, 75.0, 57.0, 31.0, 28.0, 36.0, 18.0, 14.0, 4.0, 9.0, 0.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.25, -25.420166015625, -24.59033203125, -23.760498046875, -22.9306640625, -22.100830078125, -21.27099609375, -20.441162109375, -19.611328125, -18.781494140625, -17.95166015625, -17.121826171875, -16.2919921875, -15.462158203125, -14.63232421875, -13.802490234375, -12.97265625, -12.142822265625, -11.31298828125, -10.483154296875, -9.6533203125, -8.823486328125, -7.99365234375, -7.163818359375, -6.333984375, -5.504150390625, -4.67431640625, -3.844482421875, -3.0146484375, -2.184814453125, -1.35498046875, -0.525146484375, 0.3046875, 1.134521484375, 1.96435546875, 2.794189453125, 3.6240234375, 4.453857421875, 5.28369140625, 6.113525390625, 6.943359375, 7.773193359375, 8.60302734375, 9.432861328125, 10.2626953125, 11.092529296875, 11.92236328125, 12.752197265625, 13.58203125, 14.411865234375, 15.24169921875, 16.071533203125, 16.9013671875, 17.731201171875, 18.56103515625, 19.390869140625, 20.220703125, 21.050537109375, 21.88037109375, 22.710205078125, 23.5400390625, 24.369873046875, 25.19970703125, 26.029541015625, 26.859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 5.0, 5.0, 12.0, 11.0, 18.0, 16.0, 17.0, 28.0, 18.0, 31.0, 28.0, 37.0, 40.0, 41.0, 31.0, 58.0, 45.0, 49.0, 40.0, 50.0, 56.0, 46.0, 27.0, 37.0, 37.0, 38.0, 16.0, 23.0, 15.0, 21.0, 21.0, 15.0, 17.0, 10.0, 6.0, 11.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.1953125, -12.8140869140625, -12.432861328125, -12.0516357421875, -11.67041015625, -11.2891845703125, -10.907958984375, -10.5267333984375, -10.1455078125, -9.7642822265625, -9.383056640625, -9.0018310546875, -8.62060546875, -8.2393798828125, -7.858154296875, -7.4769287109375, -7.095703125, -6.7144775390625, -6.333251953125, -5.9520263671875, -5.57080078125, -5.1895751953125, -4.808349609375, -4.4271240234375, -4.0458984375, -3.6646728515625, -3.283447265625, -2.9022216796875, -2.52099609375, -2.1397705078125, -1.758544921875, -1.3773193359375, -0.99609375, -0.6148681640625, -0.233642578125, 0.1475830078125, 0.52880859375, 0.9100341796875, 1.291259765625, 1.6724853515625, 2.0537109375, 2.4349365234375, 2.816162109375, 3.1973876953125, 3.57861328125, 3.9598388671875, 4.341064453125, 4.7222900390625, 5.103515625, 5.4847412109375, 5.865966796875, 6.2471923828125, 6.62841796875, 7.0096435546875, 7.390869140625, 7.7720947265625, 8.1533203125, 8.5345458984375, 8.915771484375, 9.2969970703125, 9.67822265625, 10.0594482421875, 10.440673828125, 10.8218994140625, 11.203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 6.0, 12.0, 16.0, 20.0, 29.0, 49.0, 90.0, 127.0, 225.0, 407.0, 753.0, 1362.0, 3100.0, 7549.0, 21899.0, 73770.0, 258416.0, 424315.0, 179603.0, 50872.0, 15546.0, 5460.0, 2395.0, 1128.0, 569.0, 303.0, 196.0, 132.0, 63.0, 42.0, 26.0, 21.0, 18.0, 18.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.453125, -19.613037109375, -18.77294921875, -17.932861328125, -17.0927734375, -16.252685546875, -15.41259765625, -14.572509765625, -13.732421875, -12.892333984375, -12.05224609375, -11.212158203125, -10.3720703125, -9.531982421875, -8.69189453125, -7.851806640625, -7.01171875, -6.171630859375, -5.33154296875, -4.491455078125, -3.6513671875, -2.811279296875, -1.97119140625, -1.131103515625, -0.291015625, 0.549072265625, 1.38916015625, 2.229248046875, 3.0693359375, 3.909423828125, 4.74951171875, 5.589599609375, 6.4296875, 7.269775390625, 8.10986328125, 8.949951171875, 9.7900390625, 10.630126953125, 11.47021484375, 12.310302734375, 13.150390625, 13.990478515625, 14.83056640625, 15.670654296875, 16.5107421875, 17.350830078125, 18.19091796875, 19.031005859375, 19.87109375, 20.711181640625, 21.55126953125, 22.391357421875, 23.2314453125, 24.071533203125, 24.91162109375, 25.751708984375, 26.591796875, 27.431884765625, 28.27197265625, 29.112060546875, 29.9521484375, 30.792236328125, 31.63232421875, 32.472412109375, 33.3125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 11.0, 11.0, 22.0, 28.0, 32.0, 33.0, 40.0, 47.0, 54.0, 83.0, 90.0, 88.0, 107.0, 66.0, 57.0, 44.0, 44.0, 30.0, 30.0, 16.0, 10.0, 10.0, 4.0, 12.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00262451171875, -0.0025433599948883057, -0.0024622082710266113, -0.002381056547164917, -0.0022999048233032227, -0.0022187530994415283, -0.002137601375579834, -0.0020564496517181396, -0.0019752979278564453, -0.001894146203994751, -0.0018129944801330566, -0.0017318427562713623, -0.001650691032409668, -0.0015695393085479736, -0.0014883875846862793, -0.001407235860824585, -0.0013260841369628906, -0.0012449324131011963, -0.001163780689239502, -0.0010826289653778076, -0.0010014772415161133, -0.0009203255176544189, -0.0008391737937927246, -0.0007580220699310303, -0.0006768703460693359, -0.0005957186222076416, -0.0005145668983459473, -0.00043341517448425293, -0.0003522634506225586, -0.00027111172676086426, -0.00018996000289916992, -0.00010880827903747559, -2.765655517578125e-05, 5.3495168685913086e-05, 0.00013464689254760742, 0.00021579861640930176, 0.0002969503402709961, 0.00037810206413269043, 0.00045925378799438477, 0.0005404055118560791, 0.0006215572357177734, 0.0007027089595794678, 0.0007838606834411621, 0.0008650124073028564, 0.0009461641311645508, 0.0010273158550262451, 0.0011084675788879395, 0.0011896193027496338, 0.0012707710266113281, 0.0013519227504730225, 0.0014330744743347168, 0.0015142261981964111, 0.0015953779220581055, 0.0016765296459197998, 0.0017576813697814941, 0.0018388330936431885, 0.0019199848175048828, 0.002001136541366577, 0.0020822882652282715, 0.002163439989089966, 0.00224459171295166, 0.0023257434368133545, 0.002406895160675049, 0.002488046884536743, 0.0025691986083984375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 2.0, 1.0, 1.0, 7.0, 13.0, 13.0, 20.0, 18.0, 21.0, 31.0, 53.0, 65.0, 103.0, 144.0, 173.0, 336.0, 589.0, 1171.0, 2268.0, 5334.0, 14274.0, 43287.0, 153118.0, 416964.0, 286311.0, 82616.0, 25123.0, 9000.0, 3647.0, 1604.0, 879.0, 443.0, 279.0, 190.0, 125.0, 97.0, 74.0, 37.0, 29.0, 22.0, 19.0, 10.0, 8.0, 6.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.1875, -26.33154296875, -25.4755859375, -24.61962890625, -23.763671875, -22.90771484375, -22.0517578125, -21.19580078125, -20.33984375, -19.48388671875, -18.6279296875, -17.77197265625, -16.916015625, -16.06005859375, -15.2041015625, -14.34814453125, -13.4921875, -12.63623046875, -11.7802734375, -10.92431640625, -10.068359375, -9.21240234375, -8.3564453125, -7.50048828125, -6.64453125, -5.78857421875, -4.9326171875, -4.07666015625, -3.220703125, -2.36474609375, -1.5087890625, -0.65283203125, 0.203125, 1.05908203125, 1.9150390625, 2.77099609375, 3.626953125, 4.48291015625, 5.3388671875, 6.19482421875, 7.05078125, 7.90673828125, 8.7626953125, 9.61865234375, 10.474609375, 11.33056640625, 12.1865234375, 13.04248046875, 13.8984375, 14.75439453125, 15.6103515625, 16.46630859375, 17.322265625, 18.17822265625, 19.0341796875, 19.89013671875, 20.74609375, 21.60205078125, 22.4580078125, 23.31396484375, 24.169921875, 25.02587890625, 25.8818359375, 26.73779296875, 27.59375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 4.0, 8.0, 13.0, 8.0, 16.0, 18.0, 22.0, 37.0, 48.0, 35.0, 66.0, 56.0, 63.0, 81.0, 70.0, 78.0, 59.0, 60.0, 44.0, 36.0, 30.0, 27.0, 26.0, 22.0, 15.0, 3.0, 12.0, 8.0, 8.0, 8.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.265625, -12.8812255859375, -12.496826171875, -12.1124267578125, -11.72802734375, -11.3436279296875, -10.959228515625, -10.5748291015625, -10.1904296875, -9.8060302734375, -9.421630859375, -9.0372314453125, -8.65283203125, -8.2684326171875, -7.884033203125, -7.4996337890625, -7.115234375, -6.7308349609375, -6.346435546875, -5.9620361328125, -5.57763671875, -5.1932373046875, -4.808837890625, -4.4244384765625, -4.0400390625, -3.6556396484375, -3.271240234375, -2.8868408203125, -2.50244140625, -2.1180419921875, -1.733642578125, -1.3492431640625, -0.96484375, -0.5804443359375, -0.196044921875, 0.1883544921875, 0.57275390625, 0.9571533203125, 1.341552734375, 1.7259521484375, 2.1103515625, 2.4947509765625, 2.879150390625, 3.2635498046875, 3.64794921875, 4.0323486328125, 4.416748046875, 4.8011474609375, 5.185546875, 5.5699462890625, 5.954345703125, 6.3387451171875, 6.72314453125, 7.1075439453125, 7.491943359375, 7.8763427734375, 8.2607421875, 8.6451416015625, 9.029541015625, 9.4139404296875, 9.79833984375, 10.1827392578125, 10.567138671875, 10.9515380859375, 11.3359375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 11.0, 29.0, 49.0, 84.0, 164.0, 191.0, 172.0, 127.0, 75.0, 39.0, 23.0, 12.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.6391296386719, -249.26834106445312, -241.89755249023438, -234.52676391601562, -227.1559600830078, -219.78517150878906, -212.4143829345703, -205.04359436035156, -197.67279052734375, -190.302001953125, -182.93121337890625, -175.5604248046875, -168.1896209716797, -160.81883239746094, -153.4480438232422, -146.07725524902344, -138.7064666748047, -131.33567810058594, -123.96488189697266, -116.5940933227539, -109.22329711914062, -101.85250854492188, -94.48171997070312, -87.11093139648438, -79.7401351928711, -72.36934661865234, -64.99855041503906, -57.62776184082031, -50.2569694519043, -42.88617706298828, -35.51538848876953, -28.144596099853516, -20.7738037109375, -13.4030122756958, -6.032220840454102, 1.3385696411132812, 8.709362030029297, 16.080154418945312, 23.450942993164062, 30.821735382080078, 38.192527770996094, 45.56332015991211, 52.934112548828125, 60.304901123046875, 67.67568969726562, 75.0464859008789, 82.41727447509766, 89.78807067871094, 97.15885925292969, 104.52964782714844, 111.90044403076172, 119.27123260498047, 126.64202880859375, 134.0128173828125, 141.38360595703125, 148.75439453125, 156.12518310546875, 163.4959716796875, 170.86676025390625, 178.237548828125, 185.6083526611328, 192.97914123535156, 200.3499298095703, 207.72071838378906, 215.09152221679688]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 11.0, 7.0, 12.0, 22.0, 18.0, 28.0, 33.0, 31.0, 46.0, 40.0, 47.0, 51.0, 63.0, 50.0, 64.0, 47.0, 44.0, 60.0, 49.0, 49.0, 37.0, 35.0, 30.0, 26.0, 19.0, 19.0, 15.0, 13.0, 7.0, 15.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-142.22293090820312, -138.83920288085938, -135.45547485351562, -132.07174682617188, -128.6880340576172, -125.30430603027344, -121.92057800292969, -118.53684997558594, -115.15312957763672, -111.76940155029297, -108.38568115234375, -105.001953125, -101.61822509765625, -98.23450469970703, -94.85077667236328, -91.46705627441406, -88.08332824707031, -84.69960021972656, -81.31587982177734, -77.9321517944336, -74.54842376708984, -71.16470336914062, -67.78097534179688, -64.39724731445312, -61.013519287109375, -57.62979507446289, -54.24606704711914, -50.862342834472656, -47.47861862182617, -44.09489440917969, -40.71116638183594, -37.32744216918945, -33.94371795654297, -30.55999183654785, -27.176267623901367, -23.79254150390625, -20.408817291259766, -17.02509117126465, -13.641365051269531, -10.257640838623047, -6.87391471862793, -3.49018931388855, -0.10646390914916992, 3.277261734008789, 6.66098690032959, 10.04471206665039, 13.428438186645508, 16.812162399291992, 20.19588851928711, 23.579614639282227, 26.96333885192871, 30.347064971923828, 33.73078918457031, 37.11451721191406, 40.49824142456055, 43.88196563720703, 47.26569366455078, 50.649417877197266, 54.033145904541016, 57.4168701171875, 60.800594329833984, 64.18431854248047, 67.56804656982422, 70.95176696777344, 74.33549499511719]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 4.0, 10.0, 13.0, 21.0, 35.0, 57.0, 97.0, 235.0, 1787.0, 42350.0, 4097835.0, 49331.0, 1845.0, 302.0, 132.0, 93.0, 42.0, 34.0, 28.0, 13.0, 12.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.75, -140.25390625, -134.7578125, -129.26171875, -123.765625, -118.26953125, -112.7734375, -107.27734375, -101.78125, -96.28515625, -90.7890625, -85.29296875, -79.796875, -74.30078125, -68.8046875, -63.30859375, -57.8125, -52.31640625, -46.8203125, -41.32421875, -35.828125, -30.33203125, -24.8359375, -19.33984375, -13.84375, -8.34765625, -2.8515625, 2.64453125, 8.140625, 13.63671875, 19.1328125, 24.62890625, 30.125, 35.62109375, 41.1171875, 46.61328125, 52.109375, 57.60546875, 63.1015625, 68.59765625, 74.09375, 79.58984375, 85.0859375, 90.58203125, 96.078125, 101.57421875, 107.0703125, 112.56640625, 118.0625, 123.55859375, 129.0546875, 134.55078125, 140.046875, 145.54296875, 151.0390625, 156.53515625, 162.03125, 167.52734375, 173.0234375, 178.51953125, 184.015625, 189.51171875, 195.0078125, 200.50390625, 206.0]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 10.0, 8.0, 15.0, 19.0, 34.0, 42.0, 66.0, 70.0, 94.0, 103.0, 104.0, 89.0, 95.0, 76.0, 65.0, 40.0, 23.0, 20.0, 17.0, 6.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.072021484375, -3.91748046875, -3.762939453125, -3.6083984375, -3.453857421875, -3.29931640625, -3.144775390625, -2.990234375, -2.835693359375, -2.68115234375, -2.526611328125, -2.3720703125, -2.217529296875, -2.06298828125, -1.908447265625, -1.75390625, -1.599365234375, -1.44482421875, -1.290283203125, -1.1357421875, -0.981201171875, -0.82666015625, -0.672119140625, -0.517578125, -0.363037109375, -0.20849609375, -0.053955078125, 0.1005859375, 0.255126953125, 0.40966796875, 0.564208984375, 0.71875, 0.873291015625, 1.02783203125, 1.182373046875, 1.3369140625, 1.491455078125, 1.64599609375, 1.800537109375, 1.955078125, 2.109619140625, 2.26416015625, 2.418701171875, 2.5732421875, 2.727783203125, 2.88232421875, 3.036865234375, 3.19140625, 3.345947265625, 3.50048828125, 3.655029296875, 3.8095703125, 3.964111328125, 4.11865234375, 4.273193359375, 4.427734375, 4.582275390625, 4.73681640625, 4.891357421875, 5.0458984375, 5.200439453125, 5.35498046875, 5.509521484375, 5.6640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 12.0, 7.0, 11.0, 15.0, 16.0, 21.0, 24.0, 26.0, 45.0, 60.0, 94.0, 121.0, 191.0, 313.0, 585.0, 1165.0, 2797.0, 7862.0, 26771.0, 120375.0, 1201273.0, 2622468.0, 160235.0, 34006.0, 9535.0, 3259.0, 1391.0, 655.0, 321.0, 205.0, 140.0, 76.0, 45.0, 41.0, 24.0, 24.0, 18.0, 13.0, 11.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-53.78125, -52.248046875, -50.71484375, -49.181640625, -47.6484375, -46.115234375, -44.58203125, -43.048828125, -41.515625, -39.982421875, -38.44921875, -36.916015625, -35.3828125, -33.849609375, -32.31640625, -30.783203125, -29.25, -27.716796875, -26.18359375, -24.650390625, -23.1171875, -21.583984375, -20.05078125, -18.517578125, -16.984375, -15.451171875, -13.91796875, -12.384765625, -10.8515625, -9.318359375, -7.78515625, -6.251953125, -4.71875, -3.185546875, -1.65234375, -0.119140625, 1.4140625, 2.947265625, 4.48046875, 6.013671875, 7.546875, 9.080078125, 10.61328125, 12.146484375, 13.6796875, 15.212890625, 16.74609375, 18.279296875, 19.8125, 21.345703125, 22.87890625, 24.412109375, 25.9453125, 27.478515625, 29.01171875, 30.544921875, 32.078125, 33.611328125, 35.14453125, 36.677734375, 38.2109375, 39.744140625, 41.27734375, 42.810546875, 44.34375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 12.0, 9.0, 33.0, 23.0, 49.0, 79.0, 141.0, 281.0, 725.0, 1656.0, 511.0, 203.0, 130.0, 63.0, 60.0, 35.0, 18.0, 11.0, 10.0, 6.0, 7.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.015625, -15.645751953125, -15.27587890625, -14.906005859375, -14.5361328125, -14.166259765625, -13.79638671875, -13.426513671875, -13.056640625, -12.686767578125, -12.31689453125, -11.947021484375, -11.5771484375, -11.207275390625, -10.83740234375, -10.467529296875, -10.09765625, -9.727783203125, -9.35791015625, -8.988037109375, -8.6181640625, -8.248291015625, -7.87841796875, -7.508544921875, -7.138671875, -6.768798828125, -6.39892578125, -6.029052734375, -5.6591796875, -5.289306640625, -4.91943359375, -4.549560546875, -4.1796875, -3.809814453125, -3.43994140625, -3.070068359375, -2.7001953125, -2.330322265625, -1.96044921875, -1.590576171875, -1.220703125, -0.850830078125, -0.48095703125, -0.111083984375, 0.2587890625, 0.628662109375, 0.99853515625, 1.368408203125, 1.73828125, 2.108154296875, 2.47802734375, 2.847900390625, 3.2177734375, 3.587646484375, 3.95751953125, 4.327392578125, 4.697265625, 5.067138671875, 5.43701171875, 5.806884765625, 6.1767578125, 6.546630859375, 6.91650390625, 7.286376953125, 7.65625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 14.0, 50.0, 118.0, 200.0, 263.0, 172.0, 107.0, 42.0, 11.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.45655822753906, -179.21998596191406, -174.9833984375, -170.746826171875, -166.51025390625, -162.273681640625, -158.037109375, -153.80052185058594, -149.56394958496094, -145.32737731933594, -141.09078979492188, -136.85421752929688, -132.61764526367188, -128.38107299804688, -124.14449310302734, -119.90791320800781, -115.67134094238281, -111.43476867675781, -107.19818878173828, -102.96160888671875, -98.72503662109375, -94.48846435546875, -90.25188446044922, -86.01530456542969, -81.77873229980469, -77.54216003417969, -73.30558013916016, -69.06900024414062, -64.83242797851562, -60.59585189819336, -56.359275817871094, -52.12269973754883, -47.88611602783203, -43.649539947509766, -39.4129638671875, -35.176387786865234, -30.93981170654297, -26.703235626220703, -22.466659545898438, -18.230083465576172, -13.993507385253906, -9.75693130493164, -5.520355224609375, -1.2837791442871094, 2.9527969360351562, 7.189373016357422, 11.425949096679688, 15.662525177001953, 19.89910125732422, 24.135677337646484, 28.37225341796875, 32.608829498291016, 36.84540557861328, 41.08198165893555, 45.31855773925781, 49.55513381958008, 53.791709899902344, 58.02828598022461, 62.264862060546875, 66.50143432617188, 70.7380142211914, 74.97459411621094, 79.21116638183594, 83.44773864746094, 87.68431854248047]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 5.0, 8.0, 10.0, 12.0, 20.0, 13.0, 31.0, 18.0, 29.0, 20.0, 33.0, 36.0, 45.0, 42.0, 43.0, 34.0, 40.0, 41.0, 35.0, 35.0, 51.0, 41.0, 41.0, 36.0, 32.0, 26.0, 31.0, 25.0, 18.0, 20.0, 17.0, 21.0, 9.0, 17.0, 8.0, 14.0, 7.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.88884735107422, -30.899494171142578, -29.91014289855957, -28.92078971862793, -27.931438446044922, -26.94208526611328, -25.95273208618164, -24.963380813598633, -23.974027633666992, -22.98467445373535, -21.995323181152344, -21.005970001220703, -20.016618728637695, -19.027265548706055, -18.037914276123047, -17.048561096191406, -16.059207916259766, -15.069855690002441, -14.080503463745117, -13.091150283813477, -12.101798057556152, -11.112445831298828, -10.123093605041504, -9.13374137878418, -8.144390106201172, -7.155037879943848, -6.165685176849365, -5.176332950592041, -4.186980247497559, -3.1976280212402344, -2.20827579498291, -1.2189230918884277, -0.2295703887939453, 0.7597820162773132, 1.7491344213485718, 2.7384867668151855, 3.727839231491089, 4.717191696166992, 5.706543922424316, 6.695896625518799, 7.685248851776123, 8.674601554870605, 9.66395378112793, 10.653306007385254, 11.642658233642578, 12.632011413574219, 13.621362686157227, 14.610715866088867, 15.600068092346191, 16.589420318603516, 17.578773498535156, 18.568124771118164, 19.557477951049805, 20.546829223632812, 21.536182403564453, 22.525535583496094, 23.5148868560791, 24.504240036010742, 25.49359130859375, 26.48294448852539, 27.4722957611084, 28.46164894104004, 29.451000213623047, 30.440353393554688, 31.429706573486328]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 13.0, 12.0, 8.0, 19.0, 17.0, 34.0, 28.0, 32.0, 55.0, 75.0, 125.0, 234.0, 442.0, 1133.0, 3194.0, 10380.0, 36794.0, 135507.0, 388350.0, 328191.0, 103536.0, 27934.0, 8031.0, 2475.0, 947.0, 379.0, 191.0, 107.0, 83.0, 46.0, 33.0, 32.0, 17.0, 17.0, 18.0, 8.0, 10.0, 4.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-30.203125, -29.284912109375, -28.36669921875, -27.448486328125, -26.5302734375, -25.612060546875, -24.69384765625, -23.775634765625, -22.857421875, -21.939208984375, -21.02099609375, -20.102783203125, -19.1845703125, -18.266357421875, -17.34814453125, -16.429931640625, -15.51171875, -14.593505859375, -13.67529296875, -12.757080078125, -11.8388671875, -10.920654296875, -10.00244140625, -9.084228515625, -8.166015625, -7.247802734375, -6.32958984375, -5.411376953125, -4.4931640625, -3.574951171875, -2.65673828125, -1.738525390625, -0.8203125, 0.097900390625, 1.01611328125, 1.934326171875, 2.8525390625, 3.770751953125, 4.68896484375, 5.607177734375, 6.525390625, 7.443603515625, 8.36181640625, 9.280029296875, 10.1982421875, 11.116455078125, 12.03466796875, 12.952880859375, 13.87109375, 14.789306640625, 15.70751953125, 16.625732421875, 17.5439453125, 18.462158203125, 19.38037109375, 20.298583984375, 21.216796875, 22.135009765625, 23.05322265625, 23.971435546875, 24.8896484375, 25.807861328125, 26.72607421875, 27.644287109375, 28.5625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 8.0, 26.0, 18.0, 35.0, 40.0, 60.0, 61.0, 75.0, 100.0, 91.0, 93.0, 84.0, 80.0, 62.0, 53.0, 39.0, 30.0, 16.0, 14.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.03277587890625, -3.8819580078125, -3.73114013671875, -3.580322265625, -3.42950439453125, -3.2786865234375, -3.12786865234375, -2.97705078125, -2.82623291015625, -2.6754150390625, -2.52459716796875, -2.373779296875, -2.22296142578125, -2.0721435546875, -1.92132568359375, -1.7705078125, -1.61968994140625, -1.4688720703125, -1.31805419921875, -1.167236328125, -1.01641845703125, -0.8656005859375, -0.71478271484375, -0.56396484375, -0.41314697265625, -0.2623291015625, -0.11151123046875, 0.039306640625, 0.19012451171875, 0.3409423828125, 0.49176025390625, 0.642578125, 0.79339599609375, 0.9442138671875, 1.09503173828125, 1.245849609375, 1.39666748046875, 1.5474853515625, 1.69830322265625, 1.84912109375, 1.99993896484375, 2.1507568359375, 2.30157470703125, 2.452392578125, 2.60321044921875, 2.7540283203125, 2.90484619140625, 3.0556640625, 3.20648193359375, 3.3572998046875, 3.50811767578125, 3.658935546875, 3.80975341796875, 3.9605712890625, 4.11138916015625, 4.26220703125, 4.41302490234375, 4.5638427734375, 4.71466064453125, 4.865478515625, 5.01629638671875, 5.1671142578125, 5.31793212890625, 5.46875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 3.0, 4.0, 9.0, 7.0, 14.0, 23.0, 22.0, 44.0, 53.0, 67.0, 88.0, 120.0, 190.0, 306.0, 418.0, 626.0, 1136.0, 2296.0, 6296.0, 23377.0, 108402.0, 439809.0, 358500.0, 79307.0, 17573.0, 5044.0, 1984.0, 1025.0, 561.0, 373.0, 251.0, 178.0, 116.0, 94.0, 69.0, 40.0, 37.0, 29.0, 12.0, 15.0, 7.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.75, -30.72265625, -29.6953125, -28.66796875, -27.640625, -26.61328125, -25.5859375, -24.55859375, -23.53125, -22.50390625, -21.4765625, -20.44921875, -19.421875, -18.39453125, -17.3671875, -16.33984375, -15.3125, -14.28515625, -13.2578125, -12.23046875, -11.203125, -10.17578125, -9.1484375, -8.12109375, -7.09375, -6.06640625, -5.0390625, -4.01171875, -2.984375, -1.95703125, -0.9296875, 0.09765625, 1.125, 2.15234375, 3.1796875, 4.20703125, 5.234375, 6.26171875, 7.2890625, 8.31640625, 9.34375, 10.37109375, 11.3984375, 12.42578125, 13.453125, 14.48046875, 15.5078125, 16.53515625, 17.5625, 18.58984375, 19.6171875, 20.64453125, 21.671875, 22.69921875, 23.7265625, 24.75390625, 25.78125, 26.80859375, 27.8359375, 28.86328125, 29.890625, 30.91796875, 31.9453125, 32.97265625, 34.0]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 8.0, 7.0, 12.0, 17.0, 23.0, 17.0, 33.0, 27.0, 25.0, 37.0, 34.0, 40.0, 42.0, 44.0, 49.0, 46.0, 51.0, 44.0, 50.0, 40.0, 46.0, 31.0, 39.0, 38.0, 23.0, 26.0, 17.0, 19.0, 19.0, 14.0, 8.0, 8.0, 9.0, 7.0, 10.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5234375, -14.0626220703125, -13.601806640625, -13.1409912109375, -12.68017578125, -12.2193603515625, -11.758544921875, -11.2977294921875, -10.8369140625, -10.3760986328125, -9.915283203125, -9.4544677734375, -8.99365234375, -8.5328369140625, -8.072021484375, -7.6112060546875, -7.150390625, -6.6895751953125, -6.228759765625, -5.7679443359375, -5.30712890625, -4.8463134765625, -4.385498046875, -3.9246826171875, -3.4638671875, -3.0030517578125, -2.542236328125, -2.0814208984375, -1.62060546875, -1.1597900390625, -0.698974609375, -0.2381591796875, 0.22265625, 0.6834716796875, 1.144287109375, 1.6051025390625, 2.06591796875, 2.5267333984375, 2.987548828125, 3.4483642578125, 3.9091796875, 4.3699951171875, 4.830810546875, 5.2916259765625, 5.75244140625, 6.2132568359375, 6.674072265625, 7.1348876953125, 7.595703125, 8.0565185546875, 8.517333984375, 8.9781494140625, 9.43896484375, 9.8997802734375, 10.360595703125, 10.8214111328125, 11.2822265625, 11.7430419921875, 12.203857421875, 12.6646728515625, 13.12548828125, 13.5863037109375, 14.047119140625, 14.5079345703125, 14.96875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 8.0, 16.0, 19.0, 35.0, 54.0, 74.0, 152.0, 214.0, 420.0, 741.0, 1674.0, 4044.0, 11536.0, 41975.0, 210372.0, 545070.0, 178645.0, 36264.0, 10246.0, 3722.0, 1567.0, 773.0, 353.0, 240.0, 116.0, 80.0, 39.0, 26.0, 19.0, 17.0, 7.0, 6.0, 3.0, 7.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.578125, -21.755615234375, -20.93310546875, -20.110595703125, -19.2880859375, -18.465576171875, -17.64306640625, -16.820556640625, -15.998046875, -15.175537109375, -14.35302734375, -13.530517578125, -12.7080078125, -11.885498046875, -11.06298828125, -10.240478515625, -9.41796875, -8.595458984375, -7.77294921875, -6.950439453125, -6.1279296875, -5.305419921875, -4.48291015625, -3.660400390625, -2.837890625, -2.015380859375, -1.19287109375, -0.370361328125, 0.4521484375, 1.274658203125, 2.09716796875, 2.919677734375, 3.7421875, 4.564697265625, 5.38720703125, 6.209716796875, 7.0322265625, 7.854736328125, 8.67724609375, 9.499755859375, 10.322265625, 11.144775390625, 11.96728515625, 12.789794921875, 13.6123046875, 14.434814453125, 15.25732421875, 16.079833984375, 16.90234375, 17.724853515625, 18.54736328125, 19.369873046875, 20.1923828125, 21.014892578125, 21.83740234375, 22.659912109375, 23.482421875, 24.304931640625, 25.12744140625, 25.949951171875, 26.7724609375, 27.594970703125, 28.41748046875, 29.239990234375, 30.0625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 12.0, 10.0, 24.0, 34.0, 40.0, 39.0, 47.0, 72.0, 74.0, 77.0, 89.0, 75.0, 69.0, 65.0, 62.0, 42.0, 41.0, 21.0, 20.0, 15.0, 16.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017547607421875, -0.0016904175281524658, -0.0016260743141174316, -0.0015617311000823975, -0.0014973878860473633, -0.001433044672012329, -0.001368701457977295, -0.0013043582439422607, -0.0012400150299072266, -0.0011756718158721924, -0.0011113286018371582, -0.001046985387802124, -0.0009826421737670898, -0.0009182989597320557, -0.0008539557456970215, -0.0007896125316619873, -0.0007252693176269531, -0.0006609261035919189, -0.0005965828895568848, -0.0005322396755218506, -0.0004678964614868164, -0.0004035532474517822, -0.00033921003341674805, -0.00027486681938171387, -0.0002105236053466797, -0.0001461803913116455, -8.183717727661133e-05, -1.749396324157715e-05, 4.684925079345703e-05, 0.00011119246482849121, 0.0001755356788635254, 0.00023987889289855957, 0.00030422210693359375, 0.00036856532096862793, 0.0004329085350036621, 0.0004972517490386963, 0.0005615949630737305, 0.0006259381771087646, 0.0006902813911437988, 0.000754624605178833, 0.0008189678192138672, 0.0008833110332489014, 0.0009476542472839355, 0.0010119974613189697, 0.001076340675354004, 0.001140683889389038, 0.0012050271034240723, 0.0012693703174591064, 0.0013337135314941406, 0.0013980567455291748, 0.001462399959564209, 0.0015267431735992432, 0.0015910863876342773, 0.0016554296016693115, 0.0017197728157043457, 0.0017841160297393799, 0.001848459243774414, 0.0019128024578094482, 0.0019771456718444824, 0.0020414888858795166, 0.0021058320999145508, 0.002170175313949585, 0.002234518527984619, 0.0022988617420196533, 0.0023632049560546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 2.0, 6.0, 9.0, 14.0, 18.0, 34.0, 46.0, 71.0, 132.0, 232.0, 393.0, 780.0, 1727.0, 4260.0, 16191.0, 121039.0, 637198.0, 229432.0, 26747.0, 5893.0, 2169.0, 948.0, 506.0, 296.0, 138.0, 104.0, 64.0, 26.0, 17.0, 15.0, 4.0, 8.0, 5.0, 10.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.59375, -44.382568359375, -43.17138671875, -41.960205078125, -40.7490234375, -39.537841796875, -38.32666015625, -37.115478515625, -35.904296875, -34.693115234375, -33.48193359375, -32.270751953125, -31.0595703125, -29.848388671875, -28.63720703125, -27.426025390625, -26.21484375, -25.003662109375, -23.79248046875, -22.581298828125, -21.3701171875, -20.158935546875, -18.94775390625, -17.736572265625, -16.525390625, -15.314208984375, -14.10302734375, -12.891845703125, -11.6806640625, -10.469482421875, -9.25830078125, -8.047119140625, -6.8359375, -5.624755859375, -4.41357421875, -3.202392578125, -1.9912109375, -0.780029296875, 0.43115234375, 1.642333984375, 2.853515625, 4.064697265625, 5.27587890625, 6.487060546875, 7.6982421875, 8.909423828125, 10.12060546875, 11.331787109375, 12.54296875, 13.754150390625, 14.96533203125, 16.176513671875, 17.3876953125, 18.598876953125, 19.81005859375, 21.021240234375, 22.232421875, 23.443603515625, 24.65478515625, 25.865966796875, 27.0771484375, 28.288330078125, 29.49951171875, 30.710693359375, 31.921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 12.0, 10.0, 23.0, 34.0, 51.0, 66.0, 78.0, 79.0, 88.0, 95.0, 95.0, 76.0, 68.0, 58.0, 46.0, 33.0, 19.0, 19.0, 13.0, 7.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.4141845703125, -13.804931640625, -13.1956787109375, -12.58642578125, -11.9771728515625, -11.367919921875, -10.7586669921875, -10.1494140625, -9.5401611328125, -8.930908203125, -8.3216552734375, -7.71240234375, -7.1031494140625, -6.493896484375, -5.8846435546875, -5.275390625, -4.6661376953125, -4.056884765625, -3.4476318359375, -2.83837890625, -2.2291259765625, -1.619873046875, -1.0106201171875, -0.4013671875, 0.2078857421875, 0.817138671875, 1.4263916015625, 2.03564453125, 2.6448974609375, 3.254150390625, 3.8634033203125, 4.47265625, 5.0819091796875, 5.691162109375, 6.3004150390625, 6.90966796875, 7.5189208984375, 8.128173828125, 8.7374267578125, 9.3466796875, 9.9559326171875, 10.565185546875, 11.1744384765625, 11.78369140625, 12.3929443359375, 13.002197265625, 13.6114501953125, 14.220703125, 14.8299560546875, 15.439208984375, 16.0484619140625, 16.65771484375, 17.2669677734375, 17.876220703125, 18.4854736328125, 19.0947265625, 19.7039794921875, 20.313232421875, 20.9224853515625, 21.53173828125, 22.1409912109375, 22.750244140625, 23.3594970703125, 23.96875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 11.0, 34.0, 112.0, 229.0, 309.0, 192.0, 83.0, 20.0, 8.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-598.8878173828125, -586.2535400390625, -573.6192626953125, -560.9849853515625, -548.3506469726562, -535.7163696289062, -523.0820922851562, -510.44781494140625, -497.81353759765625, -485.17926025390625, -472.5449523925781, -459.9106750488281, -447.2763977050781, -434.6421203613281, -422.0078125, -409.37353515625, -396.7392578125, -384.10498046875, -371.4706726074219, -358.8363952636719, -346.2021179199219, -333.5678405761719, -320.93353271484375, -308.29925537109375, -295.6649475097656, -283.0306701660156, -270.3963623046875, -257.7620849609375, -245.1278076171875, -232.49351501464844, -219.85922241210938, -207.22494506835938, -194.59066772460938, -181.9563751220703, -169.3220977783203, -156.68780517578125, -144.05352783203125, -131.4192352294922, -118.78495025634766, -106.15066528320312, -93.5163803100586, -80.88209533691406, -68.24781036376953, -55.613521575927734, -42.9792366027832, -30.344951629638672, -17.710662841796875, -5.076377868652344, 7.5579071044921875, 20.19219207763672, 32.82647705078125, 45.46076583862305, 58.09505081176758, 70.72933959960938, 83.3636245727539, 95.99790954589844, 108.63219451904297, 121.2664794921875, 133.90077209472656, 146.53504943847656, 159.16934204101562, 171.80361938476562, 184.4379119873047, 197.07220458984375, 209.70648193359375]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 8.0, 11.0, 12.0, 19.0, 19.0, 27.0, 39.0, 40.0, 33.0, 51.0, 47.0, 49.0, 41.0, 49.0, 62.0, 44.0, 41.0, 57.0, 49.0, 47.0, 44.0, 37.0, 30.0, 37.0, 16.0, 20.0, 9.0, 14.0, 8.0, 9.0, 9.0, 3.0, 4.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.0939483642578, -127.42398071289062, -123.75401306152344, -120.08403778076172, -116.41407012939453, -112.74410247802734, -109.07412719726562, -105.40415954589844, -101.73419189453125, -98.06422424316406, -94.39425659179688, -90.72428131103516, -87.05431365966797, -83.38434600830078, -79.71437072753906, -76.04440307617188, -72.37443542480469, -68.7044677734375, -65.03450012207031, -61.364524841308594, -57.694557189941406, -54.02458953857422, -50.354618072509766, -46.68464660644531, -43.014678955078125, -39.34471130371094, -35.674739837646484, -32.00476837158203, -28.334800720214844, -24.664831161499023, -20.994861602783203, -17.324892044067383, -13.654922485351562, -9.984952926635742, -6.314983367919922, -2.6450138092041016, 1.0249557495117188, 4.694925308227539, 8.36489486694336, 12.03486442565918, 15.704833984375, 19.37480354309082, 23.04477310180664, 26.71474266052246, 30.38471221923828, 34.05467987060547, 37.72465133666992, 41.394622802734375, 45.06459045410156, 48.73455810546875, 52.4045295715332, 56.074501037597656, 59.744468688964844, 63.41443634033203, 67.08441162109375, 70.75437927246094, 74.42434692382812, 78.09431457519531, 81.7642822265625, 85.43425750732422, 89.1042251586914, 92.7741928100586, 96.44416809082031, 100.1141357421875, 103.78410339355469]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 7.0, 6.0, 3.0, 7.0, 12.0, 11.0, 18.0, 28.0, 37.0, 36.0, 52.0, 89.0, 139.0, 272.0, 449.0, 924.0, 1971.0, 4639.0, 13197.0, 45641.0, 272647.0, 3532624.0, 255167.0, 44081.0, 13010.0, 4775.0, 2015.0, 1013.0, 478.0, 274.0, 211.0, 119.0, 81.0, 55.0, 48.0, 30.0, 23.0, 23.0, 19.0, 9.0, 11.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-37.78125, -36.455078125, -35.12890625, -33.802734375, -32.4765625, -31.150390625, -29.82421875, -28.498046875, -27.171875, -25.845703125, -24.51953125, -23.193359375, -21.8671875, -20.541015625, -19.21484375, -17.888671875, -16.5625, -15.236328125, -13.91015625, -12.583984375, -11.2578125, -9.931640625, -8.60546875, -7.279296875, -5.953125, -4.626953125, -3.30078125, -1.974609375, -0.6484375, 0.677734375, 2.00390625, 3.330078125, 4.65625, 5.982421875, 7.30859375, 8.634765625, 9.9609375, 11.287109375, 12.61328125, 13.939453125, 15.265625, 16.591796875, 17.91796875, 19.244140625, 20.5703125, 21.896484375, 23.22265625, 24.548828125, 25.875, 27.201171875, 28.52734375, 29.853515625, 31.1796875, 32.505859375, 33.83203125, 35.158203125, 36.484375, 37.810546875, 39.13671875, 40.462890625, 41.7890625, 43.115234375, 44.44140625, 45.767578125, 47.09375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 4.0, 7.0, 15.0, 19.0, 24.0, 34.0, 23.0, 32.0, 54.0, 50.0, 64.0, 79.0, 78.0, 68.0, 57.0, 48.0, 51.0, 68.0, 50.0, 44.0, 20.0, 24.0, 32.0, 14.0, 15.0, 11.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.595703125, -3.469329833984375, -3.34295654296875, -3.216583251953125, -3.0902099609375, -2.963836669921875, -2.83746337890625, -2.711090087890625, -2.584716796875, -2.458343505859375, -2.33197021484375, -2.205596923828125, -2.0792236328125, -1.952850341796875, -1.82647705078125, -1.700103759765625, -1.57373046875, -1.447357177734375, -1.32098388671875, -1.194610595703125, -1.0682373046875, -0.941864013671875, -0.81549072265625, -0.689117431640625, -0.562744140625, -0.436370849609375, -0.30999755859375, -0.183624267578125, -0.0572509765625, 0.069122314453125, 0.19549560546875, 0.321868896484375, 0.4482421875, 0.574615478515625, 0.70098876953125, 0.827362060546875, 0.9537353515625, 1.080108642578125, 1.20648193359375, 1.332855224609375, 1.459228515625, 1.585601806640625, 1.71197509765625, 1.838348388671875, 1.9647216796875, 2.091094970703125, 2.21746826171875, 2.343841552734375, 2.47021484375, 2.596588134765625, 2.72296142578125, 2.849334716796875, 2.9757080078125, 3.102081298828125, 3.22845458984375, 3.354827880859375, 3.481201171875, 3.607574462890625, 3.73394775390625, 3.860321044921875, 3.9866943359375, 4.113067626953125, 4.23944091796875, 4.365814208984375, 4.4921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 6.0, 10.0, 9.0, 10.0, 11.0, 21.0, 16.0, 29.0, 21.0, 34.0, 44.0, 61.0, 107.0, 238.0, 588.0, 1898.0, 11325.0, 149555.0, 3819637.0, 194009.0, 13147.0, 2219.0, 590.0, 202.0, 117.0, 74.0, 58.0, 47.0, 23.0, 26.0, 20.0, 20.0, 19.0, 15.0, 10.0, 12.0, 11.0, 14.0, 3.0, 1.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-71.8125, -69.4609375, -67.109375, -64.7578125, -62.40625, -60.0546875, -57.703125, -55.3515625, -53.0, -50.6484375, -48.296875, -45.9453125, -43.59375, -41.2421875, -38.890625, -36.5390625, -34.1875, -31.8359375, -29.484375, -27.1328125, -24.78125, -22.4296875, -20.078125, -17.7265625, -15.375, -13.0234375, -10.671875, -8.3203125, -5.96875, -3.6171875, -1.265625, 1.0859375, 3.4375, 5.7890625, 8.140625, 10.4921875, 12.84375, 15.1953125, 17.546875, 19.8984375, 22.25, 24.6015625, 26.953125, 29.3046875, 31.65625, 34.0078125, 36.359375, 38.7109375, 41.0625, 43.4140625, 45.765625, 48.1171875, 50.46875, 52.8203125, 55.171875, 57.5234375, 59.875, 62.2265625, 64.578125, 66.9296875, 69.28125, 71.6328125, 73.984375, 76.3359375, 78.6875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 15.0, 28.0, 55.0, 155.0, 496.0, 2310.0, 697.0, 186.0, 75.0, 27.0, 16.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7890625, -9.0706787109375, -8.352294921875, -7.6339111328125, -6.91552734375, -6.1971435546875, -5.478759765625, -4.7603759765625, -4.0419921875, -3.3236083984375, -2.605224609375, -1.8868408203125, -1.16845703125, -0.4500732421875, 0.268310546875, 0.9866943359375, 1.705078125, 2.4234619140625, 3.141845703125, 3.8602294921875, 4.57861328125, 5.2969970703125, 6.015380859375, 6.7337646484375, 7.4521484375, 8.1705322265625, 8.888916015625, 9.6072998046875, 10.32568359375, 11.0440673828125, 11.762451171875, 12.4808349609375, 13.19921875, 13.9176025390625, 14.635986328125, 15.3543701171875, 16.07275390625, 16.7911376953125, 17.509521484375, 18.2279052734375, 18.9462890625, 19.6646728515625, 20.383056640625, 21.1014404296875, 21.81982421875, 22.5382080078125, 23.256591796875, 23.9749755859375, 24.693359375, 25.4117431640625, 26.130126953125, 26.8485107421875, 27.56689453125, 28.2852783203125, 29.003662109375, 29.7220458984375, 30.4404296875, 31.1588134765625, 31.877197265625, 32.5955810546875, 33.31396484375, 34.0323486328125, 34.750732421875, 35.4691162109375, 36.1875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 13.0, 15.0, 19.0, 36.0, 72.0, 115.0, 165.0, 184.0, 123.0, 105.0, 76.0, 27.0, 23.0, 12.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.16114807128906, -78.63786315917969, -76.11457824707031, -73.59130096435547, -71.0680160522461, -68.54473114013672, -66.02144622802734, -63.49816131591797, -60.97488021850586, -58.451595306396484, -55.928314208984375, -53.405029296875, -50.881744384765625, -48.358463287353516, -45.83517837524414, -43.31189727783203, -40.788612365722656, -38.26532745361328, -35.74204635620117, -33.2187614440918, -30.695478439331055, -28.172195434570312, -25.648910522460938, -23.125627517700195, -20.602344512939453, -18.07906150817871, -15.555777549743652, -13.032493591308594, -10.509210586547852, -7.985927581787109, -5.462643623352051, -2.939359664916992, -0.41606903076171875, 2.1072144508361816, 4.630497932434082, 7.153781414031982, 9.677064895629883, 12.200347900390625, 14.723631858825684, 17.246915817260742, 19.770198822021484, 22.293481826782227, 24.81676483154297, 27.340049743652344, 29.863332748413086, 32.38661575317383, 34.9099006652832, 37.43318176269531, 39.95646667480469, 42.47975158691406, 45.00303268432617, 47.52631759643555, 50.049598693847656, 52.57288360595703, 55.096168518066406, 57.61945343017578, 60.14273452758789, 62.666019439697266, 65.18930053710938, 67.71258544921875, 70.23587036132812, 72.7591552734375, 75.28243255615234, 77.80571746826172, 80.3290023803711]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 11.0, 10.0, 7.0, 19.0, 28.0, 18.0, 35.0, 44.0, 47.0, 55.0, 63.0, 74.0, 61.0, 69.0, 61.0, 60.0, 51.0, 51.0, 53.0, 37.0, 37.0, 25.0, 18.0, 13.0, 18.0, 11.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-57.13761901855469, -55.70052719116211, -54.26343536376953, -52.82634353637695, -51.389251708984375, -49.9521598815918, -48.51506805419922, -47.07797622680664, -45.64088439941406, -44.203792572021484, -42.766700744628906, -41.32960891723633, -39.89251708984375, -38.45542526245117, -37.018333435058594, -35.581241607666016, -34.14414978027344, -32.70705795288086, -31.26996612548828, -29.832874298095703, -28.395782470703125, -26.958690643310547, -25.52159881591797, -24.08450698852539, -22.647415161132812, -21.210323333740234, -19.773231506347656, -18.336139678955078, -16.8990478515625, -15.461956024169922, -14.024864196777344, -12.587772369384766, -11.150680541992188, -9.71358871459961, -8.276496887207031, -6.839405059814453, -5.402313232421875, -3.965221405029297, -2.5281295776367188, -1.0910377502441406, 0.3460540771484375, 1.7831459045410156, 3.2202377319335938, 4.657329559326172, 6.09442138671875, 7.531513214111328, 8.968605041503906, 10.405696868896484, 11.842788696289062, 13.27988052368164, 14.716972351074219, 16.154064178466797, 17.591156005859375, 19.028247833251953, 20.46533966064453, 21.90243148803711, 23.339523315429688, 24.776615142822266, 26.213706970214844, 27.650798797607422, 29.087890625, 30.524982452392578, 31.962074279785156, 33.399166107177734, 34.83625793457031]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 5.0, 11.0, 12.0, 15.0, 33.0, 32.0, 64.0, 78.0, 139.0, 226.0, 408.0, 813.0, 1567.0, 3395.0, 7340.0, 18487.0, 47728.0, 120080.0, 252779.0, 306068.0, 170344.0, 71385.0, 27563.0, 10951.0, 4665.0, 2077.0, 1055.0, 524.0, 269.0, 157.0, 104.0, 55.0, 37.0, 20.0, 14.0, 14.0, 10.0, 7.0, 9.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-20.71875, -20.1466064453125, -19.574462890625, -19.0023193359375, -18.43017578125, -17.8580322265625, -17.285888671875, -16.7137451171875, -16.1416015625, -15.5694580078125, -14.997314453125, -14.4251708984375, -13.85302734375, -13.2808837890625, -12.708740234375, -12.1365966796875, -11.564453125, -10.9923095703125, -10.420166015625, -9.8480224609375, -9.27587890625, -8.7037353515625, -8.131591796875, -7.5594482421875, -6.9873046875, -6.4151611328125, -5.843017578125, -5.2708740234375, -4.69873046875, -4.1265869140625, -3.554443359375, -2.9822998046875, -2.41015625, -1.8380126953125, -1.265869140625, -0.6937255859375, -0.12158203125, 0.4505615234375, 1.022705078125, 1.5948486328125, 2.1669921875, 2.7391357421875, 3.311279296875, 3.8834228515625, 4.45556640625, 5.0277099609375, 5.599853515625, 6.1719970703125, 6.744140625, 7.3162841796875, 7.888427734375, 8.4605712890625, 9.03271484375, 9.6048583984375, 10.177001953125, 10.7491455078125, 11.3212890625, 11.8934326171875, 12.465576171875, 13.0377197265625, 13.60986328125, 14.1820068359375, 14.754150390625, 15.3262939453125, 15.8984375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 0.0, 3.0, 9.0, 9.0, 12.0, 9.0, 19.0, 19.0, 17.0, 27.0, 22.0, 24.0, 30.0, 32.0, 38.0, 38.0, 53.0, 56.0, 46.0, 45.0, 42.0, 32.0, 42.0, 33.0, 42.0, 36.0, 42.0, 28.0, 38.0, 29.0, 23.0, 9.0, 20.0, 13.0, 18.0, 13.0, 5.0, 6.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.345703125, -2.2625732421875, -2.179443359375, -2.0963134765625, -2.01318359375, -1.9300537109375, -1.846923828125, -1.7637939453125, -1.6806640625, -1.5975341796875, -1.514404296875, -1.4312744140625, -1.34814453125, -1.2650146484375, -1.181884765625, -1.0987548828125, -1.015625, -0.9324951171875, -0.849365234375, -0.7662353515625, -0.68310546875, -0.5999755859375, -0.516845703125, -0.4337158203125, -0.3505859375, -0.2674560546875, -0.184326171875, -0.1011962890625, -0.01806640625, 0.0650634765625, 0.148193359375, 0.2313232421875, 0.314453125, 0.3975830078125, 0.480712890625, 0.5638427734375, 0.64697265625, 0.7301025390625, 0.813232421875, 0.8963623046875, 0.9794921875, 1.0626220703125, 1.145751953125, 1.2288818359375, 1.31201171875, 1.3951416015625, 1.478271484375, 1.5614013671875, 1.64453125, 1.7276611328125, 1.810791015625, 1.8939208984375, 1.97705078125, 2.0601806640625, 2.143310546875, 2.2264404296875, 2.3095703125, 2.3927001953125, 2.475830078125, 2.5589599609375, 2.64208984375, 2.7252197265625, 2.808349609375, 2.8914794921875, 2.974609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 11.0, 9.0, 8.0, 19.0, 27.0, 31.0, 44.0, 69.0, 75.0, 136.0, 172.0, 193.0, 304.0, 455.0, 631.0, 1106.0, 2261.0, 5325.0, 16657.0, 58467.0, 196333.0, 409294.0, 246134.0, 76359.0, 21660.0, 6691.0, 2625.0, 1192.0, 696.0, 453.0, 299.0, 231.0, 169.0, 119.0, 84.0, 69.0, 41.0, 32.0, 21.0, 17.0, 15.0, 5.0, 5.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.703125, -19.059326171875, -18.41552734375, -17.771728515625, -17.1279296875, -16.484130859375, -15.84033203125, -15.196533203125, -14.552734375, -13.908935546875, -13.26513671875, -12.621337890625, -11.9775390625, -11.333740234375, -10.68994140625, -10.046142578125, -9.40234375, -8.758544921875, -8.11474609375, -7.470947265625, -6.8271484375, -6.183349609375, -5.53955078125, -4.895751953125, -4.251953125, -3.608154296875, -2.96435546875, -2.320556640625, -1.6767578125, -1.032958984375, -0.38916015625, 0.254638671875, 0.8984375, 1.542236328125, 2.18603515625, 2.829833984375, 3.4736328125, 4.117431640625, 4.76123046875, 5.405029296875, 6.048828125, 6.692626953125, 7.33642578125, 7.980224609375, 8.6240234375, 9.267822265625, 9.91162109375, 10.555419921875, 11.19921875, 11.843017578125, 12.48681640625, 13.130615234375, 13.7744140625, 14.418212890625, 15.06201171875, 15.705810546875, 16.349609375, 16.993408203125, 17.63720703125, 18.281005859375, 18.9248046875, 19.568603515625, 20.21240234375, 20.856201171875, 21.5]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 6.0, 10.0, 11.0, 8.0, 11.0, 13.0, 19.0, 29.0, 19.0, 18.0, 42.0, 40.0, 28.0, 45.0, 40.0, 40.0, 40.0, 42.0, 46.0, 41.0, 55.0, 51.0, 50.0, 39.0, 32.0, 28.0, 27.0, 27.0, 18.0, 23.0, 16.0, 18.0, 14.0, 8.0, 6.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5, -12.0701904296875, -11.640380859375, -11.2105712890625, -10.78076171875, -10.3509521484375, -9.921142578125, -9.4913330078125, -9.0615234375, -8.6317138671875, -8.201904296875, -7.7720947265625, -7.34228515625, -6.9124755859375, -6.482666015625, -6.0528564453125, -5.623046875, -5.1932373046875, -4.763427734375, -4.3336181640625, -3.90380859375, -3.4739990234375, -3.044189453125, -2.6143798828125, -2.1845703125, -1.7547607421875, -1.324951171875, -0.8951416015625, -0.46533203125, -0.0355224609375, 0.394287109375, 0.8240966796875, 1.25390625, 1.6837158203125, 2.113525390625, 2.5433349609375, 2.97314453125, 3.4029541015625, 3.832763671875, 4.2625732421875, 4.6923828125, 5.1221923828125, 5.552001953125, 5.9818115234375, 6.41162109375, 6.8414306640625, 7.271240234375, 7.7010498046875, 8.130859375, 8.5606689453125, 8.990478515625, 9.4202880859375, 9.85009765625, 10.2799072265625, 10.709716796875, 11.1395263671875, 11.5693359375, 11.9991455078125, 12.428955078125, 12.8587646484375, 13.28857421875, 13.7183837890625, 14.148193359375, 14.5780029296875, 15.0078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 7.0, 7.0, 12.0, 11.0, 25.0, 37.0, 73.0, 93.0, 159.0, 329.0, 593.0, 1502.0, 4325.0, 17947.0, 172213.0, 725797.0, 106006.0, 13367.0, 3493.0, 1255.0, 577.0, 313.0, 173.0, 97.0, 58.0, 36.0, 19.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.4375, -21.618896484375, -20.80029296875, -19.981689453125, -19.1630859375, -18.344482421875, -17.52587890625, -16.707275390625, -15.888671875, -15.070068359375, -14.25146484375, -13.432861328125, -12.6142578125, -11.795654296875, -10.97705078125, -10.158447265625, -9.33984375, -8.521240234375, -7.70263671875, -6.884033203125, -6.0654296875, -5.246826171875, -4.42822265625, -3.609619140625, -2.791015625, -1.972412109375, -1.15380859375, -0.335205078125, 0.4833984375, 1.302001953125, 2.12060546875, 2.939208984375, 3.7578125, 4.576416015625, 5.39501953125, 6.213623046875, 7.0322265625, 7.850830078125, 8.66943359375, 9.488037109375, 10.306640625, 11.125244140625, 11.94384765625, 12.762451171875, 13.5810546875, 14.399658203125, 15.21826171875, 16.036865234375, 16.85546875, 17.674072265625, 18.49267578125, 19.311279296875, 20.1298828125, 20.948486328125, 21.76708984375, 22.585693359375, 23.404296875, 24.222900390625, 25.04150390625, 25.860107421875, 26.6787109375, 27.497314453125, 28.31591796875, 29.134521484375, 29.953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 9.0, 8.0, 9.0, 17.0, 17.0, 29.0, 25.0, 33.0, 42.0, 43.0, 84.0, 85.0, 95.0, 114.0, 82.0, 61.0, 46.0, 48.0, 32.0, 20.0, 25.0, 19.0, 11.0, 5.0, 1.0, 11.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014190673828125, -0.0013680458068847656, -0.0013170242309570312, -0.0012660026550292969, -0.0012149810791015625, -0.0011639595031738281, -0.0011129379272460938, -0.0010619163513183594, -0.001010894775390625, -0.0009598731994628906, -0.0009088516235351562, -0.0008578300476074219, -0.0008068084716796875, -0.0007557868957519531, -0.0007047653198242188, -0.0006537437438964844, -0.00060272216796875, -0.0005517005920410156, -0.0005006790161132812, -0.0004496574401855469, -0.0003986358642578125, -0.0003476142883300781, -0.00029659271240234375, -0.0002455711364746094, -0.000194549560546875, -0.00014352798461914062, -9.250640869140625e-05, -4.1484832763671875e-05, 9.5367431640625e-06, 6.0558319091796875e-05, 0.00011157989501953125, 0.00016260147094726562, 0.000213623046875, 0.0002646446228027344, 0.00031566619873046875, 0.0003666877746582031, 0.0004177093505859375, 0.0004687309265136719, 0.0005197525024414062, 0.0005707740783691406, 0.000621795654296875, 0.0006728172302246094, 0.0007238388061523438, 0.0007748603820800781, 0.0008258819580078125, 0.0008769035339355469, 0.0009279251098632812, 0.0009789466857910156, 0.00102996826171875, 0.0010809898376464844, 0.0011320114135742188, 0.0011830329895019531, 0.0012340545654296875, 0.0012850761413574219, 0.0013360977172851562, 0.0013871192932128906, 0.001438140869140625, 0.0014891624450683594, 0.0015401840209960938, 0.0015912055969238281, 0.0016422271728515625, 0.0016932487487792969, 0.0017442703247070312, 0.0017952919006347656, 0.0018463134765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 3.0, 5.0, 8.0, 6.0, 5.0, 16.0, 22.0, 32.0, 58.0, 103.0, 184.0, 378.0, 855.0, 2815.0, 14848.0, 222504.0, 751103.0, 46721.0, 6180.0, 1504.0, 600.0, 275.0, 125.0, 74.0, 52.0, 29.0, 16.0, 9.0, 8.0, 2.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-48.40625, -47.260498046875, -46.11474609375, -44.968994140625, -43.8232421875, -42.677490234375, -41.53173828125, -40.385986328125, -39.240234375, -38.094482421875, -36.94873046875, -35.802978515625, -34.6572265625, -33.511474609375, -32.36572265625, -31.219970703125, -30.07421875, -28.928466796875, -27.78271484375, -26.636962890625, -25.4912109375, -24.345458984375, -23.19970703125, -22.053955078125, -20.908203125, -19.762451171875, -18.61669921875, -17.470947265625, -16.3251953125, -15.179443359375, -14.03369140625, -12.887939453125, -11.7421875, -10.596435546875, -9.45068359375, -8.304931640625, -7.1591796875, -6.013427734375, -4.86767578125, -3.721923828125, -2.576171875, -1.430419921875, -0.28466796875, 0.861083984375, 2.0068359375, 3.152587890625, 4.29833984375, 5.444091796875, 6.58984375, 7.735595703125, 8.88134765625, 10.027099609375, 11.1728515625, 12.318603515625, 13.46435546875, 14.610107421875, 15.755859375, 16.901611328125, 18.04736328125, 19.193115234375, 20.3388671875, 21.484619140625, 22.63037109375, 23.776123046875, 24.921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 12.0, 11.0, 11.0, 12.0, 33.0, 43.0, 61.0, 75.0, 81.0, 113.0, 101.0, 105.0, 91.0, 62.0, 53.0, 37.0, 20.0, 18.0, 17.0, 15.0, 5.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -8.874267578125, -8.43603515625, -7.997802734375, -7.5595703125, -7.121337890625, -6.68310546875, -6.244873046875, -5.806640625, -5.368408203125, -4.93017578125, -4.491943359375, -4.0537109375, -3.615478515625, -3.17724609375, -2.739013671875, -2.30078125, -1.862548828125, -1.42431640625, -0.986083984375, -0.5478515625, -0.109619140625, 0.32861328125, 0.766845703125, 1.205078125, 1.643310546875, 2.08154296875, 2.519775390625, 2.9580078125, 3.396240234375, 3.83447265625, 4.272705078125, 4.7109375, 5.149169921875, 5.58740234375, 6.025634765625, 6.4638671875, 6.902099609375, 7.34033203125, 7.778564453125, 8.216796875, 8.655029296875, 9.09326171875, 9.531494140625, 9.9697265625, 10.407958984375, 10.84619140625, 11.284423828125, 11.72265625, 12.160888671875, 12.59912109375, 13.037353515625, 13.4755859375, 13.913818359375, 14.35205078125, 14.790283203125, 15.228515625, 15.666748046875, 16.10498046875, 16.543212890625, 16.9814453125, 17.419677734375, 17.85791015625, 18.296142578125, 18.734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 11.0, 22.0, 32.0, 64.0, 99.0, 142.0, 158.0, 159.0, 120.0, 84.0, 47.0, 30.0, 17.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.94647216796875, -160.3875274658203, -154.82859802246094, -149.2696533203125, -143.71072387695312, -138.1517791748047, -132.59283447265625, -127.03389739990234, -121.47496032714844, -115.91602325439453, -110.35708618164062, -104.79814147949219, -99.23920440673828, -93.68026733398438, -88.12132263183594, -82.56238555908203, -77.00344848632812, -71.44451141357422, -65.88557434082031, -60.326629638671875, -54.76769256591797, -49.20875549316406, -43.64981460571289, -38.09087371826172, -32.53193664550781, -26.972997665405273, -21.414058685302734, -15.855119705200195, -10.296180725097656, -4.737241744995117, 0.8216972351074219, 6.380638122558594, 11.9395751953125, 17.49851417541504, 23.057453155517578, 28.616392135620117, 34.175331115722656, 39.73426818847656, 45.293209075927734, 50.852149963378906, 56.41108703613281, 61.97002410888672, 67.52896118164062, 73.08790588378906, 78.64684295654297, 84.20578002929688, 89.76472473144531, 95.32366180419922, 100.88259887695312, 106.44153594970703, 112.00047302246094, 117.55941772460938, 123.11835479736328, 128.6772918701172, 134.23623657226562, 139.795166015625, 145.35411071777344, 150.91305541992188, 156.47198486328125, 162.0309295654297, 167.58987426757812, 173.1488037109375, 178.70774841308594, 184.26669311523438, 189.82562255859375]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 7.0, 4.0, 9.0, 9.0, 11.0, 17.0, 18.0, 27.0, 35.0, 30.0, 27.0, 45.0, 38.0, 41.0, 34.0, 38.0, 52.0, 44.0, 41.0, 53.0, 51.0, 40.0, 40.0, 38.0, 45.0, 22.0, 20.0, 28.0, 31.0, 17.0, 14.0, 11.0, 13.0, 5.0, 7.0, 4.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.92521667480469, -88.2435302734375, -85.56185150146484, -82.88017272949219, -80.198486328125, -77.51679992675781, -74.83512115478516, -72.1534423828125, -69.47175598144531, -66.79006958007812, -64.10839080810547, -61.42670822143555, -58.745025634765625, -56.0633430480957, -53.38166046142578, -50.69997787475586, -48.01829528808594, -45.336612701416016, -42.654930114746094, -39.97324752807617, -37.29156494140625, -34.60988235473633, -31.928199768066406, -29.246517181396484, -26.564834594726562, -23.88315200805664, -21.20146942138672, -18.519786834716797, -15.838104248046875, -13.156421661376953, -10.474739074707031, -7.793056488037109, -5.111366271972656, -2.4296836853027344, 0.2519989013671875, 2.9336814880371094, 5.615364074707031, 8.297046661376953, 10.978729248046875, 13.660411834716797, 16.34209442138672, 19.02377700805664, 21.705459594726562, 24.387142181396484, 27.068824768066406, 29.750507354736328, 32.43218994140625, 35.11387252807617, 37.795555114746094, 40.477237701416016, 43.15892028808594, 45.84060287475586, 48.52228546142578, 51.2039680480957, 53.885650634765625, 56.56733322143555, 59.24901580810547, 61.93069839477539, 64.61238098144531, 67.2940673828125, 69.97574615478516, 72.65742492675781, 75.339111328125, 78.02079772949219, 80.70247650146484]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 10.0, 15.0, 20.0, 32.0, 67.0, 103.0, 200.0, 504.0, 1018.0, 2261.0, 5891.0, 17608.0, 70589.0, 730587.0, 3214596.0, 111527.0, 25110.0, 8064.0, 3359.0, 1385.0, 665.0, 330.0, 159.0, 77.0, 44.0, 22.0, 15.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.03125, -38.033935546875, -37.03662109375, -36.039306640625, -35.0419921875, -34.044677734375, -33.04736328125, -32.050048828125, -31.052734375, -30.055419921875, -29.05810546875, -28.060791015625, -27.0634765625, -26.066162109375, -25.06884765625, -24.071533203125, -23.07421875, -22.076904296875, -21.07958984375, -20.082275390625, -19.0849609375, -18.087646484375, -17.09033203125, -16.093017578125, -15.095703125, -14.098388671875, -13.10107421875, -12.103759765625, -11.1064453125, -10.109130859375, -9.11181640625, -8.114501953125, -7.1171875, -6.119873046875, -5.12255859375, -4.125244140625, -3.1279296875, -2.130615234375, -1.13330078125, -0.135986328125, 0.861328125, 1.858642578125, 2.85595703125, 3.853271484375, 4.8505859375, 5.847900390625, 6.84521484375, 7.842529296875, 8.83984375, 9.837158203125, 10.83447265625, 11.831787109375, 12.8291015625, 13.826416015625, 14.82373046875, 15.821044921875, 16.818359375, 17.815673828125, 18.81298828125, 19.810302734375, 20.8076171875, 21.804931640625, 22.80224609375, 23.799560546875, 24.796875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 10.0, 4.0, 15.0, 16.0, 25.0, 31.0, 28.0, 36.0, 31.0, 44.0, 51.0, 46.0, 60.0, 42.0, 47.0, 48.0, 58.0, 55.0, 46.0, 42.0, 35.0, 43.0, 26.0, 26.0, 27.0, 20.0, 13.0, 9.0, 10.0, 13.0, 4.0, 8.0, 8.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.177734375, -3.081695556640625, -2.98565673828125, -2.889617919921875, -2.7935791015625, -2.697540283203125, -2.60150146484375, -2.505462646484375, -2.409423828125, -2.313385009765625, -2.21734619140625, -2.121307373046875, -2.0252685546875, -1.929229736328125, -1.83319091796875, -1.737152099609375, -1.64111328125, -1.545074462890625, -1.44903564453125, -1.352996826171875, -1.2569580078125, -1.160919189453125, -1.06488037109375, -0.968841552734375, -0.872802734375, -0.776763916015625, -0.68072509765625, -0.584686279296875, -0.4886474609375, -0.392608642578125, -0.29656982421875, -0.200531005859375, -0.1044921875, -0.008453369140625, 0.08758544921875, 0.183624267578125, 0.2796630859375, 0.375701904296875, 0.47174072265625, 0.567779541015625, 0.663818359375, 0.759857177734375, 0.85589599609375, 0.951934814453125, 1.0479736328125, 1.144012451171875, 1.24005126953125, 1.336090087890625, 1.43212890625, 1.528167724609375, 1.62420654296875, 1.720245361328125, 1.8162841796875, 1.912322998046875, 2.00836181640625, 2.104400634765625, 2.200439453125, 2.296478271484375, 2.39251708984375, 2.488555908203125, 2.5845947265625, 2.680633544921875, 2.77667236328125, 2.872711181640625, 2.96875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 6.0, 2.0, 6.0, 10.0, 8.0, 12.0, 15.0, 15.0, 26.0, 33.0, 55.0, 86.0, 132.0, 215.0, 365.0, 592.0, 1204.0, 2277.0, 4653.0, 10766.0, 27214.0, 77887.0, 277390.0, 2438005.0, 1068519.0, 190012.0, 57828.0, 20613.0, 8569.0, 3807.0, 1781.0, 940.0, 501.0, 319.0, 150.0, 92.0, 65.0, 38.0, 27.0, 20.0, 16.0, 4.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.171875, -15.591552734375, -15.01123046875, -14.430908203125, -13.8505859375, -13.270263671875, -12.68994140625, -12.109619140625, -11.529296875, -10.948974609375, -10.36865234375, -9.788330078125, -9.2080078125, -8.627685546875, -8.04736328125, -7.467041015625, -6.88671875, -6.306396484375, -5.72607421875, -5.145751953125, -4.5654296875, -3.985107421875, -3.40478515625, -2.824462890625, -2.244140625, -1.663818359375, -1.08349609375, -0.503173828125, 0.0771484375, 0.657470703125, 1.23779296875, 1.818115234375, 2.3984375, 2.978759765625, 3.55908203125, 4.139404296875, 4.7197265625, 5.300048828125, 5.88037109375, 6.460693359375, 7.041015625, 7.621337890625, 8.20166015625, 8.781982421875, 9.3623046875, 9.942626953125, 10.52294921875, 11.103271484375, 11.68359375, 12.263916015625, 12.84423828125, 13.424560546875, 14.0048828125, 14.585205078125, 15.16552734375, 15.745849609375, 16.326171875, 16.906494140625, 17.48681640625, 18.067138671875, 18.6474609375, 19.227783203125, 19.80810546875, 20.388427734375, 20.96875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 5.0, 11.0, 3.0, 11.0, 12.0, 17.0, 27.0, 47.0, 70.0, 75.0, 86.0, 110.0, 162.0, 274.0, 438.0, 1137.0, 580.0, 307.0, 185.0, 129.0, 81.0, 80.0, 58.0, 40.0, 28.0, 19.0, 19.0, 10.0, 13.0, 6.0, 7.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.4921875, -5.32904052734375, -5.1658935546875, -5.00274658203125, -4.839599609375, -4.67645263671875, -4.5133056640625, -4.35015869140625, -4.18701171875, -4.02386474609375, -3.8607177734375, -3.69757080078125, -3.534423828125, -3.37127685546875, -3.2081298828125, -3.04498291015625, -2.8818359375, -2.71868896484375, -2.5555419921875, -2.39239501953125, -2.229248046875, -2.06610107421875, -1.9029541015625, -1.73980712890625, -1.57666015625, -1.41351318359375, -1.2503662109375, -1.08721923828125, -0.924072265625, -0.76092529296875, -0.5977783203125, -0.43463134765625, -0.271484375, -0.10833740234375, 0.0548095703125, 0.21795654296875, 0.381103515625, 0.54425048828125, 0.7073974609375, 0.87054443359375, 1.03369140625, 1.19683837890625, 1.3599853515625, 1.52313232421875, 1.686279296875, 1.84942626953125, 2.0125732421875, 2.17572021484375, 2.3388671875, 2.50201416015625, 2.6651611328125, 2.82830810546875, 2.991455078125, 3.15460205078125, 3.3177490234375, 3.48089599609375, 3.64404296875, 3.80718994140625, 3.9703369140625, 4.13348388671875, 4.296630859375, 4.45977783203125, 4.6229248046875, 4.78607177734375, 4.94921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 9.0, 21.0, 30.0, 48.0, 100.0, 111.0, 145.0, 165.0, 158.0, 84.0, 59.0, 34.0, 21.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-92.56082153320312, -90.71758270263672, -88.87434387207031, -87.03111267089844, -85.18787384033203, -83.34463500976562, -81.50139617919922, -79.65815734863281, -77.8149185180664, -75.9716796875, -74.1284408569336, -72.28520202636719, -70.44197082519531, -68.5987319946289, -66.7554931640625, -64.9122543334961, -63.06901931762695, -61.22578048706055, -59.382545471191406, -57.539306640625, -55.696067810058594, -53.85282897949219, -52.00959396362305, -50.16635513305664, -48.3231201171875, -46.479881286621094, -44.63664627075195, -42.79340744018555, -40.95016860961914, -39.10693359375, -37.263694763183594, -35.42045593261719, -33.57721710205078, -31.733980178833008, -29.8907413482666, -28.047504425048828, -26.204265594482422, -24.36102867126465, -22.517791748046875, -20.67455291748047, -18.831315994262695, -16.988079071044922, -15.144840240478516, -13.301603317260742, -11.458365440368652, -9.615127563476562, -7.771890640258789, -5.928652763366699, -4.085414886474609, -2.2421772480010986, -0.3989396095275879, 1.4442977905273438, 3.2875356674194336, 5.130773544311523, 6.974010467529297, 8.817248344421387, 10.660486221313477, 12.503724098205566, 14.346961975097656, 16.19019889831543, 18.033435821533203, 19.87667465209961, 21.719911575317383, 23.563148498535156, 25.406387329101562]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 5.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 13.0, 17.0, 14.0, 16.0, 11.0, 23.0, 28.0, 29.0, 28.0, 35.0, 35.0, 29.0, 37.0, 54.0, 38.0, 43.0, 43.0, 46.0, 38.0, 36.0, 32.0, 40.0, 40.0, 48.0, 32.0, 26.0, 39.0, 20.0, 12.0, 16.0, 11.0, 8.0, 4.0, 11.0, 8.0, 5.0, 7.0, 4.0, 0.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.20660400390625, -21.53872299194336, -20.870840072631836, -20.202959060668945, -19.535078048706055, -18.86719512939453, -18.19931411743164, -17.53143310546875, -16.863550186157227, -16.195669174194336, -15.527787208557129, -14.859905242919922, -14.192023277282715, -13.524141311645508, -12.856260299682617, -12.18837833404541, -11.52049732208252, -10.852615356445312, -10.184734344482422, -9.516852378845215, -8.848970413208008, -8.181089401245117, -7.51320743560791, -6.845325469970703, -6.177443981170654, -5.5095624923706055, -4.841680526733398, -4.17379903793335, -3.5059173107147217, -2.8380355834960938, -2.170154094696045, -1.502272129058838, -0.8343906402587891, -0.1665089726448059, 0.5013726949691772, 1.1692543029785156, 1.8371360301971436, 2.5050177574157715, 3.1728992462158203, 3.8407812118530273, 4.508662700653076, 5.176544189453125, 5.844426155090332, 6.512307643890381, 7.18018913269043, 7.848071098327637, 8.515953063964844, 9.183834075927734, 9.851716041564941, 10.519598007202148, 11.187479019165039, 11.855360984802246, 12.523242950439453, 13.191123962402344, 13.85900592803955, 14.526887893676758, 15.194768905639648, 15.862650871276855, 16.530532836914062, 17.198413848876953, 17.866294860839844, 18.534177780151367, 19.202058792114258, 19.86994171142578, 20.537822723388672]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 12.0, 19.0, 26.0, 33.0, 52.0, 109.0, 151.0, 276.0, 467.0, 844.0, 1494.0, 2945.0, 5712.0, 12337.0, 27901.0, 63312.0, 138802.0, 252186.0, 261544.0, 152215.0, 70477.0, 30570.0, 13598.0, 6409.0, 3223.0, 1620.0, 880.0, 507.0, 317.0, 171.0, 132.0, 73.0, 40.0, 25.0, 18.0, 23.0, 3.0, 6.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-16.40625, -15.9752197265625, -15.544189453125, -15.1131591796875, -14.68212890625, -14.2510986328125, -13.820068359375, -13.3890380859375, -12.9580078125, -12.5269775390625, -12.095947265625, -11.6649169921875, -11.23388671875, -10.8028564453125, -10.371826171875, -9.9407958984375, -9.509765625, -9.0787353515625, -8.647705078125, -8.2166748046875, -7.78564453125, -7.3546142578125, -6.923583984375, -6.4925537109375, -6.0615234375, -5.6304931640625, -5.199462890625, -4.7684326171875, -4.33740234375, -3.9063720703125, -3.475341796875, -3.0443115234375, -2.61328125, -2.1822509765625, -1.751220703125, -1.3201904296875, -0.88916015625, -0.4581298828125, -0.027099609375, 0.4039306640625, 0.8349609375, 1.2659912109375, 1.697021484375, 2.1280517578125, 2.55908203125, 2.9901123046875, 3.421142578125, 3.8521728515625, 4.283203125, 4.7142333984375, 5.145263671875, 5.5762939453125, 6.00732421875, 6.4383544921875, 6.869384765625, 7.3004150390625, 7.7314453125, 8.1624755859375, 8.593505859375, 9.0245361328125, 9.45556640625, 9.8865966796875, 10.317626953125, 10.7486572265625, 11.1796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 6.0, 7.0, 7.0, 16.0, 13.0, 20.0, 33.0, 25.0, 24.0, 31.0, 35.0, 46.0, 39.0, 48.0, 59.0, 48.0, 47.0, 53.0, 51.0, 38.0, 46.0, 45.0, 37.0, 35.0, 30.0, 26.0, 20.0, 15.0, 17.0, 18.0, 21.0, 8.0, 8.0, 2.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.62109375, -2.52734375, -2.43359375, -2.33984375, -2.24609375, -2.15234375, -2.05859375, -1.96484375, -1.87109375, -1.77734375, -1.68359375, -1.58984375, -1.49609375, -1.40234375, -1.30859375, -1.21484375, -1.12109375, -1.02734375, -0.93359375, -0.83984375, -0.74609375, -0.65234375, -0.55859375, -0.46484375, -0.37109375, -0.27734375, -0.18359375, -0.08984375, 0.00390625, 0.09765625, 0.19140625, 0.28515625, 0.37890625, 0.47265625, 0.56640625, 0.66015625, 0.75390625, 0.84765625, 0.94140625, 1.03515625, 1.12890625, 1.22265625, 1.31640625, 1.41015625, 1.50390625, 1.59765625, 1.69140625, 1.78515625, 1.87890625, 1.97265625, 2.06640625, 2.16015625, 2.25390625, 2.34765625, 2.44140625, 2.53515625, 2.62890625, 2.72265625, 2.81640625, 2.91015625, 3.00390625, 3.09765625, 3.19140625, 3.28515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 11.0, 7.0, 17.0, 11.0, 16.0, 36.0, 40.0, 60.0, 76.0, 118.0, 131.0, 181.0, 247.0, 351.0, 517.0, 817.0, 1472.0, 3274.0, 8241.0, 24338.0, 79119.0, 240144.0, 387550.0, 202691.0, 65343.0, 20237.0, 6950.0, 2751.0, 1350.0, 754.0, 484.0, 328.0, 227.0, 165.0, 134.0, 103.0, 62.0, 52.0, 40.0, 26.0, 17.0, 19.0, 12.0, 10.0, 5.0, 11.0, 2.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.03125, -16.505859375, -15.98046875, -15.455078125, -14.9296875, -14.404296875, -13.87890625, -13.353515625, -12.828125, -12.302734375, -11.77734375, -11.251953125, -10.7265625, -10.201171875, -9.67578125, -9.150390625, -8.625, -8.099609375, -7.57421875, -7.048828125, -6.5234375, -5.998046875, -5.47265625, -4.947265625, -4.421875, -3.896484375, -3.37109375, -2.845703125, -2.3203125, -1.794921875, -1.26953125, -0.744140625, -0.21875, 0.306640625, 0.83203125, 1.357421875, 1.8828125, 2.408203125, 2.93359375, 3.458984375, 3.984375, 4.509765625, 5.03515625, 5.560546875, 6.0859375, 6.611328125, 7.13671875, 7.662109375, 8.1875, 8.712890625, 9.23828125, 9.763671875, 10.2890625, 10.814453125, 11.33984375, 11.865234375, 12.390625, 12.916015625, 13.44140625, 13.966796875, 14.4921875, 15.017578125, 15.54296875, 16.068359375, 16.59375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 9.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 9.0, 21.0, 11.0, 18.0, 13.0, 26.0, 23.0, 19.0, 27.0, 24.0, 30.0, 46.0, 39.0, 32.0, 43.0, 36.0, 32.0, 44.0, 38.0, 33.0, 54.0, 39.0, 36.0, 39.0, 26.0, 32.0, 26.0, 33.0, 24.0, 14.0, 15.0, 13.0, 14.0, 13.0, 9.0, 9.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.6328125, -13.2420654296875, -12.851318359375, -12.4605712890625, -12.06982421875, -11.6790771484375, -11.288330078125, -10.8975830078125, -10.5068359375, -10.1160888671875, -9.725341796875, -9.3345947265625, -8.94384765625, -8.5531005859375, -8.162353515625, -7.7716064453125, -7.380859375, -6.9901123046875, -6.599365234375, -6.2086181640625, -5.81787109375, -5.4271240234375, -5.036376953125, -4.6456298828125, -4.2548828125, -3.8641357421875, -3.473388671875, -3.0826416015625, -2.69189453125, -2.3011474609375, -1.910400390625, -1.5196533203125, -1.12890625, -0.7381591796875, -0.347412109375, 0.0433349609375, 0.43408203125, 0.8248291015625, 1.215576171875, 1.6063232421875, 1.9970703125, 2.3878173828125, 2.778564453125, 3.1693115234375, 3.56005859375, 3.9508056640625, 4.341552734375, 4.7322998046875, 5.123046875, 5.5137939453125, 5.904541015625, 6.2952880859375, 6.68603515625, 7.0767822265625, 7.467529296875, 7.8582763671875, 8.2490234375, 8.6397705078125, 9.030517578125, 9.4212646484375, 9.81201171875, 10.2027587890625, 10.593505859375, 10.9842529296875, 11.375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 5.0, 3.0, 8.0, 16.0, 11.0, 11.0, 34.0, 47.0, 63.0, 84.0, 147.0, 229.0, 408.0, 704.0, 1397.0, 2943.0, 6942.0, 19973.0, 75340.0, 313443.0, 443586.0, 132638.0, 32367.0, 10162.0, 4029.0, 1762.0, 929.0, 494.0, 279.0, 169.0, 95.0, 66.0, 59.0, 37.0, 23.0, 18.0, 8.0, 10.0, 6.0, 2.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5, -10.173828125, -9.84765625, -9.521484375, -9.1953125, -8.869140625, -8.54296875, -8.216796875, -7.890625, -7.564453125, -7.23828125, -6.912109375, -6.5859375, -6.259765625, -5.93359375, -5.607421875, -5.28125, -4.955078125, -4.62890625, -4.302734375, -3.9765625, -3.650390625, -3.32421875, -2.998046875, -2.671875, -2.345703125, -2.01953125, -1.693359375, -1.3671875, -1.041015625, -0.71484375, -0.388671875, -0.0625, 0.263671875, 0.58984375, 0.916015625, 1.2421875, 1.568359375, 1.89453125, 2.220703125, 2.546875, 2.873046875, 3.19921875, 3.525390625, 3.8515625, 4.177734375, 4.50390625, 4.830078125, 5.15625, 5.482421875, 5.80859375, 6.134765625, 6.4609375, 6.787109375, 7.11328125, 7.439453125, 7.765625, 8.091796875, 8.41796875, 8.744140625, 9.0703125, 9.396484375, 9.72265625, 10.048828125, 10.375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 2.0, 11.0, 13.0, 14.0, 26.0, 32.0, 64.0, 90.0, 101.0, 145.0, 161.0, 106.0, 83.0, 47.0, 39.0, 24.0, 7.0, 7.0, 8.0, 6.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002864837646484375, -0.002793237566947937, -0.002721637487411499, -0.002650037407875061, -0.002578437328338623, -0.002506837248802185, -0.002435237169265747, -0.002363637089729309, -0.002292037010192871, -0.002220436930656433, -0.002148836851119995, -0.002077236771583557, -0.002005636692047119, -0.0019340366125106812, -0.0018624365329742432, -0.0017908364534378052, -0.0017192363739013672, -0.0016476362943649292, -0.0015760362148284912, -0.0015044361352920532, -0.0014328360557556152, -0.0013612359762191772, -0.0012896358966827393, -0.0012180358171463013, -0.0011464357376098633, -0.0010748356580734253, -0.0010032355785369873, -0.0009316354990005493, -0.0008600354194641113, -0.0007884353399276733, -0.0007168352603912354, -0.0006452351808547974, -0.0005736351013183594, -0.0005020350217819214, -0.0004304349422454834, -0.0003588348627090454, -0.0002872347831726074, -0.00021563470363616943, -0.00014403462409973145, -7.243454456329346e-05, -8.344650268554688e-07, 7.076561450958252e-05, 0.0001423656940460205, 0.0002139657735824585, 0.0002855658531188965, 0.00035716593265533447, 0.00042876601219177246, 0.0005003660917282104, 0.0005719661712646484, 0.0006435662508010864, 0.0007151663303375244, 0.0007867664098739624, 0.0008583664894104004, 0.0009299665689468384, 0.0010015666484832764, 0.0010731667280197144, 0.0011447668075561523, 0.0012163668870925903, 0.0012879669666290283, 0.0013595670461654663, 0.0014311671257019043, 0.0015027672052383423, 0.0015743672847747803, 0.0016459673643112183, 0.0017175674438476562]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 14.0, 12.0, 9.0, 20.0, 31.0, 50.0, 58.0, 100.0, 160.0, 266.0, 464.0, 880.0, 2031.0, 4737.0, 14952.0, 68718.0, 385709.0, 454937.0, 87472.0, 18147.0, 5442.0, 2087.0, 1001.0, 487.0, 246.0, 176.0, 90.0, 73.0, 45.0, 40.0, 23.0, 21.0, 11.0, 6.0, 5.0, 5.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.59375, -12.1749267578125, -11.756103515625, -11.3372802734375, -10.91845703125, -10.4996337890625, -10.080810546875, -9.6619873046875, -9.2431640625, -8.8243408203125, -8.405517578125, -7.9866943359375, -7.56787109375, -7.1490478515625, -6.730224609375, -6.3114013671875, -5.892578125, -5.4737548828125, -5.054931640625, -4.6361083984375, -4.21728515625, -3.7984619140625, -3.379638671875, -2.9608154296875, -2.5419921875, -2.1231689453125, -1.704345703125, -1.2855224609375, -0.86669921875, -0.4478759765625, -0.029052734375, 0.3897705078125, 0.80859375, 1.2274169921875, 1.646240234375, 2.0650634765625, 2.48388671875, 2.9027099609375, 3.321533203125, 3.7403564453125, 4.1591796875, 4.5780029296875, 4.996826171875, 5.4156494140625, 5.83447265625, 6.2532958984375, 6.672119140625, 7.0909423828125, 7.509765625, 7.9285888671875, 8.347412109375, 8.7662353515625, 9.18505859375, 9.6038818359375, 10.022705078125, 10.4415283203125, 10.8603515625, 11.2791748046875, 11.697998046875, 12.1168212890625, 12.53564453125, 12.9544677734375, 13.373291015625, 13.7921142578125, 14.2109375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 9.0, 2.0, 5.0, 5.0, 10.0, 7.0, 14.0, 13.0, 17.0, 15.0, 24.0, 29.0, 31.0, 34.0, 44.0, 49.0, 56.0, 84.0, 67.0, 66.0, 71.0, 64.0, 49.0, 33.0, 34.0, 30.0, 25.0, 22.0, 17.0, 12.0, 8.0, 12.0, 9.0, 7.0, 5.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-7.01953125, -6.838134765625, -6.65673828125, -6.475341796875, -6.2939453125, -6.112548828125, -5.93115234375, -5.749755859375, -5.568359375, -5.386962890625, -5.20556640625, -5.024169921875, -4.8427734375, -4.661376953125, -4.47998046875, -4.298583984375, -4.1171875, -3.935791015625, -3.75439453125, -3.572998046875, -3.3916015625, -3.210205078125, -3.02880859375, -2.847412109375, -2.666015625, -2.484619140625, -2.30322265625, -2.121826171875, -1.9404296875, -1.759033203125, -1.57763671875, -1.396240234375, -1.21484375, -1.033447265625, -0.85205078125, -0.670654296875, -0.4892578125, -0.307861328125, -0.12646484375, 0.054931640625, 0.236328125, 0.417724609375, 0.59912109375, 0.780517578125, 0.9619140625, 1.143310546875, 1.32470703125, 1.506103515625, 1.6875, 1.868896484375, 2.05029296875, 2.231689453125, 2.4130859375, 2.594482421875, 2.77587890625, 2.957275390625, 3.138671875, 3.320068359375, 3.50146484375, 3.682861328125, 3.8642578125, 4.045654296875, 4.22705078125, 4.408447265625, 4.58984375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 23.0, 28.0, 74.0, 109.0, 181.0, 190.0, 167.0, 121.0, 67.0, 17.0, 8.0, 8.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-231.29701232910156, -225.31338500976562, -219.32974243164062, -213.34609985351562, -207.3624725341797, -201.37884521484375, -195.39520263671875, -189.41156005859375, -183.4279327392578, -177.44430541992188, -171.46066284179688, -165.47702026367188, -159.49339294433594, -153.509765625, -147.526123046875, -141.54248046875, -135.55885314941406, -129.57522583007812, -123.59158325195312, -117.60794830322266, -111.62431335449219, -105.64067840576172, -99.65704345703125, -93.67340850830078, -87.68977355957031, -81.70613861083984, -75.72250366210938, -69.7388687133789, -63.75523376464844, -57.77159881591797, -51.7879638671875, -45.80432891845703, -39.8206787109375, -33.83704376220703, -27.853408813476562, -21.869773864746094, -15.886138916015625, -9.902503967285156, -3.9188690185546875, 2.0647659301757812, 8.04840087890625, 14.032035827636719, 20.015670776367188, 25.999305725097656, 31.982940673828125, 37.966575622558594, 43.95021057128906, 49.93384552001953, 55.91748046875, 61.90111541748047, 67.88475036621094, 73.8683853149414, 79.85202026367188, 85.83565521240234, 91.81929016113281, 97.80292510986328, 103.78656005859375, 109.77019500732422, 115.75382995605469, 121.73746490478516, 127.72109985351562, 133.70474243164062, 139.68836975097656, 145.6719970703125, 151.6556396484375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 8.0, 8.0, 8.0, 11.0, 20.0, 23.0, 23.0, 32.0, 28.0, 36.0, 51.0, 52.0, 49.0, 41.0, 54.0, 46.0, 54.0, 56.0, 52.0, 47.0, 43.0, 31.0, 37.0, 30.0, 29.0, 24.0, 23.0, 20.0, 12.0, 12.0, 13.0, 5.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.86239624023438, -75.18463897705078, -72.50687408447266, -69.82911682128906, -67.15135955810547, -64.47359466552734, -61.79583740234375, -59.11807632446289, -56.44031524658203, -53.76255416870117, -51.08479690551758, -48.40703582763672, -45.72927474975586, -43.051513671875, -40.373756408691406, -37.69599533081055, -35.01823806762695, -32.340476989746094, -29.662717819213867, -26.98495864868164, -24.30719757080078, -21.629438400268555, -18.951679229736328, -16.27391815185547, -13.596158981323242, -10.9183988571167, -8.240638732910156, -5.56287956237793, -2.8851194381713867, -0.20735931396484375, 2.470399856567383, 5.148160934448242, 7.825920104980469, 10.503680229187012, 13.181440353393555, 15.859199523925781, 18.53696060180664, 21.214719772338867, 23.892478942871094, 26.570240020751953, 29.24799919128418, 31.925758361816406, 34.603519439697266, 37.281280517578125, 39.95903778076172, 42.63679885864258, 45.31455993652344, 47.99231719970703, 50.67007827758789, 53.34783935546875, 56.025596618652344, 58.7033576965332, 61.38111877441406, 64.05887603759766, 66.73663330078125, 69.41439819335938, 72.09215545654297, 74.76991271972656, 77.44767761230469, 80.12543487548828, 82.80319213867188, 85.48095703125, 88.1587142944336, 90.83647155761719, 93.51423645019531]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 11.0, 11.0, 14.0, 24.0, 42.0, 58.0, 86.0, 118.0, 232.0, 326.0, 559.0, 988.0, 1790.0, 3384.0, 6574.0, 13549.0, 31488.0, 83918.0, 296046.0, 2758383.0, 750726.0, 152539.0, 51578.0, 20496.0, 9777.0, 4941.0, 2696.0, 1533.0, 854.0, 528.0, 352.0, 211.0, 147.0, 79.0, 63.0, 48.0, 34.0, 23.0, 14.0, 12.0, 8.0, 9.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-17.0625, -16.55712890625, -16.0517578125, -15.54638671875, -15.041015625, -14.53564453125, -14.0302734375, -13.52490234375, -13.01953125, -12.51416015625, -12.0087890625, -11.50341796875, -10.998046875, -10.49267578125, -9.9873046875, -9.48193359375, -8.9765625, -8.47119140625, -7.9658203125, -7.46044921875, -6.955078125, -6.44970703125, -5.9443359375, -5.43896484375, -4.93359375, -4.42822265625, -3.9228515625, -3.41748046875, -2.912109375, -2.40673828125, -1.9013671875, -1.39599609375, -0.890625, -0.38525390625, 0.1201171875, 0.62548828125, 1.130859375, 1.63623046875, 2.1416015625, 2.64697265625, 3.15234375, 3.65771484375, 4.1630859375, 4.66845703125, 5.173828125, 5.67919921875, 6.1845703125, 6.68994140625, 7.1953125, 7.70068359375, 8.2060546875, 8.71142578125, 9.216796875, 9.72216796875, 10.2275390625, 10.73291015625, 11.23828125, 11.74365234375, 12.2490234375, 12.75439453125, 13.259765625, 13.76513671875, 14.2705078125, 14.77587890625, 15.28125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 2.0, 6.0, 5.0, 6.0, 15.0, 21.0, 18.0, 17.0, 31.0, 27.0, 43.0, 36.0, 43.0, 52.0, 34.0, 47.0, 82.0, 53.0, 65.0, 52.0, 57.0, 37.0, 34.0, 29.0, 30.0, 22.0, 20.0, 32.0, 16.0, 15.0, 15.0, 6.0, 10.0, 12.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.882720947265625, -2.78497314453125, -2.687225341796875, -2.5894775390625, -2.491729736328125, -2.39398193359375, -2.296234130859375, -2.198486328125, -2.100738525390625, -2.00299072265625, -1.905242919921875, -1.8074951171875, -1.709747314453125, -1.61199951171875, -1.514251708984375, -1.41650390625, -1.318756103515625, -1.22100830078125, -1.123260498046875, -1.0255126953125, -0.927764892578125, -0.83001708984375, -0.732269287109375, -0.634521484375, -0.536773681640625, -0.43902587890625, -0.341278076171875, -0.2435302734375, -0.145782470703125, -0.04803466796875, 0.049713134765625, 0.1474609375, 0.245208740234375, 0.34295654296875, 0.440704345703125, 0.5384521484375, 0.636199951171875, 0.73394775390625, 0.831695556640625, 0.929443359375, 1.027191162109375, 1.12493896484375, 1.222686767578125, 1.3204345703125, 1.418182373046875, 1.51593017578125, 1.613677978515625, 1.71142578125, 1.809173583984375, 1.90692138671875, 2.004669189453125, 2.1024169921875, 2.200164794921875, 2.29791259765625, 2.395660400390625, 2.493408203125, 2.591156005859375, 2.68890380859375, 2.786651611328125, 2.8843994140625, 2.982147216796875, 3.07989501953125, 3.177642822265625, 3.275390625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 16.0, 21.0, 30.0, 39.0, 66.0, 73.0, 94.0, 197.0, 338.0, 1029.0, 5150.0, 60832.0, 3448651.0, 652444.0, 21278.0, 2523.0, 644.0, 303.0, 152.0, 103.0, 85.0, 51.0, 40.0, 33.0, 29.0, 11.0, 14.0, 5.0, 7.0, 3.0, 4.0, 4.0, 5.0], "bins": [-68.375, -66.814208984375, -65.25341796875, -63.692626953125, -62.1318359375, -60.571044921875, -59.01025390625, -57.449462890625, -55.888671875, -54.327880859375, -52.76708984375, -51.206298828125, -49.6455078125, -48.084716796875, -46.52392578125, -44.963134765625, -43.40234375, -41.841552734375, -40.28076171875, -38.719970703125, -37.1591796875, -35.598388671875, -34.03759765625, -32.476806640625, -30.916015625, -29.355224609375, -27.79443359375, -26.233642578125, -24.6728515625, -23.112060546875, -21.55126953125, -19.990478515625, -18.4296875, -16.868896484375, -15.30810546875, -13.747314453125, -12.1865234375, -10.625732421875, -9.06494140625, -7.504150390625, -5.943359375, -4.382568359375, -2.82177734375, -1.260986328125, 0.2998046875, 1.860595703125, 3.42138671875, 4.982177734375, 6.54296875, 8.103759765625, 9.66455078125, 11.225341796875, 12.7861328125, 14.346923828125, 15.90771484375, 17.468505859375, 19.029296875, 20.590087890625, 22.15087890625, 23.711669921875, 25.2724609375, 26.833251953125, 28.39404296875, 29.954833984375, 31.515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 8.0, 17.0, 24.0, 47.0, 91.0, 164.0, 318.0, 748.0, 1413.0, 532.0, 313.0, 172.0, 85.0, 49.0, 33.0, 21.0, 10.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.13671875, -5.73760986328125, -5.3385009765625, -4.93939208984375, -4.540283203125, -4.14117431640625, -3.7420654296875, -3.34295654296875, -2.94384765625, -2.54473876953125, -2.1456298828125, -1.74652099609375, -1.347412109375, -0.94830322265625, -0.5491943359375, -0.15008544921875, 0.2490234375, 0.64813232421875, 1.0472412109375, 1.44635009765625, 1.845458984375, 2.24456787109375, 2.6436767578125, 3.04278564453125, 3.44189453125, 3.84100341796875, 4.2401123046875, 4.63922119140625, 5.038330078125, 5.43743896484375, 5.8365478515625, 6.23565673828125, 6.634765625, 7.03387451171875, 7.4329833984375, 7.83209228515625, 8.231201171875, 8.63031005859375, 9.0294189453125, 9.42852783203125, 9.82763671875, 10.22674560546875, 10.6258544921875, 11.02496337890625, 11.424072265625, 11.82318115234375, 12.2222900390625, 12.62139892578125, 13.0205078125, 13.41961669921875, 13.8187255859375, 14.21783447265625, 14.616943359375, 15.01605224609375, 15.4151611328125, 15.81427001953125, 16.21337890625, 16.61248779296875, 17.0115966796875, 17.41070556640625, 17.809814453125, 18.20892333984375, 18.6080322265625, 19.00714111328125, 19.40625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 15.0, 33.0, 65.0, 98.0, 140.0, 169.0, 154.0, 127.0, 96.0, 37.0, 24.0, 16.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.52430725097656, -116.35123443603516, -113.17815399169922, -110.00508117675781, -106.83200073242188, -103.65892791748047, -100.48585510253906, -97.31277465820312, -94.13970184326172, -90.96662902832031, -87.79354858398438, -84.62047576904297, -81.44740295410156, -78.27432250976562, -75.10124969482422, -71.92817687988281, -68.75509643554688, -65.58202362060547, -62.40894317626953, -59.235870361328125, -56.06279373168945, -52.88971710205078, -49.716644287109375, -46.5435676574707, -43.37049102783203, -40.19741439819336, -37.02433776855469, -33.85126495361328, -30.67818832397461, -27.505111694335938, -24.3320369720459, -21.15896224975586, -17.985885620117188, -14.812809944152832, -11.639734268188477, -8.466658592224121, -5.293582916259766, -2.12050724029541, 1.0525684356689453, 4.225643157958984, 7.398719787597656, 10.571795463562012, 13.744871139526367, 16.917945861816406, 20.091022491455078, 23.26409912109375, 26.43717384338379, 29.610248565673828, 32.7833251953125, 35.95640182495117, 39.129478454589844, 42.30255126953125, 45.47562789916992, 48.648704528808594, 51.82177734375, 54.99485397338867, 58.167930603027344, 61.341007232666016, 64.51408386230469, 67.6871566772461, 70.8602294921875, 74.03330993652344, 77.20638275146484, 80.37945556640625, 83.55253601074219]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 7.0, 13.0, 12.0, 11.0, 17.0, 27.0, 25.0, 37.0, 29.0, 40.0, 42.0, 31.0, 61.0, 54.0, 52.0, 46.0, 51.0, 50.0, 45.0, 41.0, 43.0, 38.0, 26.0, 36.0, 28.0, 20.0, 16.0, 13.0, 14.0, 16.0, 15.0, 10.0, 8.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.718284606933594, -33.530364990234375, -32.342445373535156, -31.15452766418457, -29.966609954833984, -28.778690338134766, -27.590770721435547, -26.402851104736328, -25.214933395385742, -24.027013778686523, -22.839096069335938, -21.65117645263672, -20.4632568359375, -19.275339126586914, -18.087419509887695, -16.89950180053711, -15.71158218383789, -14.523663520812988, -13.335744857788086, -12.147825241088867, -10.959906578063965, -9.771987915039062, -8.584068298339844, -7.396149635314941, -6.208230972290039, -5.020312309265137, -3.832393169403076, -2.6444742679595947, -1.4565553665161133, -0.26863670349121094, 0.9192824363708496, 2.10720157623291, 3.2951202392578125, 4.483038902282715, 5.670958042144775, 6.858877182006836, 8.046795845031738, 9.23471450805664, 10.42263412475586, 11.610552787780762, 12.798471450805664, 13.986390113830566, 15.174308776855469, 16.362228393554688, 17.550148010253906, 18.738065719604492, 19.92598533630371, 21.113903045654297, 22.301822662353516, 23.489742279052734, 24.67765998840332, 25.86557960510254, 27.053497314453125, 28.241416931152344, 29.429336547851562, 30.61725616455078, 31.805173873901367, 32.99309158325195, 34.18101119995117, 35.36893081665039, 36.55685043334961, 37.74476623535156, 38.93268585205078, 40.12060546875, 41.30852508544922]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 15.0, 10.0, 17.0, 20.0, 48.0, 48.0, 91.0, 138.0, 231.0, 373.0, 671.0, 1090.0, 2229.0, 4442.0, 9532.0, 21119.0, 47715.0, 105883.0, 222966.0, 308323.0, 174033.0, 81361.0, 36548.0, 16605.0, 7491.0, 3470.0, 1820.0, 925.0, 531.0, 312.0, 196.0, 102.0, 75.0, 41.0, 24.0, 23.0, 15.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.8203125, -15.345703125, -14.87109375, -14.396484375, -13.921875, -13.447265625, -12.97265625, -12.498046875, -12.0234375, -11.548828125, -11.07421875, -10.599609375, -10.125, -9.650390625, -9.17578125, -8.701171875, -8.2265625, -7.751953125, -7.27734375, -6.802734375, -6.328125, -5.853515625, -5.37890625, -4.904296875, -4.4296875, -3.955078125, -3.48046875, -3.005859375, -2.53125, -2.056640625, -1.58203125, -1.107421875, -0.6328125, -0.158203125, 0.31640625, 0.791015625, 1.265625, 1.740234375, 2.21484375, 2.689453125, 3.1640625, 3.638671875, 4.11328125, 4.587890625, 5.0625, 5.537109375, 6.01171875, 6.486328125, 6.9609375, 7.435546875, 7.91015625, 8.384765625, 8.859375, 9.333984375, 9.80859375, 10.283203125, 10.7578125, 11.232421875, 11.70703125, 12.181640625, 12.65625, 13.130859375, 13.60546875, 14.080078125, 14.5546875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 6.0, 17.0, 11.0, 23.0, 17.0, 27.0, 33.0, 19.0, 37.0, 30.0, 38.0, 46.0, 47.0, 49.0, 60.0, 61.0, 46.0, 43.0, 43.0, 40.0, 39.0, 33.0, 38.0, 25.0, 27.0, 14.0, 27.0, 18.0, 15.0, 13.0, 15.0, 6.0, 8.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.334197998046875, -2.24456787109375, -2.154937744140625, -2.0653076171875, -1.975677490234375, -1.88604736328125, -1.796417236328125, -1.706787109375, -1.617156982421875, -1.52752685546875, -1.437896728515625, -1.3482666015625, -1.258636474609375, -1.16900634765625, -1.079376220703125, -0.98974609375, -0.900115966796875, -0.81048583984375, -0.720855712890625, -0.6312255859375, -0.541595458984375, -0.45196533203125, -0.362335205078125, -0.272705078125, -0.183074951171875, -0.09344482421875, -0.003814697265625, 0.0858154296875, 0.175445556640625, 0.26507568359375, 0.354705810546875, 0.4443359375, 0.533966064453125, 0.62359619140625, 0.713226318359375, 0.8028564453125, 0.892486572265625, 0.98211669921875, 1.071746826171875, 1.161376953125, 1.251007080078125, 1.34063720703125, 1.430267333984375, 1.5198974609375, 1.609527587890625, 1.69915771484375, 1.788787841796875, 1.87841796875, 1.968048095703125, 2.05767822265625, 2.147308349609375, 2.2369384765625, 2.326568603515625, 2.41619873046875, 2.505828857421875, 2.595458984375, 2.685089111328125, 2.77471923828125, 2.864349365234375, 2.9539794921875, 3.043609619140625, 3.13323974609375, 3.222869873046875, 3.3125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 0.0, 8.0, 9.0, 9.0, 13.0, 20.0, 28.0, 27.0, 36.0, 44.0, 50.0, 79.0, 75.0, 115.0, 164.0, 164.0, 246.0, 366.0, 543.0, 833.0, 1383.0, 2520.0, 4933.0, 9875.0, 21844.0, 49167.0, 107570.0, 225417.0, 298251.0, 173958.0, 81041.0, 36286.0, 16369.0, 7588.0, 3840.0, 1982.0, 1159.0, 739.0, 505.0, 335.0, 253.0, 159.0, 122.0, 105.0, 79.0, 56.0, 50.0, 38.0, 27.0, 21.0, 14.0, 17.0, 8.0, 3.0, 4.0, 9.0, 4.0, 1.0, 4.0, 1.0], "bins": [-11.59375, -11.2349853515625, -10.876220703125, -10.5174560546875, -10.15869140625, -9.7999267578125, -9.441162109375, -9.0823974609375, -8.7236328125, -8.3648681640625, -8.006103515625, -7.6473388671875, -7.28857421875, -6.9298095703125, -6.571044921875, -6.2122802734375, -5.853515625, -5.4947509765625, -5.135986328125, -4.7772216796875, -4.41845703125, -4.0596923828125, -3.700927734375, -3.3421630859375, -2.9833984375, -2.6246337890625, -2.265869140625, -1.9071044921875, -1.54833984375, -1.1895751953125, -0.830810546875, -0.4720458984375, -0.11328125, 0.2454833984375, 0.604248046875, 0.9630126953125, 1.32177734375, 1.6805419921875, 2.039306640625, 2.3980712890625, 2.7568359375, 3.1156005859375, 3.474365234375, 3.8331298828125, 4.19189453125, 4.5506591796875, 4.909423828125, 5.2681884765625, 5.626953125, 5.9857177734375, 6.344482421875, 6.7032470703125, 7.06201171875, 7.4207763671875, 7.779541015625, 8.1383056640625, 8.4970703125, 8.8558349609375, 9.214599609375, 9.5733642578125, 9.93212890625, 10.2908935546875, 10.649658203125, 11.0084228515625, 11.3671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 8.0, 12.0, 7.0, 15.0, 11.0, 14.0, 17.0, 18.0, 19.0, 41.0, 34.0, 40.0, 37.0, 41.0, 57.0, 42.0, 54.0, 44.0, 59.0, 56.0, 44.0, 37.0, 54.0, 44.0, 37.0, 21.0, 32.0, 19.0, 16.0, 14.0, 17.0, 17.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.453125, -12.997802734375, -12.54248046875, -12.087158203125, -11.6318359375, -11.176513671875, -10.72119140625, -10.265869140625, -9.810546875, -9.355224609375, -8.89990234375, -8.444580078125, -7.9892578125, -7.533935546875, -7.07861328125, -6.623291015625, -6.16796875, -5.712646484375, -5.25732421875, -4.802001953125, -4.3466796875, -3.891357421875, -3.43603515625, -2.980712890625, -2.525390625, -2.070068359375, -1.61474609375, -1.159423828125, -0.7041015625, -0.248779296875, 0.20654296875, 0.661865234375, 1.1171875, 1.572509765625, 2.02783203125, 2.483154296875, 2.9384765625, 3.393798828125, 3.84912109375, 4.304443359375, 4.759765625, 5.215087890625, 5.67041015625, 6.125732421875, 6.5810546875, 7.036376953125, 7.49169921875, 7.947021484375, 8.40234375, 8.857666015625, 9.31298828125, 9.768310546875, 10.2236328125, 10.678955078125, 11.13427734375, 11.589599609375, 12.044921875, 12.500244140625, 12.95556640625, 13.410888671875, 13.8662109375, 14.321533203125, 14.77685546875, 15.232177734375, 15.6875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 8.0, 12.0, 13.0, 20.0, 34.0, 45.0, 67.0, 130.0, 234.0, 353.0, 689.0, 1337.0, 3090.0, 7960.0, 24572.0, 95402.0, 383326.0, 392536.0, 99049.0, 25246.0, 8244.0, 3180.0, 1357.0, 693.0, 379.0, 209.0, 134.0, 81.0, 50.0, 33.0, 18.0, 13.0, 12.0, 7.0, 8.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.3046875, -9.9827880859375, -9.660888671875, -9.3389892578125, -9.01708984375, -8.6951904296875, -8.373291015625, -8.0513916015625, -7.7294921875, -7.4075927734375, -7.085693359375, -6.7637939453125, -6.44189453125, -6.1199951171875, -5.798095703125, -5.4761962890625, -5.154296875, -4.8323974609375, -4.510498046875, -4.1885986328125, -3.86669921875, -3.5447998046875, -3.222900390625, -2.9010009765625, -2.5791015625, -2.2572021484375, -1.935302734375, -1.6134033203125, -1.29150390625, -0.9696044921875, -0.647705078125, -0.3258056640625, -0.00390625, 0.3179931640625, 0.639892578125, 0.9617919921875, 1.28369140625, 1.6055908203125, 1.927490234375, 2.2493896484375, 2.5712890625, 2.8931884765625, 3.215087890625, 3.5369873046875, 3.85888671875, 4.1807861328125, 4.502685546875, 4.8245849609375, 5.146484375, 5.4683837890625, 5.790283203125, 6.1121826171875, 6.43408203125, 6.7559814453125, 7.077880859375, 7.3997802734375, 7.7216796875, 8.0435791015625, 8.365478515625, 8.6873779296875, 9.00927734375, 9.3311767578125, 9.653076171875, 9.9749755859375, 10.296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 5.0, 3.0, 2.0, 6.0, 2.0, 6.0, 10.0, 16.0, 9.0, 23.0, 24.0, 28.0, 41.0, 28.0, 62.0, 57.0, 95.0, 125.0, 98.0, 73.0, 52.0, 45.0, 40.0, 21.0, 25.0, 21.0, 15.0, 13.0, 12.0, 11.0, 9.0, 3.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0014162063598632812, -0.0013765394687652588, -0.0013368725776672363, -0.0012972056865692139, -0.0012575387954711914, -0.001217871904373169, -0.0011782050132751465, -0.001138538122177124, -0.0010988712310791016, -0.001059204339981079, -0.0010195374488830566, -0.0009798705577850342, -0.0009402036666870117, -0.0009005367755889893, -0.0008608698844909668, -0.0008212029933929443, -0.0007815361022949219, -0.0007418692111968994, -0.000702202320098877, -0.0006625354290008545, -0.000622868537902832, -0.0005832016468048096, -0.0005435347557067871, -0.0005038678646087646, -0.0004642009735107422, -0.0004245340824127197, -0.00038486719131469727, -0.0003452003002166748, -0.00030553340911865234, -0.0002658665180206299, -0.00022619962692260742, -0.00018653273582458496, -0.0001468658447265625, -0.00010719895362854004, -6.753206253051758e-05, -2.7865171432495117e-05, 1.1801719665527344e-05, 5.1468610763549805e-05, 9.113550186157227e-05, 0.00013080239295959473, 0.0001704692840576172, 0.00021013617515563965, 0.0002498030662536621, 0.00028946995735168457, 0.00032913684844970703, 0.0003688037395477295, 0.00040847063064575195, 0.0004481375217437744, 0.0004878044128417969, 0.0005274713039398193, 0.0005671381950378418, 0.0006068050861358643, 0.0006464719772338867, 0.0006861388683319092, 0.0007258057594299316, 0.0007654726505279541, 0.0008051395416259766, 0.000844806432723999, 0.0008844733238220215, 0.0009241402149200439, 0.0009638071060180664, 0.0010034739971160889, 0.0010431408882141113, 0.0010828077793121338, 0.0011224746704101562]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 1.0, 5.0, 5.0, 11.0, 16.0, 19.0, 26.0, 43.0, 93.0, 161.0, 321.0, 596.0, 1213.0, 2848.0, 8064.0, 28335.0, 133456.0, 528648.0, 270948.0, 52673.0, 13345.0, 4230.0, 1784.0, 803.0, 353.0, 215.0, 122.0, 66.0, 51.0, 31.0, 17.0, 19.0, 14.0, 8.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5, -13.111083984375, -12.72216796875, -12.333251953125, -11.9443359375, -11.555419921875, -11.16650390625, -10.777587890625, -10.388671875, -9.999755859375, -9.61083984375, -9.221923828125, -8.8330078125, -8.444091796875, -8.05517578125, -7.666259765625, -7.27734375, -6.888427734375, -6.49951171875, -6.110595703125, -5.7216796875, -5.332763671875, -4.94384765625, -4.554931640625, -4.166015625, -3.777099609375, -3.38818359375, -2.999267578125, -2.6103515625, -2.221435546875, -1.83251953125, -1.443603515625, -1.0546875, -0.665771484375, -0.27685546875, 0.112060546875, 0.5009765625, 0.889892578125, 1.27880859375, 1.667724609375, 2.056640625, 2.445556640625, 2.83447265625, 3.223388671875, 3.6123046875, 4.001220703125, 4.39013671875, 4.779052734375, 5.16796875, 5.556884765625, 5.94580078125, 6.334716796875, 6.7236328125, 7.112548828125, 7.50146484375, 7.890380859375, 8.279296875, 8.668212890625, 9.05712890625, 9.446044921875, 9.8349609375, 10.223876953125, 10.61279296875, 11.001708984375, 11.390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 9.0, 14.0, 21.0, 19.0, 31.0, 35.0, 40.0, 58.0, 71.0, 88.0, 79.0, 96.0, 79.0, 75.0, 54.0, 52.0, 41.0, 29.0, 29.0, 12.0, 11.0, 4.0, 9.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.26953125, -7.0362548828125, -6.802978515625, -6.5697021484375, -6.33642578125, -6.1031494140625, -5.869873046875, -5.6365966796875, -5.4033203125, -5.1700439453125, -4.936767578125, -4.7034912109375, -4.47021484375, -4.2369384765625, -4.003662109375, -3.7703857421875, -3.537109375, -3.3038330078125, -3.070556640625, -2.8372802734375, -2.60400390625, -2.3707275390625, -2.137451171875, -1.9041748046875, -1.6708984375, -1.4376220703125, -1.204345703125, -0.9710693359375, -0.73779296875, -0.5045166015625, -0.271240234375, -0.0379638671875, 0.1953125, 0.4285888671875, 0.661865234375, 0.8951416015625, 1.12841796875, 1.3616943359375, 1.594970703125, 1.8282470703125, 2.0615234375, 2.2947998046875, 2.528076171875, 2.7613525390625, 2.99462890625, 3.2279052734375, 3.461181640625, 3.6944580078125, 3.927734375, 4.1610107421875, 4.394287109375, 4.6275634765625, 4.86083984375, 5.0941162109375, 5.327392578125, 5.5606689453125, 5.7939453125, 6.0272216796875, 6.260498046875, 6.4937744140625, 6.72705078125, 6.9603271484375, 7.193603515625, 7.4268798828125, 7.66015625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 13.0, 11.0, 16.0, 31.0, 67.0, 104.0, 145.0, 162.0, 170.0, 133.0, 76.0, 36.0, 16.0, 11.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.40904235839844, -167.1335906982422, -161.85813903808594, -156.5826873779297, -151.3072509765625, -146.03179931640625, -140.75634765625, -135.48089599609375, -130.2054443359375, -124.92999267578125, -119.654541015625, -114.37909698486328, -109.10364532470703, -103.82819366455078, -98.55274963378906, -93.27729797363281, -88.00184631347656, -82.72639465332031, -77.45094299316406, -72.17549896240234, -66.9000473022461, -61.624595642089844, -56.34914779663086, -51.073699951171875, -45.798248291015625, -40.522796630859375, -35.24734878540039, -29.971899032592773, -24.696449279785156, -19.42099952697754, -14.145549774169922, -8.870101928710938, -3.59466552734375, 1.6807842254638672, 6.956233978271484, 12.231683731079102, 17.50713348388672, 22.782583236694336, 28.058032989501953, 33.33348083496094, 38.60893249511719, 43.88438415527344, 49.15983200073242, 54.435279846191406, 59.710731506347656, 64.9861831665039, 70.26162719726562, 75.53707885742188, 80.81253051757812, 86.08798217773438, 91.36343383789062, 96.63887786865234, 101.9143295288086, 107.18978118896484, 112.46522521972656, 117.74067687988281, 123.01612854003906, 128.2915802001953, 133.56703186035156, 138.8424835205078, 144.117919921875, 149.39337158203125, 154.6688232421875, 159.94427490234375, 165.2197265625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 5.0, 10.0, 10.0, 7.0, 12.0, 8.0, 9.0, 19.0, 12.0, 18.0, 19.0, 19.0, 20.0, 26.0, 37.0, 39.0, 42.0, 29.0, 30.0, 35.0, 29.0, 38.0, 42.0, 40.0, 45.0, 38.0, 41.0, 36.0, 27.0, 28.0, 32.0, 21.0, 22.0, 20.0, 28.0, 21.0, 9.0, 17.0, 13.0, 9.0, 12.0, 6.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.08466339111328, -63.961360931396484, -61.83805847167969, -59.714759826660156, -57.59145736694336, -55.46815490722656, -53.34485626220703, -51.221553802490234, -49.09825134277344, -46.97494888305664, -44.851646423339844, -42.72834777832031, -40.605045318603516, -38.48174285888672, -36.35844421386719, -34.23514175415039, -32.111839294433594, -29.988536834716797, -27.865236282348633, -25.74193572998047, -23.618633270263672, -21.495330810546875, -19.37203025817871, -17.248729705810547, -15.12542724609375, -13.00212574005127, -10.878824234008789, -8.755522727966309, -6.632221221923828, -4.508919715881348, -2.385618209838867, -0.2623167037963867, 1.8609771728515625, 3.984278678894043, 6.107580184936523, 8.230881690979004, 10.354183197021484, 12.477484703063965, 14.600786209106445, 16.72408676147461, 18.847389221191406, 20.970691680908203, 23.093992233276367, 25.21729278564453, 27.340595245361328, 29.463897705078125, 31.58719825744629, 33.71049880981445, 35.83380126953125, 37.95710372924805, 40.080406188964844, 42.203704833984375, 44.32700729370117, 46.45030975341797, 48.5736083984375, 50.6969108581543, 52.820213317871094, 54.94351577758789, 57.06681823730469, 59.19011688232422, 61.313419342041016, 63.43672180175781, 65.56002044677734, 67.6833267211914, 69.80662536621094]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 2.0, 5.0, 7.0, 12.0, 14.0, 10.0, 28.0, 27.0, 39.0, 58.0, 96.0, 141.0, 206.0, 298.0, 451.0, 772.0, 1292.0, 2377.0, 4293.0, 8631.0, 17320.0, 41603.0, 128170.0, 1082907.0, 2659429.0, 157327.0, 47718.0, 20063.0, 9325.0, 4873.0, 2670.0, 1498.0, 933.0, 571.0, 360.0, 243.0, 163.0, 114.0, 75.0, 44.0, 37.0, 25.0, 18.0, 12.0, 12.0, 2.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-16.46875, -15.9708251953125, -15.472900390625, -14.9749755859375, -14.47705078125, -13.9791259765625, -13.481201171875, -12.9832763671875, -12.4853515625, -11.9874267578125, -11.489501953125, -10.9915771484375, -10.49365234375, -9.9957275390625, -9.497802734375, -8.9998779296875, -8.501953125, -8.0040283203125, -7.506103515625, -7.0081787109375, -6.51025390625, -6.0123291015625, -5.514404296875, -5.0164794921875, -4.5185546875, -4.0206298828125, -3.522705078125, -3.0247802734375, -2.52685546875, -2.0289306640625, -1.531005859375, -1.0330810546875, -0.53515625, -0.0372314453125, 0.460693359375, 0.9586181640625, 1.45654296875, 1.9544677734375, 2.452392578125, 2.9503173828125, 3.4482421875, 3.9461669921875, 4.444091796875, 4.9420166015625, 5.43994140625, 5.9378662109375, 6.435791015625, 6.9337158203125, 7.431640625, 7.9295654296875, 8.427490234375, 8.9254150390625, 9.42333984375, 9.9212646484375, 10.419189453125, 10.9171142578125, 11.4150390625, 11.9129638671875, 12.410888671875, 12.9088134765625, 13.40673828125, 13.9046630859375, 14.402587890625, 14.9005126953125, 15.3984375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 2.0, 6.0, 4.0, 11.0, 10.0, 15.0, 17.0, 20.0, 17.0, 23.0, 25.0, 24.0, 41.0, 27.0, 52.0, 32.0, 61.0, 41.0, 33.0, 51.0, 51.0, 44.0, 39.0, 29.0, 39.0, 40.0, 34.0, 33.0, 16.0, 28.0, 16.0, 27.0, 11.0, 14.0, 13.0, 11.0, 9.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.455078125, -2.3699951171875, -2.284912109375, -2.1998291015625, -2.11474609375, -2.0296630859375, -1.944580078125, -1.8594970703125, -1.7744140625, -1.6893310546875, -1.604248046875, -1.5191650390625, -1.43408203125, -1.3489990234375, -1.263916015625, -1.1788330078125, -1.09375, -1.0086669921875, -0.923583984375, -0.8385009765625, -0.75341796875, -0.6683349609375, -0.583251953125, -0.4981689453125, -0.4130859375, -0.3280029296875, -0.242919921875, -0.1578369140625, -0.07275390625, 0.0123291015625, 0.097412109375, 0.1824951171875, 0.267578125, 0.3526611328125, 0.437744140625, 0.5228271484375, 0.60791015625, 0.6929931640625, 0.778076171875, 0.8631591796875, 0.9482421875, 1.0333251953125, 1.118408203125, 1.2034912109375, 1.28857421875, 1.3736572265625, 1.458740234375, 1.5438232421875, 1.62890625, 1.7139892578125, 1.799072265625, 1.8841552734375, 1.96923828125, 2.0543212890625, 2.139404296875, 2.2244873046875, 2.3095703125, 2.3946533203125, 2.479736328125, 2.5648193359375, 2.64990234375, 2.7349853515625, 2.820068359375, 2.9051513671875, 2.990234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 12.0, 13.0, 30.0, 16.0, 28.0, 28.0, 34.0, 57.0, 67.0, 72.0, 82.0, 132.0, 272.0, 899.0, 3622.0, 22771.0, 278620.0, 3700009.0, 167118.0, 16214.0, 2712.0, 657.0, 237.0, 120.0, 82.0, 71.0, 56.0, 39.0, 35.0, 35.0, 22.0, 36.0, 14.0, 19.0, 10.0, 7.0, 9.0, 3.0, 2.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -34.1279296875, -33.005859375, -31.8837890625, -30.76171875, -29.6396484375, -28.517578125, -27.3955078125, -26.2734375, -25.1513671875, -24.029296875, -22.9072265625, -21.78515625, -20.6630859375, -19.541015625, -18.4189453125, -17.296875, -16.1748046875, -15.052734375, -13.9306640625, -12.80859375, -11.6865234375, -10.564453125, -9.4423828125, -8.3203125, -7.1982421875, -6.076171875, -4.9541015625, -3.83203125, -2.7099609375, -1.587890625, -0.4658203125, 0.65625, 1.7783203125, 2.900390625, 4.0224609375, 5.14453125, 6.2666015625, 7.388671875, 8.5107421875, 9.6328125, 10.7548828125, 11.876953125, 12.9990234375, 14.12109375, 15.2431640625, 16.365234375, 17.4873046875, 18.609375, 19.7314453125, 20.853515625, 21.9755859375, 23.09765625, 24.2197265625, 25.341796875, 26.4638671875, 27.5859375, 28.7080078125, 29.830078125, 30.9521484375, 32.07421875, 33.1962890625, 34.318359375, 35.4404296875, 36.5625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 17.0, 12.0, 31.0, 82.0, 144.0, 420.0, 1957.0, 923.0, 263.0, 112.0, 53.0, 31.0, 17.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.984375, -16.522705078125, -16.06103515625, -15.599365234375, -15.1376953125, -14.676025390625, -14.21435546875, -13.752685546875, -13.291015625, -12.829345703125, -12.36767578125, -11.906005859375, -11.4443359375, -10.982666015625, -10.52099609375, -10.059326171875, -9.59765625, -9.135986328125, -8.67431640625, -8.212646484375, -7.7509765625, -7.289306640625, -6.82763671875, -6.365966796875, -5.904296875, -5.442626953125, -4.98095703125, -4.519287109375, -4.0576171875, -3.595947265625, -3.13427734375, -2.672607421875, -2.2109375, -1.749267578125, -1.28759765625, -0.825927734375, -0.3642578125, 0.097412109375, 0.55908203125, 1.020751953125, 1.482421875, 1.944091796875, 2.40576171875, 2.867431640625, 3.3291015625, 3.790771484375, 4.25244140625, 4.714111328125, 5.17578125, 5.637451171875, 6.09912109375, 6.560791015625, 7.0224609375, 7.484130859375, 7.94580078125, 8.407470703125, 8.869140625, 9.330810546875, 9.79248046875, 10.254150390625, 10.7158203125, 11.177490234375, 11.63916015625, 12.100830078125, 12.5625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 13.0, 13.0, 12.0, 26.0, 52.0, 59.0, 98.0, 140.0, 147.0, 122.0, 117.0, 73.0, 49.0, 29.0, 23.0, 12.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-74.19105529785156, -72.3633041381836, -70.53555297851562, -68.70780181884766, -66.88005065917969, -65.05229187011719, -63.22454071044922, -61.39678955078125, -59.56903839111328, -57.74128723144531, -55.913536071777344, -54.08578109741211, -52.25802993774414, -50.43027877807617, -48.60252380371094, -46.77477264404297, -44.947021484375, -43.11927032470703, -41.29151916503906, -39.46376419067383, -37.63601303100586, -35.80826187133789, -33.980506896972656, -32.15275573730469, -30.32500457763672, -28.49725341796875, -26.66950035095215, -24.841747283935547, -23.013996124267578, -21.18624496459961, -19.358491897583008, -17.530738830566406, -15.702987670898438, -13.875235557556152, -12.047483444213867, -10.219731330871582, -8.391979217529297, -6.564227104187012, -4.736474990844727, -2.9087228775024414, -1.0809707641601562, 0.7467813491821289, 2.574533462524414, 4.402285575866699, 6.230037689208984, 8.05778980255127, 9.885541915893555, 11.71329402923584, 13.541046142578125, 15.36879825592041, 17.196550369262695, 19.024303436279297, 20.852054595947266, 22.679805755615234, 24.507558822631836, 26.335311889648438, 28.163063049316406, 29.990814208984375, 31.818567276000977, 33.64632034301758, 35.47407150268555, 37.301822662353516, 39.12957763671875, 40.95732879638672, 42.78507995605469]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 6.0, 15.0, 5.0, 14.0, 14.0, 12.0, 19.0, 14.0, 22.0, 25.0, 21.0, 33.0, 34.0, 32.0, 30.0, 29.0, 41.0, 30.0, 30.0, 35.0, 38.0, 41.0, 27.0, 52.0, 37.0, 36.0, 37.0, 22.0, 24.0, 25.0, 19.0, 25.0, 10.0, 19.0, 13.0, 12.0, 16.0, 11.0, 14.0, 8.0, 9.0, 10.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-20.922992706298828, -20.303266525268555, -19.683542251586914, -19.06381607055664, -18.444091796875, -17.824365615844727, -17.204641342163086, -16.584915161132812, -15.965190887451172, -15.345465660095215, -14.725740432739258, -14.1060152053833, -13.486289978027344, -12.866564750671387, -12.24683952331543, -11.627113342285156, -11.0073881149292, -10.387662887573242, -9.767937660217285, -9.148212432861328, -8.528487205505371, -7.908761978149414, -7.289036273956299, -6.669311046600342, -6.049585819244385, -5.429860591888428, -4.810135364532471, -4.1904096603393555, -3.5706846714019775, -2.9509594440460205, -2.3312339782714844, -1.7115087509155273, -1.0917835235595703, -0.4720582365989685, 0.1476670503616333, 0.7673923969268799, 1.387117624282837, 2.006842851638794, 2.62656831741333, 3.246293544769287, 3.866018772125244, 4.485743999481201, 5.105469226837158, 5.725194931030273, 6.3449201583862305, 6.9646453857421875, 7.5843706130981445, 8.204095840454102, 8.823821067810059, 9.443546295166016, 10.063271522521973, 10.68299674987793, 11.302721977233887, 11.922447204589844, 12.542173385620117, 13.161897659301758, 13.781623840332031, 14.401349067687988, 15.021074295043945, 15.640799522399902, 16.26052474975586, 16.880250930786133, 17.499975204467773, 18.119701385498047, 18.739425659179688]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 8.0, 7.0, 7.0, 11.0, 14.0, 10.0, 17.0, 29.0, 49.0, 52.0, 74.0, 124.0, 182.0, 286.0, 433.0, 613.0, 1004.0, 1570.0, 2702.0, 4802.0, 8567.0, 15385.0, 29035.0, 55184.0, 105526.0, 194999.0, 263603.0, 169983.0, 90984.0, 47380.0, 24866.0, 13229.0, 7357.0, 4101.0, 2465.0, 1400.0, 837.0, 534.0, 332.0, 266.0, 156.0, 109.0, 66.0, 56.0, 37.0, 28.0, 28.0, 12.0, 10.0, 14.0, 8.0, 2.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-11.390625, -10.9892578125, -10.587890625, -10.1865234375, -9.78515625, -9.3837890625, -8.982421875, -8.5810546875, -8.1796875, -7.7783203125, -7.376953125, -6.9755859375, -6.57421875, -6.1728515625, -5.771484375, -5.3701171875, -4.96875, -4.5673828125, -4.166015625, -3.7646484375, -3.36328125, -2.9619140625, -2.560546875, -2.1591796875, -1.7578125, -1.3564453125, -0.955078125, -0.5537109375, -0.15234375, 0.2490234375, 0.650390625, 1.0517578125, 1.453125, 1.8544921875, 2.255859375, 2.6572265625, 3.05859375, 3.4599609375, 3.861328125, 4.2626953125, 4.6640625, 5.0654296875, 5.466796875, 5.8681640625, 6.26953125, 6.6708984375, 7.072265625, 7.4736328125, 7.875, 8.2763671875, 8.677734375, 9.0791015625, 9.48046875, 9.8818359375, 10.283203125, 10.6845703125, 11.0859375, 11.4873046875, 11.888671875, 12.2900390625, 12.69140625, 13.0927734375, 13.494140625, 13.8955078125, 14.296875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 4.0, 2.0, 5.0, 11.0, 8.0, 13.0, 18.0, 21.0, 18.0, 16.0, 19.0, 21.0, 35.0, 27.0, 38.0, 51.0, 45.0, 41.0, 47.0, 63.0, 39.0, 39.0, 48.0, 39.0, 41.0, 33.0, 37.0, 30.0, 23.0, 21.0, 23.0, 14.0, 19.0, 13.0, 19.0, 14.0, 13.0, 8.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.330078125, -2.245452880859375, -2.16082763671875, -2.076202392578125, -1.9915771484375, -1.906951904296875, -1.82232666015625, -1.737701416015625, -1.653076171875, -1.568450927734375, -1.48382568359375, -1.399200439453125, -1.3145751953125, -1.229949951171875, -1.14532470703125, -1.060699462890625, -0.97607421875, -0.891448974609375, -0.80682373046875, -0.722198486328125, -0.6375732421875, -0.552947998046875, -0.46832275390625, -0.383697509765625, -0.299072265625, -0.214447021484375, -0.12982177734375, -0.045196533203125, 0.0394287109375, 0.124053955078125, 0.20867919921875, 0.293304443359375, 0.3779296875, 0.462554931640625, 0.54718017578125, 0.631805419921875, 0.7164306640625, 0.801055908203125, 0.88568115234375, 0.970306396484375, 1.054931640625, 1.139556884765625, 1.22418212890625, 1.308807373046875, 1.3934326171875, 1.478057861328125, 1.56268310546875, 1.647308349609375, 1.73193359375, 1.816558837890625, 1.90118408203125, 1.985809326171875, 2.0704345703125, 2.155059814453125, 2.23968505859375, 2.324310302734375, 2.408935546875, 2.493560791015625, 2.57818603515625, 2.662811279296875, 2.7474365234375, 2.832061767578125, 2.91668701171875, 3.001312255859375, 3.0859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 2.0, 8.0, 6.0, 10.0, 12.0, 18.0, 31.0, 31.0, 42.0, 53.0, 67.0, 92.0, 120.0, 159.0, 239.0, 308.0, 405.0, 650.0, 1153.0, 2378.0, 6360.0, 19346.0, 67781.0, 228191.0, 438523.0, 196951.0, 58092.0, 16723.0, 5441.0, 2190.0, 1083.0, 617.0, 374.0, 272.0, 206.0, 161.0, 99.0, 80.0, 60.0, 50.0, 34.0, 32.0, 28.0, 18.0, 21.0, 14.0, 4.0, 5.0, 7.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-17.65625, -17.128173828125, -16.60009765625, -16.072021484375, -15.5439453125, -15.015869140625, -14.48779296875, -13.959716796875, -13.431640625, -12.903564453125, -12.37548828125, -11.847412109375, -11.3193359375, -10.791259765625, -10.26318359375, -9.735107421875, -9.20703125, -8.678955078125, -8.15087890625, -7.622802734375, -7.0947265625, -6.566650390625, -6.03857421875, -5.510498046875, -4.982421875, -4.454345703125, -3.92626953125, -3.398193359375, -2.8701171875, -2.342041015625, -1.81396484375, -1.285888671875, -0.7578125, -0.229736328125, 0.29833984375, 0.826416015625, 1.3544921875, 1.882568359375, 2.41064453125, 2.938720703125, 3.466796875, 3.994873046875, 4.52294921875, 5.051025390625, 5.5791015625, 6.107177734375, 6.63525390625, 7.163330078125, 7.69140625, 8.219482421875, 8.74755859375, 9.275634765625, 9.8037109375, 10.331787109375, 10.85986328125, 11.387939453125, 11.916015625, 12.444091796875, 12.97216796875, 13.500244140625, 14.0283203125, 14.556396484375, 15.08447265625, 15.612548828125, 16.140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 4.0, 13.0, 8.0, 8.0, 13.0, 15.0, 23.0, 13.0, 21.0, 28.0, 27.0, 31.0, 34.0, 38.0, 50.0, 35.0, 41.0, 49.0, 42.0, 53.0, 29.0, 37.0, 35.0, 38.0, 29.0, 31.0, 29.0, 32.0, 32.0, 22.0, 17.0, 21.0, 14.0, 11.0, 16.0, 10.0, 13.0, 10.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.46875, -11.112060546875, -10.75537109375, -10.398681640625, -10.0419921875, -9.685302734375, -9.32861328125, -8.971923828125, -8.615234375, -8.258544921875, -7.90185546875, -7.545166015625, -7.1884765625, -6.831787109375, -6.47509765625, -6.118408203125, -5.76171875, -5.405029296875, -5.04833984375, -4.691650390625, -4.3349609375, -3.978271484375, -3.62158203125, -3.264892578125, -2.908203125, -2.551513671875, -2.19482421875, -1.838134765625, -1.4814453125, -1.124755859375, -0.76806640625, -0.411376953125, -0.0546875, 0.302001953125, 0.65869140625, 1.015380859375, 1.3720703125, 1.728759765625, 2.08544921875, 2.442138671875, 2.798828125, 3.155517578125, 3.51220703125, 3.868896484375, 4.2255859375, 4.582275390625, 4.93896484375, 5.295654296875, 5.65234375, 6.009033203125, 6.36572265625, 6.722412109375, 7.0791015625, 7.435791015625, 7.79248046875, 8.149169921875, 8.505859375, 8.862548828125, 9.21923828125, 9.575927734375, 9.9326171875, 10.289306640625, 10.64599609375, 11.002685546875, 11.359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 11.0, 10.0, 11.0, 21.0, 24.0, 40.0, 77.0, 173.0, 394.0, 923.0, 2867.0, 10872.0, 63201.0, 521826.0, 389739.0, 45804.0, 8828.0, 2285.0, 809.0, 288.0, 125.0, 78.0, 42.0, 32.0, 19.0, 12.0, 4.0, 10.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5546875, -14.0682373046875, -13.581787109375, -13.0953369140625, -12.60888671875, -12.1224365234375, -11.635986328125, -11.1495361328125, -10.6630859375, -10.1766357421875, -9.690185546875, -9.2037353515625, -8.71728515625, -8.2308349609375, -7.744384765625, -7.2579345703125, -6.771484375, -6.2850341796875, -5.798583984375, -5.3121337890625, -4.82568359375, -4.3392333984375, -3.852783203125, -3.3663330078125, -2.8798828125, -2.3934326171875, -1.906982421875, -1.4205322265625, -0.93408203125, -0.4476318359375, 0.038818359375, 0.5252685546875, 1.01171875, 1.4981689453125, 1.984619140625, 2.4710693359375, 2.95751953125, 3.4439697265625, 3.930419921875, 4.4168701171875, 4.9033203125, 5.3897705078125, 5.876220703125, 6.3626708984375, 6.84912109375, 7.3355712890625, 7.822021484375, 8.3084716796875, 8.794921875, 9.2813720703125, 9.767822265625, 10.2542724609375, 10.74072265625, 11.2271728515625, 11.713623046875, 12.2000732421875, 12.6865234375, 13.1729736328125, 13.659423828125, 14.1458740234375, 14.63232421875, 15.1187744140625, 15.605224609375, 16.0916748046875, 16.578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 8.0, 16.0, 15.0, 21.0, 25.0, 34.0, 39.0, 39.0, 59.0, 83.0, 131.0, 147.0, 91.0, 51.0, 47.0, 36.0, 24.0, 25.0, 15.0, 18.0, 16.0, 12.0, 9.0, 8.0, 4.0, 9.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014314651489257812, -0.001386880874633789, -0.0013422966003417969, -0.0012977123260498047, -0.0012531280517578125, -0.0012085437774658203, -0.0011639595031738281, -0.001119375228881836, -0.0010747909545898438, -0.0010302066802978516, -0.0009856224060058594, -0.0009410381317138672, -0.000896453857421875, -0.0008518695831298828, -0.0008072853088378906, -0.0007627010345458984, -0.0007181167602539062, -0.0006735324859619141, -0.0006289482116699219, -0.0005843639373779297, -0.0005397796630859375, -0.0004951953887939453, -0.0004506111145019531, -0.00040602684020996094, -0.00036144256591796875, -0.00031685829162597656, -0.0002722740173339844, -0.0002276897430419922, -0.00018310546875, -0.0001385211944580078, -9.393692016601562e-05, -4.935264587402344e-05, -4.76837158203125e-06, 3.981590270996094e-05, 8.440017700195312e-05, 0.0001289844512939453, 0.0001735687255859375, 0.0002181529998779297, 0.0002627372741699219, 0.00030732154846191406, 0.00035190582275390625, 0.00039649009704589844, 0.0004410743713378906, 0.0004856586456298828, 0.000530242919921875, 0.0005748271942138672, 0.0006194114685058594, 0.0006639957427978516, 0.0007085800170898438, 0.0007531642913818359, 0.0007977485656738281, 0.0008423328399658203, 0.0008869171142578125, 0.0009315013885498047, 0.0009760856628417969, 0.001020669937133789, 0.0010652542114257812, 0.0011098384857177734, 0.0011544227600097656, 0.0011990070343017578, 0.00124359130859375, 0.0012881755828857422, 0.0013327598571777344, 0.0013773441314697266, 0.0014219284057617188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 3.0, 5.0, 3.0, 8.0, 10.0, 7.0, 10.0, 21.0, 19.0, 31.0, 46.0, 93.0, 126.0, 224.0, 427.0, 829.0, 1781.0, 4803.0, 19727.0, 168037.0, 721096.0, 109259.0, 14749.0, 4035.0, 1613.0, 692.0, 377.0, 188.0, 122.0, 74.0, 34.0, 32.0, 15.0, 18.0, 14.0, 8.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.46875, -17.916015625, -17.36328125, -16.810546875, -16.2578125, -15.705078125, -15.15234375, -14.599609375, -14.046875, -13.494140625, -12.94140625, -12.388671875, -11.8359375, -11.283203125, -10.73046875, -10.177734375, -9.625, -9.072265625, -8.51953125, -7.966796875, -7.4140625, -6.861328125, -6.30859375, -5.755859375, -5.203125, -4.650390625, -4.09765625, -3.544921875, -2.9921875, -2.439453125, -1.88671875, -1.333984375, -0.78125, -0.228515625, 0.32421875, 0.876953125, 1.4296875, 1.982421875, 2.53515625, 3.087890625, 3.640625, 4.193359375, 4.74609375, 5.298828125, 5.8515625, 6.404296875, 6.95703125, 7.509765625, 8.0625, 8.615234375, 9.16796875, 9.720703125, 10.2734375, 10.826171875, 11.37890625, 11.931640625, 12.484375, 13.037109375, 13.58984375, 14.142578125, 14.6953125, 15.248046875, 15.80078125, 16.353515625, 16.90625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 6.0, 3.0, 14.0, 15.0, 21.0, 33.0, 47.0, 54.0, 83.0, 118.0, 107.0, 112.0, 98.0, 63.0, 51.0, 55.0, 27.0, 22.0, 13.0, 7.0, 10.0, 4.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.609375, -7.3284912109375, -7.047607421875, -6.7667236328125, -6.48583984375, -6.2049560546875, -5.924072265625, -5.6431884765625, -5.3623046875, -5.0814208984375, -4.800537109375, -4.5196533203125, -4.23876953125, -3.9578857421875, -3.677001953125, -3.3961181640625, -3.115234375, -2.8343505859375, -2.553466796875, -2.2725830078125, -1.99169921875, -1.7108154296875, -1.429931640625, -1.1490478515625, -0.8681640625, -0.5872802734375, -0.306396484375, -0.0255126953125, 0.25537109375, 0.5362548828125, 0.817138671875, 1.0980224609375, 1.37890625, 1.6597900390625, 1.940673828125, 2.2215576171875, 2.50244140625, 2.7833251953125, 3.064208984375, 3.3450927734375, 3.6259765625, 3.9068603515625, 4.187744140625, 4.4686279296875, 4.74951171875, 5.0303955078125, 5.311279296875, 5.5921630859375, 5.873046875, 6.1539306640625, 6.434814453125, 6.7156982421875, 6.99658203125, 7.2774658203125, 7.558349609375, 7.8392333984375, 8.1201171875, 8.4010009765625, 8.681884765625, 8.9627685546875, 9.24365234375, 9.5245361328125, 9.805419921875, 10.0863037109375, 10.3671875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 9.0, 26.0, 39.0, 81.0, 156.0, 210.0, 191.0, 134.0, 82.0, 39.0, 18.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-172.3468017578125, -166.20130920410156, -160.0558319091797, -153.91033935546875, -147.76486206054688, -141.61936950683594, -135.473876953125, -129.32839965820312, -123.18290710449219, -117.03742218017578, -110.89193725585938, -104.74644470214844, -98.60095977783203, -92.45547485351562, -86.30998229980469, -80.16449737548828, -74.01901245117188, -67.87352752685547, -61.7280387878418, -55.582550048828125, -49.43706512451172, -43.29158020019531, -37.14609146118164, -31.00060272216797, -24.855117797851562, -18.709630966186523, -12.564144134521484, -6.418657302856445, -0.27317047119140625, 5.872316360473633, 12.017803192138672, 18.163291931152344, 24.30877685546875, 30.45426368713379, 36.59975051879883, 42.7452392578125, 48.890724182128906, 55.03620910644531, 61.181697845458984, 67.32718658447266, 73.47267150878906, 79.61815643310547, 85.76364135742188, 91.90913391113281, 98.05461883544922, 104.20010375976562, 110.34559631347656, 116.49108123779297, 122.63656616210938, 128.7820587158203, 134.9275360107422, 141.07302856445312, 147.218505859375, 153.36399841308594, 159.50949096679688, 165.65496826171875, 171.8004608154297, 177.94595336914062, 184.0914306640625, 190.23692321777344, 196.38241577148438, 202.52789306640625, 208.6733856201172, 214.81887817382812, 220.96435546875]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 6.0, 9.0, 10.0, 19.0, 16.0, 11.0, 18.0, 23.0, 21.0, 31.0, 24.0, 25.0, 27.0, 31.0, 39.0, 41.0, 52.0, 48.0, 52.0, 42.0, 42.0, 41.0, 33.0, 43.0, 36.0, 34.0, 32.0, 35.0, 21.0, 22.0, 17.0, 14.0, 12.0, 7.0, 13.0, 11.0, 11.0, 7.0, 10.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-72.09889221191406, -70.00700378417969, -67.91511535644531, -65.82323455810547, -63.731346130371094, -61.63945770263672, -59.547569274902344, -57.45568084716797, -55.36379623413086, -53.271907806396484, -51.180023193359375, -49.088134765625, -46.996246337890625, -44.904361724853516, -42.81247329711914, -40.72058868408203, -38.628700256347656, -36.53681182861328, -34.44492721557617, -32.3530387878418, -30.261152267456055, -28.169265747070312, -26.077377319335938, -23.985490798950195, -21.893604278564453, -19.80171775817871, -17.70983123779297, -15.617942810058594, -13.526056289672852, -11.43416976928711, -9.34228229522705, -7.250394821166992, -5.158515930175781, -3.066628932952881, -0.9747419357299805, 1.11714506149292, 3.2090320587158203, 5.3009185791015625, 7.392806053161621, 9.48469352722168, 11.576580047607422, 13.668466567993164, 15.760354042053223, 17.85224151611328, 19.944128036499023, 22.036014556884766, 24.12790298461914, 26.219789505004883, 28.311676025390625, 30.403562545776367, 32.49544906616211, 34.587337493896484, 36.679222106933594, 38.77111053466797, 40.862998962402344, 42.95488739013672, 45.04677200317383, 47.1386604309082, 49.23054504394531, 51.32243347167969, 53.41432189941406, 55.50620651245117, 57.59809494018555, 59.689979553222656, 61.78186798095703]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 12.0, 7.0, 7.0, 18.0, 25.0, 37.0, 52.0, 73.0, 128.0, 167.0, 288.0, 392.0, 636.0, 1073.0, 1724.0, 3093.0, 5907.0, 12133.0, 27312.0, 71997.0, 278254.0, 3078994.0, 537049.0, 105146.0, 36667.0, 15789.0, 7550.0, 3998.0, 2264.0, 1317.0, 812.0, 479.0, 303.0, 207.0, 125.0, 70.0, 53.0, 43.0, 26.0, 22.0, 13.0, 8.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.296875, -15.7822265625, -15.267578125, -14.7529296875, -14.23828125, -13.7236328125, -13.208984375, -12.6943359375, -12.1796875, -11.6650390625, -11.150390625, -10.6357421875, -10.12109375, -9.6064453125, -9.091796875, -8.5771484375, -8.0625, -7.5478515625, -7.033203125, -6.5185546875, -6.00390625, -5.4892578125, -4.974609375, -4.4599609375, -3.9453125, -3.4306640625, -2.916015625, -2.4013671875, -1.88671875, -1.3720703125, -0.857421875, -0.3427734375, 0.171875, 0.6865234375, 1.201171875, 1.7158203125, 2.23046875, 2.7451171875, 3.259765625, 3.7744140625, 4.2890625, 4.8037109375, 5.318359375, 5.8330078125, 6.34765625, 6.8623046875, 7.376953125, 7.8916015625, 8.40625, 8.9208984375, 9.435546875, 9.9501953125, 10.46484375, 10.9794921875, 11.494140625, 12.0087890625, 12.5234375, 13.0380859375, 13.552734375, 14.0673828125, 14.58203125, 15.0966796875, 15.611328125, 16.1259765625, 16.640625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 2.0, 1.0, 4.0, 8.0, 12.0, 13.0, 21.0, 20.0, 18.0, 21.0, 30.0, 25.0, 22.0, 48.0, 29.0, 56.0, 44.0, 50.0, 46.0, 47.0, 52.0, 40.0, 33.0, 43.0, 37.0, 40.0, 38.0, 33.0, 29.0, 27.0, 18.0, 12.0, 15.0, 13.0, 23.0, 8.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.658203125, -2.5657958984375, -2.473388671875, -2.3809814453125, -2.28857421875, -2.1961669921875, -2.103759765625, -2.0113525390625, -1.9189453125, -1.8265380859375, -1.734130859375, -1.6417236328125, -1.54931640625, -1.4569091796875, -1.364501953125, -1.2720947265625, -1.1796875, -1.0872802734375, -0.994873046875, -0.9024658203125, -0.81005859375, -0.7176513671875, -0.625244140625, -0.5328369140625, -0.4404296875, -0.3480224609375, -0.255615234375, -0.1632080078125, -0.07080078125, 0.0216064453125, 0.114013671875, 0.2064208984375, 0.298828125, 0.3912353515625, 0.483642578125, 0.5760498046875, 0.66845703125, 0.7608642578125, 0.853271484375, 0.9456787109375, 1.0380859375, 1.1304931640625, 1.222900390625, 1.3153076171875, 1.40771484375, 1.5001220703125, 1.592529296875, 1.6849365234375, 1.77734375, 1.8697509765625, 1.962158203125, 2.0545654296875, 2.14697265625, 2.2393798828125, 2.331787109375, 2.4241943359375, 2.5166015625, 2.6090087890625, 2.701416015625, 2.7938232421875, 2.88623046875, 2.9786376953125, 3.071044921875, 3.1634521484375, 3.255859375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 14.0, 18.0, 21.0, 28.0, 50.0, 59.0, 108.0, 192.0, 441.0, 1197.0, 3423.0, 13214.0, 68803.0, 738083.0, 3156358.0, 176343.0, 26605.0, 6129.0, 1821.0, 679.0, 281.0, 141.0, 61.0, 48.0, 28.0, 19.0, 22.0, 14.0, 14.0, 14.0, 5.0, 7.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.0625, -23.2919921875, -22.521484375, -21.7509765625, -20.98046875, -20.2099609375, -19.439453125, -18.6689453125, -17.8984375, -17.1279296875, -16.357421875, -15.5869140625, -14.81640625, -14.0458984375, -13.275390625, -12.5048828125, -11.734375, -10.9638671875, -10.193359375, -9.4228515625, -8.65234375, -7.8818359375, -7.111328125, -6.3408203125, -5.5703125, -4.7998046875, -4.029296875, -3.2587890625, -2.48828125, -1.7177734375, -0.947265625, -0.1767578125, 0.59375, 1.3642578125, 2.134765625, 2.9052734375, 3.67578125, 4.4462890625, 5.216796875, 5.9873046875, 6.7578125, 7.5283203125, 8.298828125, 9.0693359375, 9.83984375, 10.6103515625, 11.380859375, 12.1513671875, 12.921875, 13.6923828125, 14.462890625, 15.2333984375, 16.00390625, 16.7744140625, 17.544921875, 18.3154296875, 19.0859375, 19.8564453125, 20.626953125, 21.3974609375, 22.16796875, 22.9384765625, 23.708984375, 24.4794921875, 25.25]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 0.0, 8.0, 2.0, 8.0, 15.0, 15.0, 35.0, 31.0, 55.0, 70.0, 113.0, 190.0, 360.0, 759.0, 1230.0, 469.0, 245.0, 163.0, 91.0, 70.0, 51.0, 25.0, 21.0, 14.0, 12.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.765625, -10.50457763671875, -10.2435302734375, -9.98248291015625, -9.721435546875, -9.46038818359375, -9.1993408203125, -8.93829345703125, -8.67724609375, -8.41619873046875, -8.1551513671875, -7.89410400390625, -7.633056640625, -7.37200927734375, -7.1109619140625, -6.84991455078125, -6.5888671875, -6.32781982421875, -6.0667724609375, -5.80572509765625, -5.544677734375, -5.28363037109375, -5.0225830078125, -4.76153564453125, -4.50048828125, -4.23944091796875, -3.9783935546875, -3.71734619140625, -3.456298828125, -3.19525146484375, -2.9342041015625, -2.67315673828125, -2.412109375, -2.15106201171875, -1.8900146484375, -1.62896728515625, -1.367919921875, -1.10687255859375, -0.8458251953125, -0.58477783203125, -0.32373046875, -0.06268310546875, 0.1983642578125, 0.45941162109375, 0.720458984375, 0.98150634765625, 1.2425537109375, 1.50360107421875, 1.7646484375, 2.02569580078125, 2.2867431640625, 2.54779052734375, 2.808837890625, 3.06988525390625, 3.3309326171875, 3.59197998046875, 3.85302734375, 4.11407470703125, 4.3751220703125, 4.63616943359375, 4.897216796875, 5.15826416015625, 5.4193115234375, 5.68035888671875, 5.94140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 16.0, 48.0, 91.0, 169.0, 247.0, 217.0, 105.0, 54.0, 26.0, 10.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-160.65032958984375, -157.3536834716797, -154.05703735351562, -150.76040649414062, -147.46376037597656, -144.1671142578125, -140.87046813964844, -137.57382202148438, -134.2771759033203, -130.98052978515625, -127.68389129638672, -124.38724517822266, -121.0905990600586, -117.79396057128906, -114.497314453125, -111.20066833496094, -107.90403747558594, -104.60739135742188, -101.31075286865234, -98.01410675048828, -94.71746063232422, -91.42082214355469, -88.12417602539062, -84.82752990722656, -81.5308837890625, -78.23423767089844, -74.9375991821289, -71.64095306396484, -68.34430694580078, -65.04766845703125, -61.75102233886719, -58.45438003540039, -55.15774154663086, -51.86109924316406, -48.564453125, -45.2678108215332, -41.971168518066406, -38.674522399902344, -35.37788009643555, -32.08123779296875, -28.78459358215332, -25.48794937133789, -22.191307067871094, -18.894662857055664, -15.59801959991455, -12.301376342773438, -9.004732131958008, -5.708089828491211, -2.4114456176757812, 0.8851978778839111, 4.1818413734436035, 7.478485107421875, 10.775128364562988, 14.071771621704102, 17.36841583251953, 20.665058135986328, 23.961702346801758, 27.258346557617188, 30.554988861083984, 33.85163116455078, 37.148277282714844, 40.44491958618164, 43.74156188964844, 47.0382080078125, 50.3348503112793]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 7.0, 8.0, 7.0, 7.0, 17.0, 13.0, 11.0, 16.0, 19.0, 23.0, 20.0, 30.0, 31.0, 23.0, 37.0, 39.0, 32.0, 42.0, 41.0, 38.0, 50.0, 36.0, 40.0, 29.0, 38.0, 47.0, 52.0, 34.0, 23.0, 21.0, 27.0, 16.0, 24.0, 15.0, 9.0, 17.0, 8.0, 6.0, 7.0, 6.0, 7.0, 5.0, 2.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.069576263427734, -20.323698043823242, -19.57781982421875, -18.83194351196289, -18.0860652923584, -17.340187072753906, -16.594308853149414, -15.848430633544922, -15.102553367614746, -14.356675148010254, -13.610797882080078, -12.864919662475586, -12.119041442871094, -11.373164176940918, -10.627285957336426, -9.88140869140625, -9.135530471801758, -8.389652252197266, -7.64377498626709, -6.897896766662598, -6.152019023895264, -5.40614128112793, -4.6602630615234375, -3.9143853187561035, -3.1685075759887695, -2.4226298332214355, -1.6767518520355225, -0.9308738708496094, -0.1849961280822754, 0.5608816146850586, 1.3067598342895508, 2.0526375770568848, 2.7985172271728516, 3.5443949699401855, 4.2902727127075195, 5.036150932312012, 5.782028675079346, 6.52790641784668, 7.273784637451172, 8.019662857055664, 8.76554012298584, 9.511418342590332, 10.257295608520508, 11.003173828125, 11.749052047729492, 12.494929313659668, 13.24080753326416, 13.986684799194336, 14.732563018798828, 15.47844123840332, 16.224319458007812, 16.970195770263672, 17.716073989868164, 18.461952209472656, 19.20783042907715, 19.95370864868164, 20.6995849609375, 21.445463180541992, 22.191341400146484, 22.937217712402344, 23.683095932006836, 24.428974151611328, 25.17485237121582, 25.920730590820312, 26.666608810424805]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 7.0, 4.0, 12.0, 17.0, 29.0, 41.0, 76.0, 113.0, 173.0, 272.0, 464.0, 801.0, 1452.0, 2705.0, 5657.0, 11664.0, 25563.0, 59120.0, 163087.0, 469149.0, 188661.0, 65878.0, 27966.0, 12857.0, 6054.0, 3002.0, 1552.0, 861.0, 495.0, 293.0, 197.0, 126.0, 77.0, 55.0, 30.0, 17.0, 14.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-19.953125, -19.421875, -18.890625, -18.359375, -17.828125, -17.296875, -16.765625, -16.234375, -15.703125, -15.171875, -14.640625, -14.109375, -13.578125, -13.046875, -12.515625, -11.984375, -11.453125, -10.921875, -10.390625, -9.859375, -9.328125, -8.796875, -8.265625, -7.734375, -7.203125, -6.671875, -6.140625, -5.609375, -5.078125, -4.546875, -4.015625, -3.484375, -2.953125, -2.421875, -1.890625, -1.359375, -0.828125, -0.296875, 0.234375, 0.765625, 1.296875, 1.828125, 2.359375, 2.890625, 3.421875, 3.953125, 4.484375, 5.015625, 5.546875, 6.078125, 6.609375, 7.140625, 7.671875, 8.203125, 8.734375, 9.265625, 9.796875, 10.328125, 10.859375, 11.390625, 11.921875, 12.453125, 12.984375, 13.515625, 14.046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 9.0, 7.0, 17.0, 10.0, 9.0, 20.0, 29.0, 16.0, 28.0, 27.0, 37.0, 28.0, 24.0, 41.0, 55.0, 40.0, 62.0, 41.0, 50.0, 39.0, 41.0, 34.0, 42.0, 46.0, 32.0, 42.0, 32.0, 24.0, 20.0, 28.0, 10.0, 16.0, 14.0, 10.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.30645751953125, -2.2144775390625, -2.12249755859375, -2.030517578125, -1.93853759765625, -1.8465576171875, -1.75457763671875, -1.66259765625, -1.57061767578125, -1.4786376953125, -1.38665771484375, -1.294677734375, -1.20269775390625, -1.1107177734375, -1.01873779296875, -0.9267578125, -0.83477783203125, -0.7427978515625, -0.65081787109375, -0.558837890625, -0.46685791015625, -0.3748779296875, -0.28289794921875, -0.19091796875, -0.09893798828125, -0.0069580078125, 0.08502197265625, 0.177001953125, 0.26898193359375, 0.3609619140625, 0.45294189453125, 0.544921875, 0.63690185546875, 0.7288818359375, 0.82086181640625, 0.912841796875, 1.00482177734375, 1.0968017578125, 1.18878173828125, 1.28076171875, 1.37274169921875, 1.4647216796875, 1.55670166015625, 1.648681640625, 1.74066162109375, 1.8326416015625, 1.92462158203125, 2.0166015625, 2.10858154296875, 2.2005615234375, 2.29254150390625, 2.384521484375, 2.47650146484375, 2.5684814453125, 2.66046142578125, 2.75244140625, 2.84442138671875, 2.9364013671875, 3.02838134765625, 3.120361328125, 3.21234130859375, 3.3043212890625, 3.39630126953125, 3.48828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 16.0, 17.0, 17.0, 22.0, 26.0, 49.0, 59.0, 73.0, 105.0, 125.0, 171.0, 249.0, 335.0, 494.0, 901.0, 1883.0, 5178.0, 15915.0, 53877.0, 194358.0, 545818.0, 161293.0, 45258.0, 13606.0, 4430.0, 1750.0, 863.0, 445.0, 321.0, 237.0, 166.0, 126.0, 90.0, 76.0, 52.0, 39.0, 29.0, 14.0, 17.0, 13.0, 12.0, 9.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.46875, -15.94482421875, -15.4208984375, -14.89697265625, -14.373046875, -13.84912109375, -13.3251953125, -12.80126953125, -12.27734375, -11.75341796875, -11.2294921875, -10.70556640625, -10.181640625, -9.65771484375, -9.1337890625, -8.60986328125, -8.0859375, -7.56201171875, -7.0380859375, -6.51416015625, -5.990234375, -5.46630859375, -4.9423828125, -4.41845703125, -3.89453125, -3.37060546875, -2.8466796875, -2.32275390625, -1.798828125, -1.27490234375, -0.7509765625, -0.22705078125, 0.296875, 0.82080078125, 1.3447265625, 1.86865234375, 2.392578125, 2.91650390625, 3.4404296875, 3.96435546875, 4.48828125, 5.01220703125, 5.5361328125, 6.06005859375, 6.583984375, 7.10791015625, 7.6318359375, 8.15576171875, 8.6796875, 9.20361328125, 9.7275390625, 10.25146484375, 10.775390625, 11.29931640625, 11.8232421875, 12.34716796875, 12.87109375, 13.39501953125, 13.9189453125, 14.44287109375, 14.966796875, 15.49072265625, 16.0146484375, 16.53857421875, 17.0625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 6.0, 5.0, 14.0, 12.0, 27.0, 12.0, 12.0, 21.0, 22.0, 33.0, 26.0, 34.0, 31.0, 31.0, 38.0, 42.0, 52.0, 42.0, 44.0, 47.0, 28.0, 42.0, 39.0, 34.0, 41.0, 36.0, 32.0, 27.0, 36.0, 17.0, 18.0, 23.0, 16.0, 14.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 7.0, 0.0, 4.0, 3.0, 1.0, 2.0], "bins": [-13.171875, -12.8050537109375, -12.438232421875, -12.0714111328125, -11.70458984375, -11.3377685546875, -10.970947265625, -10.6041259765625, -10.2373046875, -9.8704833984375, -9.503662109375, -9.1368408203125, -8.77001953125, -8.4031982421875, -8.036376953125, -7.6695556640625, -7.302734375, -6.9359130859375, -6.569091796875, -6.2022705078125, -5.83544921875, -5.4686279296875, -5.101806640625, -4.7349853515625, -4.3681640625, -4.0013427734375, -3.634521484375, -3.2677001953125, -2.90087890625, -2.5340576171875, -2.167236328125, -1.8004150390625, -1.43359375, -1.0667724609375, -0.699951171875, -0.3331298828125, 0.03369140625, 0.4005126953125, 0.767333984375, 1.1341552734375, 1.5009765625, 1.8677978515625, 2.234619140625, 2.6014404296875, 2.96826171875, 3.3350830078125, 3.701904296875, 4.0687255859375, 4.435546875, 4.8023681640625, 5.169189453125, 5.5360107421875, 5.90283203125, 6.2696533203125, 6.636474609375, 7.0032958984375, 7.3701171875, 7.7369384765625, 8.103759765625, 8.4705810546875, 8.83740234375, 9.2042236328125, 9.571044921875, 9.9378662109375, 10.3046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 8.0, 2.0, 7.0, 14.0, 23.0, 24.0, 60.0, 82.0, 152.0, 227.0, 411.0, 869.0, 2541.0, 10480.0, 59559.0, 538587.0, 378649.0, 44848.0, 8155.0, 2113.0, 802.0, 377.0, 214.0, 109.0, 89.0, 47.0, 27.0, 22.0, 10.0, 15.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.6640625, -13.2490234375, -12.833984375, -12.4189453125, -12.00390625, -11.5888671875, -11.173828125, -10.7587890625, -10.34375, -9.9287109375, -9.513671875, -9.0986328125, -8.68359375, -8.2685546875, -7.853515625, -7.4384765625, -7.0234375, -6.6083984375, -6.193359375, -5.7783203125, -5.36328125, -4.9482421875, -4.533203125, -4.1181640625, -3.703125, -3.2880859375, -2.873046875, -2.4580078125, -2.04296875, -1.6279296875, -1.212890625, -0.7978515625, -0.3828125, 0.0322265625, 0.447265625, 0.8623046875, 1.27734375, 1.6923828125, 2.107421875, 2.5224609375, 2.9375, 3.3525390625, 3.767578125, 4.1826171875, 4.59765625, 5.0126953125, 5.427734375, 5.8427734375, 6.2578125, 6.6728515625, 7.087890625, 7.5029296875, 7.91796875, 8.3330078125, 8.748046875, 9.1630859375, 9.578125, 9.9931640625, 10.408203125, 10.8232421875, 11.23828125, 11.6533203125, 12.068359375, 12.4833984375, 12.8984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 11.0, 10.0, 13.0, 9.0, 18.0, 18.0, 22.0, 29.0, 39.0, 96.0, 195.0, 223.0, 98.0, 33.0, 40.0, 23.0, 27.0, 21.0, 11.0, 7.0, 5.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001407623291015625, -0.0013535618782043457, -0.0012995004653930664, -0.0012454390525817871, -0.0011913776397705078, -0.0011373162269592285, -0.0010832548141479492, -0.00102919340133667, -0.0009751319885253906, -0.0009210705757141113, -0.000867009162902832, -0.0008129477500915527, -0.0007588863372802734, -0.0007048249244689941, -0.0006507635116577148, -0.0005967020988464355, -0.0005426406860351562, -0.000488579273223877, -0.00043451786041259766, -0.00038045644760131836, -0.00032639503479003906, -0.00027233362197875977, -0.00021827220916748047, -0.00016421079635620117, -0.00011014938354492188, -5.608797073364258e-05, -2.0265579223632812e-06, 5.2034854888916016e-05, 0.00010609626770019531, 0.0001601576805114746, 0.0002142190933227539, 0.0002682805061340332, 0.0003223419189453125, 0.0003764033317565918, 0.0004304647445678711, 0.0004845261573791504, 0.0005385875701904297, 0.000592648983001709, 0.0006467103958129883, 0.0007007718086242676, 0.0007548332214355469, 0.0008088946342468262, 0.0008629560470581055, 0.0009170174598693848, 0.0009710788726806641, 0.0010251402854919434, 0.0010792016983032227, 0.001133263111114502, 0.0011873245239257812, 0.0012413859367370605, 0.0012954473495483398, 0.0013495087623596191, 0.0014035701751708984, 0.0014576315879821777, 0.001511693000793457, 0.0015657544136047363, 0.0016198158264160156, 0.001673877239227295, 0.0017279386520385742, 0.0017820000648498535, 0.0018360614776611328, 0.0018901228904724121, 0.0019441843032836914, 0.0019982457160949707, 0.00205230712890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 11.0, 11.0, 13.0, 25.0, 38.0, 68.0, 106.0, 181.0, 370.0, 805.0, 2653.0, 20759.0, 635327.0, 370033.0, 14534.0, 2191.0, 685.0, 351.0, 178.0, 74.0, 60.0, 31.0, 20.0, 15.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.953125, -17.170166015625, -16.38720703125, -15.604248046875, -14.8212890625, -14.038330078125, -13.25537109375, -12.472412109375, -11.689453125, -10.906494140625, -10.12353515625, -9.340576171875, -8.5576171875, -7.774658203125, -6.99169921875, -6.208740234375, -5.42578125, -4.642822265625, -3.85986328125, -3.076904296875, -2.2939453125, -1.510986328125, -0.72802734375, 0.054931640625, 0.837890625, 1.620849609375, 2.40380859375, 3.186767578125, 3.9697265625, 4.752685546875, 5.53564453125, 6.318603515625, 7.1015625, 7.884521484375, 8.66748046875, 9.450439453125, 10.2333984375, 11.016357421875, 11.79931640625, 12.582275390625, 13.365234375, 14.148193359375, 14.93115234375, 15.714111328125, 16.4970703125, 17.280029296875, 18.06298828125, 18.845947265625, 19.62890625, 20.411865234375, 21.19482421875, 21.977783203125, 22.7607421875, 23.543701171875, 24.32666015625, 25.109619140625, 25.892578125, 26.675537109375, 27.45849609375, 28.241455078125, 29.0244140625, 29.807373046875, 30.59033203125, 31.373291015625, 32.15625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 6.0, 4.0, 11.0, 9.0, 16.0, 17.0, 24.0, 29.0, 34.0, 50.0, 62.0, 84.0, 109.0, 105.0, 89.0, 61.0, 65.0, 39.0, 33.0, 26.0, 23.0, 15.0, 14.0, 22.0, 9.0, 5.0, 6.0, 2.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.5625, -7.33514404296875, -7.1077880859375, -6.88043212890625, -6.653076171875, -6.42572021484375, -6.1983642578125, -5.97100830078125, -5.74365234375, -5.51629638671875, -5.2889404296875, -5.06158447265625, -4.834228515625, -4.60687255859375, -4.3795166015625, -4.15216064453125, -3.9248046875, -3.69744873046875, -3.4700927734375, -3.24273681640625, -3.015380859375, -2.78802490234375, -2.5606689453125, -2.33331298828125, -2.10595703125, -1.87860107421875, -1.6512451171875, -1.42388916015625, -1.196533203125, -0.96917724609375, -0.7418212890625, -0.51446533203125, -0.287109375, -0.05975341796875, 0.1676025390625, 0.39495849609375, 0.622314453125, 0.84967041015625, 1.0770263671875, 1.30438232421875, 1.53173828125, 1.75909423828125, 1.9864501953125, 2.21380615234375, 2.441162109375, 2.66851806640625, 2.8958740234375, 3.12322998046875, 3.3505859375, 3.57794189453125, 3.8052978515625, 4.03265380859375, 4.260009765625, 4.48736572265625, 4.7147216796875, 4.94207763671875, 5.16943359375, 5.39678955078125, 5.6241455078125, 5.85150146484375, 6.078857421875, 6.30621337890625, 6.5335693359375, 6.76092529296875, 6.98828125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 21.0, 49.0, 99.0, 147.0, 210.0, 186.0, 143.0, 63.0, 34.0, 23.0, 7.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.17317199707031, -59.779273986816406, -54.3853759765625, -48.99147415161133, -43.59757614135742, -38.203678131103516, -32.809776306152344, -27.415878295898438, -22.02198028564453, -16.628082275390625, -11.234182357788086, -5.840282440185547, -0.4463844299316406, 4.947513580322266, 10.341415405273438, 15.735313415527344, 21.12921142578125, 26.523109436035156, 31.917009353637695, 37.310909271240234, 42.70480728149414, 48.09870529174805, 53.49260711669922, 58.886505126953125, 64.28040313720703, 69.67430114746094, 75.06819915771484, 80.46209716796875, 85.85600280761719, 91.24989318847656, 96.643798828125, 102.0376968383789, 107.43157958984375, 112.82547760009766, 118.21937561035156, 123.61328125, 129.00717163085938, 134.4010772705078, 139.79498291015625, 145.18887329101562, 150.582763671875, 155.97666931152344, 161.3705596923828, 166.76446533203125, 172.15835571289062, 177.55226135253906, 182.9461669921875, 188.34005737304688, 193.7339630126953, 199.12786865234375, 204.52175903320312, 209.91566467285156, 215.30955505371094, 220.70346069335938, 226.09735107421875, 231.4912567138672, 236.88516235351562, 242.27906799316406, 247.67295837402344, 253.06686401367188, 258.46075439453125, 263.8546447753906, 269.2485656738281, 274.6424560546875, 280.0363464355469]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 9.0, 14.0, 8.0, 12.0, 14.0, 11.0, 14.0, 16.0, 16.0, 26.0, 27.0, 23.0, 31.0, 39.0, 35.0, 44.0, 38.0, 22.0, 60.0, 41.0, 41.0, 44.0, 46.0, 38.0, 38.0, 37.0, 28.0, 37.0, 28.0, 35.0, 24.0, 25.0, 13.0, 8.0, 11.0, 14.0, 7.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.59772491455078, -58.66156005859375, -56.72539520263672, -54.78923034667969, -52.853065490722656, -50.916900634765625, -48.98073959350586, -47.04457473754883, -45.1084098815918, -43.172245025634766, -41.236080169677734, -39.2999153137207, -37.36375427246094, -35.427589416503906, -33.491424560546875, -31.555259704589844, -29.619094848632812, -27.68292999267578, -25.74676513671875, -23.81060218811035, -21.87443733215332, -19.93827247619629, -18.00210952758789, -16.06594467163086, -14.129779815673828, -12.193614959716797, -10.257451057434082, -8.321287155151367, -6.385122299194336, -4.448957443237305, -2.51279354095459, -0.576629638671875, 1.3595314025878906, 3.2956957817077637, 5.231860160827637, 7.16802453994751, 9.104188919067383, 11.040353775024414, 12.976517677307129, 14.912681579589844, 16.848846435546875, 18.785011291503906, 20.721176147460938, 22.657339096069336, 24.593503952026367, 26.5296688079834, 28.465831756591797, 30.401996612548828, 32.33816146850586, 34.27432632446289, 36.21049118041992, 38.14665603637695, 40.08281707763672, 42.01898193359375, 43.95514678955078, 45.89131164550781, 47.827476501464844, 49.763641357421875, 51.699806213378906, 53.63597106933594, 55.57213592529297, 57.50830078125, 59.444461822509766, 61.3806266784668, 63.31679153442383]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 2.0, 7.0, 8.0, 21.0, 16.0, 22.0, 34.0, 38.0, 83.0, 114.0, 224.0, 450.0, 1096.0, 3001.0, 9471.0, 40717.0, 536180.0, 3496137.0, 83700.0, 15684.0, 4394.0, 1508.0, 662.0, 281.0, 167.0, 86.0, 54.0, 39.0, 21.0, 21.0, 7.0, 9.0, 4.0, 3.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.59375, -35.33984375, -34.0859375, -32.83203125, -31.578125, -30.32421875, -29.0703125, -27.81640625, -26.5625, -25.30859375, -24.0546875, -22.80078125, -21.546875, -20.29296875, -19.0390625, -17.78515625, -16.53125, -15.27734375, -14.0234375, -12.76953125, -11.515625, -10.26171875, -9.0078125, -7.75390625, -6.5, -5.24609375, -3.9921875, -2.73828125, -1.484375, -0.23046875, 1.0234375, 2.27734375, 3.53125, 4.78515625, 6.0390625, 7.29296875, 8.546875, 9.80078125, 11.0546875, 12.30859375, 13.5625, 14.81640625, 16.0703125, 17.32421875, 18.578125, 19.83203125, 21.0859375, 22.33984375, 23.59375, 24.84765625, 26.1015625, 27.35546875, 28.609375, 29.86328125, 31.1171875, 32.37109375, 33.625, 34.87890625, 36.1328125, 37.38671875, 38.640625, 39.89453125, 41.1484375, 42.40234375, 43.65625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 5.0, 13.0, 13.0, 14.0, 17.0, 19.0, 18.0, 31.0, 29.0, 33.0, 34.0, 40.0, 33.0, 49.0, 58.0, 57.0, 49.0, 39.0, 38.0, 40.0, 51.0, 43.0, 31.0, 37.0, 44.0, 20.0, 20.0, 21.0, 22.0, 16.0, 11.0, 14.0, 7.0, 8.0, 2.0, 6.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.921875, -2.82684326171875, -2.7318115234375, -2.63677978515625, -2.541748046875, -2.44671630859375, -2.3516845703125, -2.25665283203125, -2.16162109375, -2.06658935546875, -1.9715576171875, -1.87652587890625, -1.781494140625, -1.68646240234375, -1.5914306640625, -1.49639892578125, -1.4013671875, -1.30633544921875, -1.2113037109375, -1.11627197265625, -1.021240234375, -0.92620849609375, -0.8311767578125, -0.73614501953125, -0.64111328125, -0.54608154296875, -0.4510498046875, -0.35601806640625, -0.260986328125, -0.16595458984375, -0.0709228515625, 0.02410888671875, 0.119140625, 0.21417236328125, 0.3092041015625, 0.40423583984375, 0.499267578125, 0.59429931640625, 0.6893310546875, 0.78436279296875, 0.87939453125, 0.97442626953125, 1.0694580078125, 1.16448974609375, 1.259521484375, 1.35455322265625, 1.4495849609375, 1.54461669921875, 1.6396484375, 1.73468017578125, 1.8297119140625, 1.92474365234375, 2.019775390625, 2.11480712890625, 2.2098388671875, 2.30487060546875, 2.39990234375, 2.49493408203125, 2.5899658203125, 2.68499755859375, 2.780029296875, 2.87506103515625, 2.9700927734375, 3.06512451171875, 3.16015625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 9.0, 8.0, 20.0, 18.0, 22.0, 28.0, 30.0, 44.0, 44.0, 59.0, 71.0, 126.0, 164.0, 262.0, 557.0, 1348.0, 5035.0, 28460.0, 387352.0, 3639693.0, 112501.0, 13299.0, 2862.0, 934.0, 427.0, 238.0, 118.0, 103.0, 80.0, 81.0, 47.0, 38.0, 31.0, 37.0, 27.0, 22.0, 15.0, 11.0, 16.0, 7.0, 6.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.1875, -31.05029296875, -29.9130859375, -28.77587890625, -27.638671875, -26.50146484375, -25.3642578125, -24.22705078125, -23.08984375, -21.95263671875, -20.8154296875, -19.67822265625, -18.541015625, -17.40380859375, -16.2666015625, -15.12939453125, -13.9921875, -12.85498046875, -11.7177734375, -10.58056640625, -9.443359375, -8.30615234375, -7.1689453125, -6.03173828125, -4.89453125, -3.75732421875, -2.6201171875, -1.48291015625, -0.345703125, 0.79150390625, 1.9287109375, 3.06591796875, 4.203125, 5.34033203125, 6.4775390625, 7.61474609375, 8.751953125, 9.88916015625, 11.0263671875, 12.16357421875, 13.30078125, 14.43798828125, 15.5751953125, 16.71240234375, 17.849609375, 18.98681640625, 20.1240234375, 21.26123046875, 22.3984375, 23.53564453125, 24.6728515625, 25.81005859375, 26.947265625, 28.08447265625, 29.2216796875, 30.35888671875, 31.49609375, 32.63330078125, 33.7705078125, 34.90771484375, 36.044921875, 37.18212890625, 38.3193359375, 39.45654296875, 40.59375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 8.0, 24.0, 19.0, 60.0, 92.0, 212.0, 520.0, 1956.0, 696.0, 250.0, 102.0, 58.0, 33.0, 11.0, 13.0, 9.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0625, -6.637939453125, -6.21337890625, -5.788818359375, -5.3642578125, -4.939697265625, -4.51513671875, -4.090576171875, -3.666015625, -3.241455078125, -2.81689453125, -2.392333984375, -1.9677734375, -1.543212890625, -1.11865234375, -0.694091796875, -0.26953125, 0.155029296875, 0.57958984375, 1.004150390625, 1.4287109375, 1.853271484375, 2.27783203125, 2.702392578125, 3.126953125, 3.551513671875, 3.97607421875, 4.400634765625, 4.8251953125, 5.249755859375, 5.67431640625, 6.098876953125, 6.5234375, 6.947998046875, 7.37255859375, 7.797119140625, 8.2216796875, 8.646240234375, 9.07080078125, 9.495361328125, 9.919921875, 10.344482421875, 10.76904296875, 11.193603515625, 11.6181640625, 12.042724609375, 12.46728515625, 12.891845703125, 13.31640625, 13.740966796875, 14.16552734375, 14.590087890625, 15.0146484375, 15.439208984375, 15.86376953125, 16.288330078125, 16.712890625, 17.137451171875, 17.56201171875, 17.986572265625, 18.4111328125, 18.835693359375, 19.26025390625, 19.684814453125, 20.109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 15.0, 40.0, 71.0, 177.0, 221.0, 189.0, 145.0, 87.0, 27.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.99659729003906, -132.76165771484375, -129.52670288085938, -126.29175567626953, -123.05680847167969, -119.82186126708984, -116.5869140625, -113.35196685791016, -110.11701965332031, -106.88207244873047, -103.64712524414062, -100.41217803955078, -97.17723083496094, -93.9422836303711, -90.70733642578125, -87.4723892211914, -84.23744201660156, -81.00249481201172, -77.76754760742188, -74.53260040283203, -71.29765319824219, -68.06270599365234, -64.8277587890625, -61.592811584472656, -58.35786437988281, -55.12291717529297, -51.887969970703125, -48.65302276611328, -45.41807556152344, -42.183128356933594, -38.94818115234375, -35.713233947753906, -32.47828674316406, -29.24333953857422, -26.008392333984375, -22.77344512939453, -19.538497924804688, -16.303550720214844, -13.068603515625, -9.833656311035156, -6.5987091064453125, -3.3637619018554688, -0.128814697265625, 3.1061325073242188, 6.3410797119140625, 9.576026916503906, 12.81097412109375, 16.045921325683594, 19.280868530273438, 22.51581573486328, 25.750762939453125, 28.98571014404297, 32.22065734863281, 35.455604553222656, 38.6905517578125, 41.925498962402344, 45.16044616699219, 48.39539337158203, 51.630340576171875, 54.86528778076172, 58.10023498535156, 61.335182189941406, 64.57012939453125, 67.8050765991211, 71.04002380371094]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 6.0, 9.0, 5.0, 4.0, 8.0, 16.0, 15.0, 17.0, 22.0, 30.0, 34.0, 29.0, 40.0, 49.0, 45.0, 49.0, 61.0, 54.0, 42.0, 51.0, 36.0, 43.0, 48.0, 45.0, 44.0, 31.0, 31.0, 16.0, 24.0, 18.0, 13.0, 11.0, 11.0, 12.0, 7.0, 5.0, 3.0, 6.0, 4.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-36.22332000732422, -35.2440071105957, -34.26469421386719, -33.28538131713867, -32.306068420410156, -31.32675552368164, -30.347442626953125, -29.36812973022461, -28.388816833496094, -27.409503936767578, -26.430191040039062, -25.450878143310547, -24.47156524658203, -23.492252349853516, -22.512939453125, -21.533626556396484, -20.5543155670166, -19.575002670288086, -18.59568977355957, -17.616376876831055, -16.63706398010254, -15.657751083374023, -14.678439140319824, -13.699126243591309, -12.719813346862793, -11.740500450134277, -10.761187553405762, -9.781875610351562, -8.802562713623047, -7.823249340057373, -6.843936920166016, -5.8646240234375, -4.885311126708984, -3.9059982299804688, -2.9266855716705322, -1.9473729133605957, -0.9680600166320801, 0.011252880096435547, 0.990565299987793, 1.9698781967163086, 2.949191093444824, 3.92850399017334, 4.9078168869018555, 5.887129306793213, 6.8664422035217285, 7.845755100250244, 8.825067520141602, 9.804380416870117, 10.783693313598633, 11.763006210327148, 12.742319107055664, 13.72163200378418, 14.700944900512695, 15.680257797241211, 16.659568786621094, 17.63888168334961, 18.618194580078125, 19.59750747680664, 20.576820373535156, 21.556133270263672, 22.535446166992188, 23.514759063720703, 24.49407196044922, 25.473384857177734, 26.45269775390625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 9.0, 13.0, 20.0, 30.0, 45.0, 46.0, 65.0, 128.0, 160.0, 260.0, 404.0, 806.0, 1502.0, 3110.0, 7103.0, 16944.0, 42840.0, 123992.0, 509438.0, 231819.0, 65666.0, 24904.0, 10255.0, 4374.0, 2079.0, 1015.0, 568.0, 336.0, 215.0, 146.0, 81.0, 54.0, 40.0, 19.0, 18.0, 15.0, 13.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.777099609375, -15.16357421875, -14.550048828125, -13.9365234375, -13.322998046875, -12.70947265625, -12.095947265625, -11.482421875, -10.868896484375, -10.25537109375, -9.641845703125, -9.0283203125, -8.414794921875, -7.80126953125, -7.187744140625, -6.57421875, -5.960693359375, -5.34716796875, -4.733642578125, -4.1201171875, -3.506591796875, -2.89306640625, -2.279541015625, -1.666015625, -1.052490234375, -0.43896484375, 0.174560546875, 0.7880859375, 1.401611328125, 2.01513671875, 2.628662109375, 3.2421875, 3.855712890625, 4.46923828125, 5.082763671875, 5.6962890625, 6.309814453125, 6.92333984375, 7.536865234375, 8.150390625, 8.763916015625, 9.37744140625, 9.990966796875, 10.6044921875, 11.218017578125, 11.83154296875, 12.445068359375, 13.05859375, 13.672119140625, 14.28564453125, 14.899169921875, 15.5126953125, 16.126220703125, 16.73974609375, 17.353271484375, 17.966796875, 18.580322265625, 19.19384765625, 19.807373046875, 20.4208984375, 21.034423828125, 21.64794921875, 22.261474609375, 22.875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 4.0, 18.0, 20.0, 9.0, 16.0, 33.0, 28.0, 22.0, 21.0, 38.0, 30.0, 40.0, 44.0, 43.0, 46.0, 54.0, 44.0, 49.0, 49.0, 42.0, 49.0, 37.0, 39.0, 40.0, 30.0, 31.0, 18.0, 17.0, 24.0, 15.0, 8.0, 6.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.9296875, -2.8299560546875, -2.730224609375, -2.6304931640625, -2.53076171875, -2.4310302734375, -2.331298828125, -2.2315673828125, -2.1318359375, -2.0321044921875, -1.932373046875, -1.8326416015625, -1.73291015625, -1.6331787109375, -1.533447265625, -1.4337158203125, -1.333984375, -1.2342529296875, -1.134521484375, -1.0347900390625, -0.93505859375, -0.8353271484375, -0.735595703125, -0.6358642578125, -0.5361328125, -0.4364013671875, -0.336669921875, -0.2369384765625, -0.13720703125, -0.0374755859375, 0.062255859375, 0.1619873046875, 0.26171875, 0.3614501953125, 0.461181640625, 0.5609130859375, 0.66064453125, 0.7603759765625, 0.860107421875, 0.9598388671875, 1.0595703125, 1.1593017578125, 1.259033203125, 1.3587646484375, 1.45849609375, 1.5582275390625, 1.657958984375, 1.7576904296875, 1.857421875, 1.9571533203125, 2.056884765625, 2.1566162109375, 2.25634765625, 2.3560791015625, 2.455810546875, 2.5555419921875, 2.6552734375, 2.7550048828125, 2.854736328125, 2.9544677734375, 3.05419921875, 3.1539306640625, 3.253662109375, 3.3533935546875, 3.453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 10.0, 13.0, 13.0, 15.0, 25.0, 24.0, 25.0, 47.0, 83.0, 121.0, 195.0, 356.0, 643.0, 1302.0, 2881.0, 7113.0, 17785.0, 46996.0, 143077.0, 499383.0, 222601.0, 64866.0, 24185.0, 9365.0, 3835.0, 1671.0, 792.0, 395.0, 237.0, 150.0, 100.0, 60.0, 54.0, 33.0, 33.0, 15.0, 16.0, 13.0, 3.0, 4.0, 5.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.734375, -14.296630859375, -13.85888671875, -13.421142578125, -12.9833984375, -12.545654296875, -12.10791015625, -11.670166015625, -11.232421875, -10.794677734375, -10.35693359375, -9.919189453125, -9.4814453125, -9.043701171875, -8.60595703125, -8.168212890625, -7.73046875, -7.292724609375, -6.85498046875, -6.417236328125, -5.9794921875, -5.541748046875, -5.10400390625, -4.666259765625, -4.228515625, -3.790771484375, -3.35302734375, -2.915283203125, -2.4775390625, -2.039794921875, -1.60205078125, -1.164306640625, -0.7265625, -0.288818359375, 0.14892578125, 0.586669921875, 1.0244140625, 1.462158203125, 1.89990234375, 2.337646484375, 2.775390625, 3.213134765625, 3.65087890625, 4.088623046875, 4.5263671875, 4.964111328125, 5.40185546875, 5.839599609375, 6.27734375, 6.715087890625, 7.15283203125, 7.590576171875, 8.0283203125, 8.466064453125, 8.90380859375, 9.341552734375, 9.779296875, 10.217041015625, 10.65478515625, 11.092529296875, 11.5302734375, 11.968017578125, 12.40576171875, 12.843505859375, 13.28125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 8.0, 12.0, 8.0, 9.0, 10.0, 11.0, 12.0, 11.0, 22.0, 28.0, 44.0, 24.0, 44.0, 37.0, 46.0, 38.0, 41.0, 50.0, 57.0, 36.0, 44.0, 35.0, 48.0, 39.0, 41.0, 31.0, 35.0, 30.0, 27.0, 17.0, 22.0, 23.0, 15.0, 16.0, 8.0, 4.0, 7.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.8682861328125, -12.455322265625, -12.0423583984375, -11.62939453125, -11.2164306640625, -10.803466796875, -10.3905029296875, -9.9775390625, -9.5645751953125, -9.151611328125, -8.7386474609375, -8.32568359375, -7.9127197265625, -7.499755859375, -7.0867919921875, -6.673828125, -6.2608642578125, -5.847900390625, -5.4349365234375, -5.02197265625, -4.6090087890625, -4.196044921875, -3.7830810546875, -3.3701171875, -2.9571533203125, -2.544189453125, -2.1312255859375, -1.71826171875, -1.3052978515625, -0.892333984375, -0.4793701171875, -0.06640625, 0.3465576171875, 0.759521484375, 1.1724853515625, 1.58544921875, 1.9984130859375, 2.411376953125, 2.8243408203125, 3.2373046875, 3.6502685546875, 4.063232421875, 4.4761962890625, 4.88916015625, 5.3021240234375, 5.715087890625, 6.1280517578125, 6.541015625, 6.9539794921875, 7.366943359375, 7.7799072265625, 8.19287109375, 8.6058349609375, 9.018798828125, 9.4317626953125, 9.8447265625, 10.2576904296875, 10.670654296875, 11.0836181640625, 11.49658203125, 11.9095458984375, 12.322509765625, 12.7354736328125, 13.1484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 10.0, 12.0, 30.0, 38.0, 63.0, 85.0, 145.0, 367.0, 869.0, 3126.0, 14965.0, 214076.0, 765664.0, 40579.0, 5883.0, 1553.0, 573.0, 231.0, 110.0, 62.0, 42.0, 30.0, 15.0, 11.0, 9.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.89013671875, -15.3271484375, -14.76416015625, -14.201171875, -13.63818359375, -13.0751953125, -12.51220703125, -11.94921875, -11.38623046875, -10.8232421875, -10.26025390625, -9.697265625, -9.13427734375, -8.5712890625, -8.00830078125, -7.4453125, -6.88232421875, -6.3193359375, -5.75634765625, -5.193359375, -4.63037109375, -4.0673828125, -3.50439453125, -2.94140625, -2.37841796875, -1.8154296875, -1.25244140625, -0.689453125, -0.12646484375, 0.4365234375, 0.99951171875, 1.5625, 2.12548828125, 2.6884765625, 3.25146484375, 3.814453125, 4.37744140625, 4.9404296875, 5.50341796875, 6.06640625, 6.62939453125, 7.1923828125, 7.75537109375, 8.318359375, 8.88134765625, 9.4443359375, 10.00732421875, 10.5703125, 11.13330078125, 11.6962890625, 12.25927734375, 12.822265625, 13.38525390625, 13.9482421875, 14.51123046875, 15.07421875, 15.63720703125, 16.2001953125, 16.76318359375, 17.326171875, 17.88916015625, 18.4521484375, 19.01513671875, 19.578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 9.0, 3.0, 5.0, 5.0, 6.0, 11.0, 9.0, 10.0, 25.0, 28.0, 28.0, 54.0, 103.0, 170.0, 204.0, 118.0, 66.0, 29.0, 20.0, 17.0, 17.0, 9.0, 11.0, 10.0, 7.0, 10.0, 1.0, 4.0, 0.0, 2.0, 0.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.001369476318359375, -0.001326829195022583, -0.001284182071685791, -0.001241534948348999, -0.001198887825012207, -0.001156240701675415, -0.001113593578338623, -0.001070946455001831, -0.001028299331665039, -0.000985652208328247, -0.0009430050849914551, -0.0009003579616546631, -0.0008577108383178711, -0.0008150637149810791, -0.0007724165916442871, -0.0007297694683074951, -0.0006871223449707031, -0.0006444752216339111, -0.0006018280982971191, -0.0005591809749603271, -0.0005165338516235352, -0.00047388672828674316, -0.00043123960494995117, -0.0003885924816131592, -0.0003459453582763672, -0.0003032982349395752, -0.0002606511116027832, -0.0002180039882659912, -0.00017535686492919922, -0.00013270974159240723, -9.006261825561523e-05, -4.741549491882324e-05, -4.76837158203125e-06, 3.787875175476074e-05, 8.052587509155273e-05, 0.00012317299842834473, 0.00016582012176513672, 0.0002084672451019287, 0.0002511143684387207, 0.0002937614917755127, 0.0003364086151123047, 0.0003790557384490967, 0.00042170286178588867, 0.00046434998512268066, 0.0005069971084594727, 0.0005496442317962646, 0.0005922913551330566, 0.0006349384784698486, 0.0006775856018066406, 0.0007202327251434326, 0.0007628798484802246, 0.0008055269718170166, 0.0008481740951538086, 0.0008908212184906006, 0.0009334683418273926, 0.0009761154651641846, 0.0010187625885009766, 0.0010614097118377686, 0.0011040568351745605, 0.0011467039585113525, 0.0011893510818481445, 0.0012319982051849365, 0.0012746453285217285, 0.0013172924518585205, 0.0013599395751953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 13.0, 7.0, 6.0, 15.0, 24.0, 30.0, 34.0, 59.0, 75.0, 125.0, 189.0, 299.0, 531.0, 781.0, 1374.0, 2482.0, 4879.0, 10943.0, 32042.0, 162570.0, 629396.0, 150680.0, 30768.0, 10625.0, 4721.0, 2405.0, 1309.0, 796.0, 499.0, 281.0, 201.0, 117.0, 89.0, 51.0, 40.0, 18.0, 17.0, 14.0, 14.0, 9.0, 12.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.78125, -9.449462890625, -9.11767578125, -8.785888671875, -8.4541015625, -8.122314453125, -7.79052734375, -7.458740234375, -7.126953125, -6.795166015625, -6.46337890625, -6.131591796875, -5.7998046875, -5.468017578125, -5.13623046875, -4.804443359375, -4.47265625, -4.140869140625, -3.80908203125, -3.477294921875, -3.1455078125, -2.813720703125, -2.48193359375, -2.150146484375, -1.818359375, -1.486572265625, -1.15478515625, -0.822998046875, -0.4912109375, -0.159423828125, 0.17236328125, 0.504150390625, 0.8359375, 1.167724609375, 1.49951171875, 1.831298828125, 2.1630859375, 2.494873046875, 2.82666015625, 3.158447265625, 3.490234375, 3.822021484375, 4.15380859375, 4.485595703125, 4.8173828125, 5.149169921875, 5.48095703125, 5.812744140625, 6.14453125, 6.476318359375, 6.80810546875, 7.139892578125, 7.4716796875, 7.803466796875, 8.13525390625, 8.467041015625, 8.798828125, 9.130615234375, 9.46240234375, 9.794189453125, 10.1259765625, 10.457763671875, 10.78955078125, 11.121337890625, 11.453125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 6.0, 8.0, 13.0, 11.0, 19.0, 40.0, 50.0, 71.0, 67.0, 112.0, 150.0, 125.0, 85.0, 67.0, 41.0, 26.0, 22.0, 18.0, 16.0, 13.0, 7.0, 4.0, 6.0, 3.0, 7.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.9298095703125, -9.625244140625, -9.3206787109375, -9.01611328125, -8.7115478515625, -8.406982421875, -8.1024169921875, -7.7978515625, -7.4932861328125, -7.188720703125, -6.8841552734375, -6.57958984375, -6.2750244140625, -5.970458984375, -5.6658935546875, -5.361328125, -5.0567626953125, -4.752197265625, -4.4476318359375, -4.14306640625, -3.8385009765625, -3.533935546875, -3.2293701171875, -2.9248046875, -2.6202392578125, -2.315673828125, -2.0111083984375, -1.70654296875, -1.4019775390625, -1.097412109375, -0.7928466796875, -0.48828125, -0.1837158203125, 0.120849609375, 0.4254150390625, 0.72998046875, 1.0345458984375, 1.339111328125, 1.6436767578125, 1.9482421875, 2.2528076171875, 2.557373046875, 2.8619384765625, 3.16650390625, 3.4710693359375, 3.775634765625, 4.0802001953125, 4.384765625, 4.6893310546875, 4.993896484375, 5.2984619140625, 5.60302734375, 5.9075927734375, 6.212158203125, 6.5167236328125, 6.8212890625, 7.1258544921875, 7.430419921875, 7.7349853515625, 8.03955078125, 8.3441162109375, 8.648681640625, 8.9532470703125, 9.2578125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 20.0, 19.0, 46.0, 102.0, 139.0, 184.0, 170.0, 125.0, 94.0, 56.0, 29.0, 17.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.27543640136719, -74.3579330444336, -69.4404296875, -64.52291870117188, -59.60541534423828, -54.68791198730469, -49.77040481567383, -44.85289764404297, -39.935394287109375, -35.01789093017578, -30.100383758544922, -25.182878494262695, -20.26537322998047, -15.347867965698242, -10.430362701416016, -5.512855529785156, -0.5953521728515625, 4.322153091430664, 9.23965835571289, 14.157163619995117, 19.074668884277344, 23.99217414855957, 28.909679412841797, 33.827186584472656, 38.74468994140625, 43.662193298339844, 48.5797004699707, 53.49720764160156, 58.414710998535156, 63.33221435546875, 68.24972534179688, 73.16722869873047, 78.08473205566406, 83.00223541259766, 87.91973876953125, 92.83724975585938, 97.75475311279297, 102.67225646972656, 107.58976745605469, 112.50727081298828, 117.42477416992188, 122.34227752685547, 127.25978088378906, 132.1772918701172, 137.09478759765625, 142.01229858398438, 146.9298095703125, 151.84732055664062, 156.7648162841797, 161.6823272705078, 166.59982299804688, 171.517333984375, 176.43484497070312, 181.3523406982422, 186.2698516845703, 191.18734741210938, 196.1048583984375, 201.02236938476562, 205.9398651123047, 210.8573760986328, 215.77487182617188, 220.6923828125, 225.60989379882812, 230.52740478515625, 235.4449005126953]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 8.0, 8.0, 11.0, 22.0, 13.0, 18.0, 23.0, 38.0, 29.0, 29.0, 42.0, 42.0, 46.0, 48.0, 33.0, 34.0, 56.0, 45.0, 41.0, 36.0, 36.0, 42.0, 39.0, 39.0, 39.0, 25.0, 31.0, 18.0, 19.0, 12.0, 13.0, 12.0, 3.0, 6.0, 7.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-65.46266174316406, -63.459285736083984, -61.455909729003906, -59.45252990722656, -57.449153900146484, -55.445777893066406, -53.44239807128906, -51.439022064208984, -49.435646057128906, -47.43227005004883, -45.42889404296875, -43.425514221191406, -41.42213821411133, -39.41876220703125, -37.415382385253906, -35.41200637817383, -33.40863037109375, -31.405254364013672, -29.40187644958496, -27.39849853515625, -25.395122528076172, -23.391746520996094, -21.388368606567383, -19.384990692138672, -17.381614685058594, -15.3782377243042, -13.374860763549805, -11.37148380279541, -9.368106842041016, -7.364729881286621, -5.361352920532227, -3.357975959777832, -1.3546066284179688, 0.6487703323364258, 2.6521472930908203, 4.655524253845215, 6.658901214599609, 8.662278175354004, 10.665655136108398, 12.669032096862793, 14.672409057617188, 16.675785064697266, 18.679162979125977, 20.682540893554688, 22.685916900634766, 24.689292907714844, 26.692670822143555, 28.696048736572266, 30.699424743652344, 32.70280075073242, 34.7061767578125, 36.709556579589844, 38.71293258666992, 40.71630859375, 42.719688415527344, 44.72306442260742, 46.7264404296875, 48.72981643676758, 50.733192443847656, 52.736572265625, 54.73994827270508, 56.743324279785156, 58.7467041015625, 60.75008010864258, 62.753456115722656]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 10.0, 7.0, 13.0, 25.0, 16.0, 32.0, 24.0, 43.0, 68.0, 97.0, 147.0, 175.0, 278.0, 405.0, 614.0, 980.0, 1613.0, 2821.0, 5023.0, 9800.0, 21426.0, 55353.0, 210935.0, 3191116.0, 535196.0, 94970.0, 32388.0, 14277.0, 7006.0, 3759.0, 2108.0, 1240.0, 759.0, 497.0, 333.0, 211.0, 156.0, 108.0, 80.0, 44.0, 37.0, 22.0, 17.0, 12.0, 14.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-23.3125, -22.621337890625, -21.93017578125, -21.239013671875, -20.5478515625, -19.856689453125, -19.16552734375, -18.474365234375, -17.783203125, -17.092041015625, -16.40087890625, -15.709716796875, -15.0185546875, -14.327392578125, -13.63623046875, -12.945068359375, -12.25390625, -11.562744140625, -10.87158203125, -10.180419921875, -9.4892578125, -8.798095703125, -8.10693359375, -7.415771484375, -6.724609375, -6.033447265625, -5.34228515625, -4.651123046875, -3.9599609375, -3.268798828125, -2.57763671875, -1.886474609375, -1.1953125, -0.504150390625, 0.18701171875, 0.878173828125, 1.5693359375, 2.260498046875, 2.95166015625, 3.642822265625, 4.333984375, 5.025146484375, 5.71630859375, 6.407470703125, 7.0986328125, 7.789794921875, 8.48095703125, 9.172119140625, 9.86328125, 10.554443359375, 11.24560546875, 11.936767578125, 12.6279296875, 13.319091796875, 14.01025390625, 14.701416015625, 15.392578125, 16.083740234375, 16.77490234375, 17.466064453125, 18.1572265625, 18.848388671875, 19.53955078125, 20.230712890625, 20.921875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 12.0, 7.0, 13.0, 18.0, 14.0, 17.0, 27.0, 25.0, 22.0, 43.0, 36.0, 48.0, 38.0, 50.0, 47.0, 56.0, 31.0, 34.0, 48.0, 38.0, 46.0, 32.0, 45.0, 34.0, 39.0, 39.0, 23.0, 18.0, 11.0, 13.0, 18.0, 12.0, 6.0, 4.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.888671875, -2.79107666015625, -2.6934814453125, -2.59588623046875, -2.498291015625, -2.40069580078125, -2.3031005859375, -2.20550537109375, -2.10791015625, -2.01031494140625, -1.9127197265625, -1.81512451171875, -1.717529296875, -1.61993408203125, -1.5223388671875, -1.42474365234375, -1.3271484375, -1.22955322265625, -1.1319580078125, -1.03436279296875, -0.936767578125, -0.83917236328125, -0.7415771484375, -0.64398193359375, -0.54638671875, -0.44879150390625, -0.3511962890625, -0.25360107421875, -0.156005859375, -0.05841064453125, 0.0391845703125, 0.13677978515625, 0.234375, 0.33197021484375, 0.4295654296875, 0.52716064453125, 0.624755859375, 0.72235107421875, 0.8199462890625, 0.91754150390625, 1.01513671875, 1.11273193359375, 1.2103271484375, 1.30792236328125, 1.405517578125, 1.50311279296875, 1.6007080078125, 1.69830322265625, 1.7958984375, 1.89349365234375, 1.9910888671875, 2.08868408203125, 2.186279296875, 2.28387451171875, 2.3814697265625, 2.47906494140625, 2.57666015625, 2.67425537109375, 2.7718505859375, 2.86944580078125, 2.967041015625, 3.06463623046875, 3.1622314453125, 3.25982666015625, 3.357421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 8.0, 11.0, 15.0, 19.0, 18.0, 19.0, 35.0, 34.0, 75.0, 102.0, 162.0, 255.0, 418.0, 692.0, 1376.0, 2557.0, 5616.0, 13397.0, 36560.0, 128500.0, 973631.0, 2761622.0, 189555.0, 48937.0, 16962.0, 6888.0, 3136.0, 1682.0, 775.0, 451.0, 258.0, 154.0, 103.0, 76.0, 61.0, 39.0, 29.0, 17.0, 14.0, 6.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.6875, -19.110595703125, -18.53369140625, -17.956787109375, -17.3798828125, -16.802978515625, -16.22607421875, -15.649169921875, -15.072265625, -14.495361328125, -13.91845703125, -13.341552734375, -12.7646484375, -12.187744140625, -11.61083984375, -11.033935546875, -10.45703125, -9.880126953125, -9.30322265625, -8.726318359375, -8.1494140625, -7.572509765625, -6.99560546875, -6.418701171875, -5.841796875, -5.264892578125, -4.68798828125, -4.111083984375, -3.5341796875, -2.957275390625, -2.38037109375, -1.803466796875, -1.2265625, -0.649658203125, -0.07275390625, 0.504150390625, 1.0810546875, 1.657958984375, 2.23486328125, 2.811767578125, 3.388671875, 3.965576171875, 4.54248046875, 5.119384765625, 5.6962890625, 6.273193359375, 6.85009765625, 7.427001953125, 8.00390625, 8.580810546875, 9.15771484375, 9.734619140625, 10.3115234375, 10.888427734375, 11.46533203125, 12.042236328125, 12.619140625, 13.196044921875, 13.77294921875, 14.349853515625, 14.9267578125, 15.503662109375, 16.08056640625, 16.657470703125, 17.234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 6.0, 3.0, 6.0, 3.0, 15.0, 12.0, 23.0, 34.0, 54.0, 61.0, 108.0, 230.0, 486.0, 1653.0, 634.0, 308.0, 147.0, 85.0, 63.0, 47.0, 28.0, 17.0, 11.0, 7.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.953125, -8.6876220703125, -8.422119140625, -8.1566162109375, -7.89111328125, -7.6256103515625, -7.360107421875, -7.0946044921875, -6.8291015625, -6.5635986328125, -6.298095703125, -6.0325927734375, -5.76708984375, -5.5015869140625, -5.236083984375, -4.9705810546875, -4.705078125, -4.4395751953125, -4.174072265625, -3.9085693359375, -3.64306640625, -3.3775634765625, -3.112060546875, -2.8465576171875, -2.5810546875, -2.3155517578125, -2.050048828125, -1.7845458984375, -1.51904296875, -1.2535400390625, -0.988037109375, -0.7225341796875, -0.45703125, -0.1915283203125, 0.073974609375, 0.3394775390625, 0.60498046875, 0.8704833984375, 1.135986328125, 1.4014892578125, 1.6669921875, 1.9324951171875, 2.197998046875, 2.4635009765625, 2.72900390625, 2.9945068359375, 3.260009765625, 3.5255126953125, 3.791015625, 4.0565185546875, 4.322021484375, 4.5875244140625, 4.85302734375, 5.1185302734375, 5.384033203125, 5.6495361328125, 5.9150390625, 6.1805419921875, 6.446044921875, 6.7115478515625, 6.97705078125, 7.2425537109375, 7.508056640625, 7.7735595703125, 8.0390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 11.0, 7.0, 6.0, 9.0, 20.0, 21.0, 38.0, 54.0, 96.0, 109.0, 127.0, 126.0, 109.0, 94.0, 67.0, 35.0, 39.0, 17.0, 9.0, 10.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.28128051757812, -68.7434310913086, -67.2055892944336, -65.66773986816406, -64.12989044189453, -62.59204864501953, -61.05419921875, -59.516353607177734, -57.97850799560547, -56.4406623840332, -54.90281295776367, -53.364967346191406, -51.82712173461914, -50.289276123046875, -48.751426696777344, -47.21358108520508, -45.67573547363281, -44.13788986206055, -42.600040435791016, -41.06219482421875, -39.524349212646484, -37.98650360107422, -36.44865417480469, -34.91080856323242, -33.37295913696289, -31.835111618041992, -30.297266006469727, -28.759418487548828, -27.221572875976562, -25.683725357055664, -24.145877838134766, -22.6080322265625, -21.070188522338867, -19.53234100341797, -17.994495391845703, -16.456647872924805, -14.918802261352539, -13.38095474243164, -11.843108177185059, -10.305261611938477, -8.767415046691895, -7.2295684814453125, -5.6917219161987305, -4.15387487411499, -2.616028308868408, -1.0781817436218262, 0.45966529846191406, 1.997511863708496, 3.535358428955078, 5.07320499420166, 6.611051559448242, 8.14889907836914, 9.686744689941406, 11.224592208862305, 12.762438774108887, 14.300285339355469, 15.83813190460205, 17.375978469848633, 18.91382598876953, 20.451671600341797, 21.989519119262695, 23.52736473083496, 25.06521224975586, 26.603057861328125, 28.140905380249023]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 11.0, 11.0, 10.0, 9.0, 14.0, 17.0, 16.0, 26.0, 32.0, 29.0, 41.0, 32.0, 36.0, 46.0, 43.0, 37.0, 42.0, 38.0, 52.0, 35.0, 48.0, 40.0, 37.0, 58.0, 36.0, 29.0, 31.0, 24.0, 22.0, 21.0, 10.0, 19.0, 10.0, 4.0, 7.0, 2.0, 11.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.436439514160156, -25.6163387298584, -24.79623794555664, -23.976137161254883, -23.156036376953125, -22.335933685302734, -21.515832901000977, -20.69573211669922, -19.87563133239746, -19.055530548095703, -18.235429763793945, -17.415328979492188, -16.595226287841797, -15.775126457214355, -14.955024719238281, -14.134923934936523, -13.314823150634766, -12.494722366333008, -11.67462158203125, -10.854519844055176, -10.034419059753418, -9.21431827545166, -8.394216537475586, -7.574115753173828, -6.75401496887207, -5.9339141845703125, -5.1138129234313965, -4.2937116622924805, -3.4736108779907227, -2.653510093688965, -1.8334088325500488, -1.0133075714111328, -0.1932086944580078, 0.6268923282623291, 1.446993350982666, 2.267094373703003, 3.08719539642334, 3.9072961807250977, 4.727397441864014, 5.54749870300293, 6.3675994873046875, 7.187700271606445, 8.007801055908203, 8.827902793884277, 9.648003578186035, 10.468104362487793, 11.288206100463867, 12.108306884765625, 12.928407669067383, 13.74850845336914, 14.568609237670898, 15.388710975646973, 16.208812713623047, 17.028911590576172, 17.849014282226562, 18.66911506652832, 19.489215850830078, 20.309316635131836, 21.129417419433594, 21.94951820373535, 22.76961898803711, 23.5897216796875, 24.409822463989258, 25.229923248291016, 26.050024032592773]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 11.0, 12.0, 22.0, 30.0, 48.0, 68.0, 109.0, 217.0, 351.0, 569.0, 1144.0, 2368.0, 5256.0, 12797.0, 34871.0, 94199.0, 246733.0, 375501.0, 170368.0, 63832.0, 23607.0, 8883.0, 3813.0, 1781.0, 866.0, 438.0, 295.0, 152.0, 75.0, 52.0, 33.0, 22.0, 16.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.421875, -17.793212890625, -17.16455078125, -16.535888671875, -15.9072265625, -15.278564453125, -14.64990234375, -14.021240234375, -13.392578125, -12.763916015625, -12.13525390625, -11.506591796875, -10.8779296875, -10.249267578125, -9.62060546875, -8.991943359375, -8.36328125, -7.734619140625, -7.10595703125, -6.477294921875, -5.8486328125, -5.219970703125, -4.59130859375, -3.962646484375, -3.333984375, -2.705322265625, -2.07666015625, -1.447998046875, -0.8193359375, -0.190673828125, 0.43798828125, 1.066650390625, 1.6953125, 2.323974609375, 2.95263671875, 3.581298828125, 4.2099609375, 4.838623046875, 5.46728515625, 6.095947265625, 6.724609375, 7.353271484375, 7.98193359375, 8.610595703125, 9.2392578125, 9.867919921875, 10.49658203125, 11.125244140625, 11.75390625, 12.382568359375, 13.01123046875, 13.639892578125, 14.2685546875, 14.897216796875, 15.52587890625, 16.154541015625, 16.783203125, 17.411865234375, 18.04052734375, 18.669189453125, 19.2978515625, 19.926513671875, 20.55517578125, 21.183837890625, 21.8125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 3.0, 9.0, 10.0, 15.0, 16.0, 16.0, 31.0, 26.0, 24.0, 27.0, 42.0, 56.0, 53.0, 53.0, 55.0, 53.0, 50.0, 43.0, 37.0, 46.0, 44.0, 47.0, 35.0, 34.0, 38.0, 21.0, 16.0, 19.0, 20.0, 11.0, 12.0, 7.0, 6.0, 8.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.255859375, -3.141693115234375, -3.02752685546875, -2.913360595703125, -2.7991943359375, -2.685028076171875, -2.57086181640625, -2.456695556640625, -2.342529296875, -2.228363037109375, -2.11419677734375, -2.000030517578125, -1.8858642578125, -1.771697998046875, -1.65753173828125, -1.543365478515625, -1.42919921875, -1.315032958984375, -1.20086669921875, -1.086700439453125, -0.9725341796875, -0.858367919921875, -0.74420166015625, -0.630035400390625, -0.515869140625, -0.401702880859375, -0.28753662109375, -0.173370361328125, -0.0592041015625, 0.054962158203125, 0.16912841796875, 0.283294677734375, 0.3974609375, 0.511627197265625, 0.62579345703125, 0.739959716796875, 0.8541259765625, 0.968292236328125, 1.08245849609375, 1.196624755859375, 1.310791015625, 1.424957275390625, 1.53912353515625, 1.653289794921875, 1.7674560546875, 1.881622314453125, 1.99578857421875, 2.109954833984375, 2.22412109375, 2.338287353515625, 2.45245361328125, 2.566619873046875, 2.6807861328125, 2.794952392578125, 2.90911865234375, 3.023284912109375, 3.137451171875, 3.251617431640625, 3.36578369140625, 3.479949951171875, 3.5941162109375, 3.708282470703125, 3.82244873046875, 3.936614990234375, 4.05078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 3.0, 6.0, 12.0, 9.0, 13.0, 22.0, 16.0, 32.0, 33.0, 37.0, 63.0, 58.0, 87.0, 78.0, 132.0, 157.0, 223.0, 292.0, 382.0, 513.0, 850.0, 1728.0, 4799.0, 18268.0, 84723.0, 371706.0, 430680.0, 101306.0, 21719.0, 5414.0, 1935.0, 926.0, 583.0, 364.0, 311.0, 234.0, 167.0, 142.0, 118.0, 86.0, 67.0, 46.0, 41.0, 40.0, 30.0, 30.0, 22.0, 15.0, 7.0, 9.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-21.25, -20.587158203125, -19.92431640625, -19.261474609375, -18.5986328125, -17.935791015625, -17.27294921875, -16.610107421875, -15.947265625, -15.284423828125, -14.62158203125, -13.958740234375, -13.2958984375, -12.633056640625, -11.97021484375, -11.307373046875, -10.64453125, -9.981689453125, -9.31884765625, -8.656005859375, -7.9931640625, -7.330322265625, -6.66748046875, -6.004638671875, -5.341796875, -4.678955078125, -4.01611328125, -3.353271484375, -2.6904296875, -2.027587890625, -1.36474609375, -0.701904296875, -0.0390625, 0.623779296875, 1.28662109375, 1.949462890625, 2.6123046875, 3.275146484375, 3.93798828125, 4.600830078125, 5.263671875, 5.926513671875, 6.58935546875, 7.252197265625, 7.9150390625, 8.577880859375, 9.24072265625, 9.903564453125, 10.56640625, 11.229248046875, 11.89208984375, 12.554931640625, 13.2177734375, 13.880615234375, 14.54345703125, 15.206298828125, 15.869140625, 16.531982421875, 17.19482421875, 17.857666015625, 18.5205078125, 19.183349609375, 19.84619140625, 20.509033203125, 21.171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 12.0, 10.0, 12.0, 13.0, 17.0, 19.0, 17.0, 19.0, 29.0, 28.0, 41.0, 30.0, 27.0, 38.0, 36.0, 32.0, 51.0, 46.0, 51.0, 42.0, 43.0, 43.0, 43.0, 37.0, 42.0, 31.0, 32.0, 26.0, 16.0, 11.0, 14.0, 14.0, 12.0, 10.0, 11.0, 7.0, 7.0, 4.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.390625, -13.9525146484375, -13.514404296875, -13.0762939453125, -12.63818359375, -12.2000732421875, -11.761962890625, -11.3238525390625, -10.8857421875, -10.4476318359375, -10.009521484375, -9.5714111328125, -9.13330078125, -8.6951904296875, -8.257080078125, -7.8189697265625, -7.380859375, -6.9427490234375, -6.504638671875, -6.0665283203125, -5.62841796875, -5.1903076171875, -4.752197265625, -4.3140869140625, -3.8759765625, -3.4378662109375, -2.999755859375, -2.5616455078125, -2.12353515625, -1.6854248046875, -1.247314453125, -0.8092041015625, -0.37109375, 0.0670166015625, 0.505126953125, 0.9432373046875, 1.38134765625, 1.8194580078125, 2.257568359375, 2.6956787109375, 3.1337890625, 3.5718994140625, 4.010009765625, 4.4481201171875, 4.88623046875, 5.3243408203125, 5.762451171875, 6.2005615234375, 6.638671875, 7.0767822265625, 7.514892578125, 7.9530029296875, 8.39111328125, 8.8292236328125, 9.267333984375, 9.7054443359375, 10.1435546875, 10.5816650390625, 11.019775390625, 11.4578857421875, 11.89599609375, 12.3341064453125, 12.772216796875, 13.2103271484375, 13.6484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 19.0, 21.0, 33.0, 65.0, 116.0, 303.0, 723.0, 2587.0, 13211.0, 136857.0, 778676.0, 101832.0, 10671.0, 2196.0, 701.0, 264.0, 120.0, 58.0, 27.0, 21.0, 15.0, 12.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.515625, -21.88037109375, -21.2451171875, -20.60986328125, -19.974609375, -19.33935546875, -18.7041015625, -18.06884765625, -17.43359375, -16.79833984375, -16.1630859375, -15.52783203125, -14.892578125, -14.25732421875, -13.6220703125, -12.98681640625, -12.3515625, -11.71630859375, -11.0810546875, -10.44580078125, -9.810546875, -9.17529296875, -8.5400390625, -7.90478515625, -7.26953125, -6.63427734375, -5.9990234375, -5.36376953125, -4.728515625, -4.09326171875, -3.4580078125, -2.82275390625, -2.1875, -1.55224609375, -0.9169921875, -0.28173828125, 0.353515625, 0.98876953125, 1.6240234375, 2.25927734375, 2.89453125, 3.52978515625, 4.1650390625, 4.80029296875, 5.435546875, 6.07080078125, 6.7060546875, 7.34130859375, 7.9765625, 8.61181640625, 9.2470703125, 9.88232421875, 10.517578125, 11.15283203125, 11.7880859375, 12.42333984375, 13.05859375, 13.69384765625, 14.3291015625, 14.96435546875, 15.599609375, 16.23486328125, 16.8701171875, 17.50537109375, 18.140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 7.0, 16.0, 24.0, 23.0, 40.0, 45.0, 70.0, 106.0, 169.0, 193.0, 87.0, 53.0, 43.0, 31.0, 27.0, 12.0, 14.0, 11.0, 6.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.003566741943359375, -0.003490731120109558, -0.003414720296859741, -0.0033387094736099243, -0.0032626986503601074, -0.0031866878271102905, -0.0031106770038604736, -0.0030346661806106567, -0.00295865535736084, -0.002882644534111023, -0.002806633710861206, -0.002730622887611389, -0.0026546120643615723, -0.0025786012411117554, -0.0025025904178619385, -0.0024265795946121216, -0.0023505687713623047, -0.002274557948112488, -0.002198547124862671, -0.002122536301612854, -0.002046525478363037, -0.00197051465511322, -0.0018945038318634033, -0.0018184930086135864, -0.0017424821853637695, -0.0016664713621139526, -0.0015904605388641357, -0.0015144497156143188, -0.001438438892364502, -0.001362428069114685, -0.0012864172458648682, -0.0012104064226150513, -0.0011343955993652344, -0.0010583847761154175, -0.0009823739528656006, -0.0009063631296157837, -0.0008303523063659668, -0.0007543414831161499, -0.000678330659866333, -0.0006023198366165161, -0.0005263090133666992, -0.0004502981901168823, -0.00037428736686706543, -0.00029827654361724854, -0.00022226572036743164, -0.00014625489711761475, -7.024407386779785e-05, 5.766749382019043e-06, 8.177757263183594e-05, 0.00015778839588165283, 0.00023379921913146973, 0.0003098100423812866, 0.0003858208656311035, 0.0004618316888809204, 0.0005378425121307373, 0.0006138533353805542, 0.0006898641586303711, 0.000765874981880188, 0.0008418858051300049, 0.0009178966283798218, 0.0009939074516296387, 0.0010699182748794556, 0.0011459290981292725, 0.0012219399213790894, 0.0012979507446289062]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 8.0, 10.0, 17.0, 50.0, 71.0, 110.0, 174.0, 388.0, 1011.0, 4323.0, 65754.0, 903294.0, 67108.0, 4298.0, 973.0, 412.0, 208.0, 135.0, 83.0, 43.0, 31.0, 16.0, 11.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.40625, -34.436279296875, -33.46630859375, -32.496337890625, -31.5263671875, -30.556396484375, -29.58642578125, -28.616455078125, -27.646484375, -26.676513671875, -25.70654296875, -24.736572265625, -23.7666015625, -22.796630859375, -21.82666015625, -20.856689453125, -19.88671875, -18.916748046875, -17.94677734375, -16.976806640625, -16.0068359375, -15.036865234375, -14.06689453125, -13.096923828125, -12.126953125, -11.156982421875, -10.18701171875, -9.217041015625, -8.2470703125, -7.277099609375, -6.30712890625, -5.337158203125, -4.3671875, -3.397216796875, -2.42724609375, -1.457275390625, -0.4873046875, 0.482666015625, 1.45263671875, 2.422607421875, 3.392578125, 4.362548828125, 5.33251953125, 6.302490234375, 7.2724609375, 8.242431640625, 9.21240234375, 10.182373046875, 11.15234375, 12.122314453125, 13.09228515625, 14.062255859375, 15.0322265625, 16.002197265625, 16.97216796875, 17.942138671875, 18.912109375, 19.882080078125, 20.85205078125, 21.822021484375, 22.7919921875, 23.761962890625, 24.73193359375, 25.701904296875, 26.671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 11.0, 11.0, 27.0, 32.0, 37.0, 52.0, 75.0, 104.0, 99.0, 150.0, 105.0, 74.0, 50.0, 43.0, 25.0, 26.0, 20.0, 16.0, 14.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.8515625, -13.4691162109375, -13.086669921875, -12.7042236328125, -12.32177734375, -11.9393310546875, -11.556884765625, -11.1744384765625, -10.7919921875, -10.4095458984375, -10.027099609375, -9.6446533203125, -9.26220703125, -8.8797607421875, -8.497314453125, -8.1148681640625, -7.732421875, -7.3499755859375, -6.967529296875, -6.5850830078125, -6.20263671875, -5.8201904296875, -5.437744140625, -5.0552978515625, -4.6728515625, -4.2904052734375, -3.907958984375, -3.5255126953125, -3.14306640625, -2.7606201171875, -2.378173828125, -1.9957275390625, -1.61328125, -1.2308349609375, -0.848388671875, -0.4659423828125, -0.08349609375, 0.2989501953125, 0.681396484375, 1.0638427734375, 1.4462890625, 1.8287353515625, 2.211181640625, 2.5936279296875, 2.97607421875, 3.3585205078125, 3.740966796875, 4.1234130859375, 4.505859375, 4.8883056640625, 5.270751953125, 5.6531982421875, 6.03564453125, 6.4180908203125, 6.800537109375, 7.1829833984375, 7.5654296875, 7.9478759765625, 8.330322265625, 8.7127685546875, 9.09521484375, 9.4776611328125, 9.860107421875, 10.2425537109375, 10.625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 14.0, 29.0, 98.0, 229.0, 328.0, 194.0, 85.0, 24.0, 9.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-400.1737365722656, -389.239990234375, -378.3062744140625, -367.3725280761719, -356.4388122558594, -345.50506591796875, -334.57135009765625, -323.6376037597656, -312.703857421875, -301.7701110839844, -290.8363952636719, -279.90264892578125, -268.96893310546875, -258.0351867675781, -247.10145568847656, -236.167724609375, -225.2340087890625, -214.30027770996094, -203.36654663085938, -192.43280029296875, -181.49908447265625, -170.56533813476562, -159.63160705566406, -148.6978759765625, -137.76414489746094, -126.83041381835938, -115.89668273925781, -104.96294403076172, -94.02921295166016, -83.0954818725586, -72.1617431640625, -61.22801208496094, -50.2943115234375, -39.36058044433594, -28.42684555053711, -17.49311065673828, -6.559379577636719, 4.374351501464844, 15.308090209960938, 26.2418212890625, 37.17555236816406, 48.109283447265625, 59.04301834106445, 69.97675323486328, 80.91048431396484, 91.8442153930664, 102.7779541015625, 113.71168518066406, 124.64541625976562, 135.5791473388672, 146.51287841796875, 157.44662475585938, 168.38034057617188, 179.3140869140625, 190.24781799316406, 201.18154907226562, 212.1152801513672, 223.04901123046875, 233.9827423095703, 244.91647338867188, 255.8502197265625, 266.783935546875, 277.7176818847656, 288.65142822265625, 299.58514404296875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 3.0, 8.0, 9.0, 13.0, 13.0, 12.0, 21.0, 20.0, 23.0, 21.0, 33.0, 36.0, 34.0, 34.0, 44.0, 34.0, 30.0, 30.0, 31.0, 51.0, 44.0, 42.0, 38.0, 52.0, 31.0, 39.0, 28.0, 31.0, 29.0, 28.0, 13.0, 26.0, 15.0, 16.0, 17.0, 15.0, 7.0, 3.0, 6.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-79.36653137207031, -77.12184143066406, -74.87715148925781, -72.63246154785156, -70.38777160644531, -68.14308166503906, -65.89839172363281, -63.65370178222656, -61.40901184082031, -59.16432189941406, -56.91963195800781, -54.67494201660156, -52.43025207519531, -50.18556213378906, -47.94087219238281, -45.69618225097656, -43.45149230957031, -41.20680236816406, -38.96211242675781, -36.71742248535156, -34.47273254394531, -32.22804260253906, -29.983352661132812, -27.738662719726562, -25.493972778320312, -23.249282836914062, -21.004592895507812, -18.759902954101562, -16.515213012695312, -14.270523071289062, -12.025833129882812, -9.781143188476562, -7.536445617675781, -5.291755676269531, -3.0470657348632812, -0.8023757934570312, 1.4423141479492188, 3.6870040893554688, 5.931694030761719, 8.176383972167969, 10.421073913574219, 12.665763854980469, 14.910453796386719, 17.15514373779297, 19.39983367919922, 21.64452362060547, 23.88921356201172, 26.13390350341797, 28.37859344482422, 30.62328338623047, 32.86797332763672, 35.11266326904297, 37.35735321044922, 39.60204315185547, 41.84673309326172, 44.09142303466797, 46.33611297607422, 48.58080291748047, 50.82549285888672, 53.07018280029297, 55.31487274169922, 57.55956268310547, 59.80425262451172, 62.04894256591797, 64.29363250732422]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0, 10.0, 6.0, 6.0, 16.0, 21.0, 42.0, 36.0, 61.0, 86.0, 130.0, 213.0, 301.0, 422.0, 698.0, 1246.0, 2079.0, 3990.0, 8053.0, 18524.0, 49165.0, 167850.0, 1205398.0, 2424258.0, 211326.0, 58315.0, 21611.0, 9487.0, 4728.0, 2434.0, 1406.0, 822.0, 524.0, 334.0, 190.0, 163.0, 107.0, 51.0, 63.0, 35.0, 23.0, 16.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-20.328125, -19.7799072265625, -19.231689453125, -18.6834716796875, -18.13525390625, -17.5870361328125, -17.038818359375, -16.4906005859375, -15.9423828125, -15.3941650390625, -14.845947265625, -14.2977294921875, -13.74951171875, -13.2012939453125, -12.653076171875, -12.1048583984375, -11.556640625, -11.0084228515625, -10.460205078125, -9.9119873046875, -9.36376953125, -8.8155517578125, -8.267333984375, -7.7191162109375, -7.1708984375, -6.6226806640625, -6.074462890625, -5.5262451171875, -4.97802734375, -4.4298095703125, -3.881591796875, -3.3333740234375, -2.78515625, -2.2369384765625, -1.688720703125, -1.1405029296875, -0.59228515625, -0.0440673828125, 0.504150390625, 1.0523681640625, 1.6005859375, 2.1488037109375, 2.697021484375, 3.2452392578125, 3.79345703125, 4.3416748046875, 4.889892578125, 5.4381103515625, 5.986328125, 6.5345458984375, 7.082763671875, 7.6309814453125, 8.17919921875, 8.7274169921875, 9.275634765625, 9.8238525390625, 10.3720703125, 10.9202880859375, 11.468505859375, 12.0167236328125, 12.56494140625, 13.1131591796875, 13.661376953125, 14.2095947265625, 14.7578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 11.0, 4.0, 11.0, 21.0, 24.0, 21.0, 17.0, 28.0, 33.0, 37.0, 52.0, 47.0, 36.0, 67.0, 49.0, 64.0, 52.0, 43.0, 42.0, 39.0, 36.0, 36.0, 36.0, 36.0, 34.0, 28.0, 19.0, 15.0, 10.0, 14.0, 8.0, 5.0, 6.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.615234375, -3.493499755859375, -3.37176513671875, -3.250030517578125, -3.1282958984375, -3.006561279296875, -2.88482666015625, -2.763092041015625, -2.641357421875, -2.519622802734375, -2.39788818359375, -2.276153564453125, -2.1544189453125, -2.032684326171875, -1.91094970703125, -1.789215087890625, -1.66748046875, -1.545745849609375, -1.42401123046875, -1.302276611328125, -1.1805419921875, -1.058807373046875, -0.93707275390625, -0.815338134765625, -0.693603515625, -0.571868896484375, -0.45013427734375, -0.328399658203125, -0.2066650390625, -0.084930419921875, 0.03680419921875, 0.158538818359375, 0.2802734375, 0.402008056640625, 0.52374267578125, 0.645477294921875, 0.7672119140625, 0.888946533203125, 1.01068115234375, 1.132415771484375, 1.254150390625, 1.375885009765625, 1.49761962890625, 1.619354248046875, 1.7410888671875, 1.862823486328125, 1.98455810546875, 2.106292724609375, 2.22802734375, 2.349761962890625, 2.47149658203125, 2.593231201171875, 2.7149658203125, 2.836700439453125, 2.95843505859375, 3.080169677734375, 3.201904296875, 3.323638916015625, 3.44537353515625, 3.567108154296875, 3.6888427734375, 3.810577392578125, 3.93231201171875, 4.054046630859375, 4.17578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 8.0, 4.0, 10.0, 11.0, 17.0, 24.0, 26.0, 61.0, 65.0, 121.0, 190.0, 320.0, 510.0, 818.0, 1573.0, 2546.0, 5094.0, 10242.0, 23275.0, 60678.0, 193231.0, 967851.0, 2432273.0, 339201.0, 93972.0, 33561.0, 14069.0, 6648.0, 3447.0, 1820.0, 991.0, 634.0, 370.0, 203.0, 151.0, 106.0, 59.0, 46.0, 21.0, 18.0, 8.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.345703125, -12.91796875, -12.490234375, -12.0625, -11.634765625, -11.20703125, -10.779296875, -10.3515625, -9.923828125, -9.49609375, -9.068359375, -8.640625, -8.212890625, -7.78515625, -7.357421875, -6.9296875, -6.501953125, -6.07421875, -5.646484375, -5.21875, -4.791015625, -4.36328125, -3.935546875, -3.5078125, -3.080078125, -2.65234375, -2.224609375, -1.796875, -1.369140625, -0.94140625, -0.513671875, -0.0859375, 0.341796875, 0.76953125, 1.197265625, 1.625, 2.052734375, 2.48046875, 2.908203125, 3.3359375, 3.763671875, 4.19140625, 4.619140625, 5.046875, 5.474609375, 5.90234375, 6.330078125, 6.7578125, 7.185546875, 7.61328125, 8.041015625, 8.46875, 8.896484375, 9.32421875, 9.751953125, 10.1796875, 10.607421875, 11.03515625, 11.462890625, 11.890625, 12.318359375, 12.74609375, 13.173828125, 13.6015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 5.0, 5.0, 5.0, 6.0, 12.0, 11.0, 13.0, 16.0, 40.0, 39.0, 64.0, 91.0, 149.0, 203.0, 328.0, 668.0, 1076.0, 464.0, 303.0, 162.0, 118.0, 69.0, 57.0, 47.0, 20.0, 25.0, 16.0, 15.0, 6.0, 5.0, 5.0, 2.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.75225830078125, -8.4888916015625, -8.22552490234375, -7.962158203125, -7.69879150390625, -7.4354248046875, -7.17205810546875, -6.90869140625, -6.64532470703125, -6.3819580078125, -6.11859130859375, -5.855224609375, -5.59185791015625, -5.3284912109375, -5.06512451171875, -4.8017578125, -4.53839111328125, -4.2750244140625, -4.01165771484375, -3.748291015625, -3.48492431640625, -3.2215576171875, -2.95819091796875, -2.69482421875, -2.43145751953125, -2.1680908203125, -1.90472412109375, -1.641357421875, -1.37799072265625, -1.1146240234375, -0.85125732421875, -0.587890625, -0.32452392578125, -0.0611572265625, 0.20220947265625, 0.465576171875, 0.72894287109375, 0.9923095703125, 1.25567626953125, 1.51904296875, 1.78240966796875, 2.0457763671875, 2.30914306640625, 2.572509765625, 2.83587646484375, 3.0992431640625, 3.36260986328125, 3.6259765625, 3.88934326171875, 4.1527099609375, 4.41607666015625, 4.679443359375, 4.94281005859375, 5.2061767578125, 5.46954345703125, 5.73291015625, 5.99627685546875, 6.2596435546875, 6.52301025390625, 6.786376953125, 7.04974365234375, 7.3131103515625, 7.57647705078125, 7.83984375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 27.0, 39.0, 116.0, 219.0, 246.0, 190.0, 90.0, 49.0, 15.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.73622131347656, -135.66502380371094, -131.5938262939453, -127.52262878417969, -123.45142364501953, -119.3802261352539, -115.30902862548828, -111.23783111572266, -107.1666259765625, -103.09542846679688, -99.02423095703125, -94.95303344726562, -90.88182830810547, -86.81063079833984, -82.73943328857422, -78.6682357788086, -74.59703826904297, -70.52584075927734, -66.45464324951172, -62.38344192504883, -58.31224060058594, -54.24104309082031, -50.16984558105469, -46.09864807128906, -42.02744674682617, -37.95624923706055, -33.885047912597656, -29.81385040283203, -25.742650985717773, -21.671451568603516, -17.60025405883789, -13.529054641723633, -9.457855224609375, -5.386656284332275, -1.3154573440551758, 2.7557411193847656, 6.826940536499023, 10.898139953613281, 14.969337463378906, 19.040536880493164, 23.111736297607422, 27.18293571472168, 31.254135131835938, 35.32533264160156, 39.39653015136719, 43.46773147583008, 47.5389289855957, 51.610130310058594, 55.68132781982422, 59.752525329589844, 63.823726654052734, 67.89492797851562, 71.96612548828125, 76.03732299804688, 80.1085205078125, 84.17971801757812, 88.25091552734375, 92.32211303710938, 96.393310546875, 100.46450805664062, 104.53571319580078, 108.6069107055664, 112.67810821533203, 116.74930572509766, 120.82051086425781]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 7.0, 8.0, 12.0, 19.0, 15.0, 19.0, 21.0, 24.0, 33.0, 40.0, 35.0, 40.0, 51.0, 46.0, 55.0, 58.0, 33.0, 32.0, 44.0, 51.0, 31.0, 40.0, 45.0, 42.0, 28.0, 26.0, 17.0, 20.0, 19.0, 17.0, 18.0, 12.0, 10.0, 5.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.3070068359375, -29.253692626953125, -28.200380325317383, -27.14706802368164, -26.093753814697266, -25.04043960571289, -23.98712730407715, -22.933815002441406, -21.88050079345703, -20.827186584472656, -19.773874282836914, -18.720561981201172, -17.667247772216797, -16.613933563232422, -15.56062126159668, -14.507308006286621, -13.453994750976562, -12.400681495666504, -11.347368240356445, -10.294054985046387, -9.240741729736328, -8.18742847442627, -7.134115219116211, -6.080801963806152, -5.027488708496094, -3.974175453186035, -2.9208621978759766, -1.867548942565918, -0.8142356872558594, 0.23907756805419922, 1.2923908233642578, 2.3457040786743164, 3.3990211486816406, 4.452334403991699, 5.505647659301758, 6.558960914611816, 7.612274169921875, 8.665587425231934, 9.718900680541992, 10.77221393585205, 11.82552719116211, 12.878840446472168, 13.932153701782227, 14.985466957092285, 16.038780212402344, 17.09209442138672, 18.14540672302246, 19.198719024658203, 20.252033233642578, 21.305347442626953, 22.358659744262695, 23.411972045898438, 24.465286254882812, 25.518600463867188, 26.57191276550293, 27.625225067138672, 28.678539276123047, 29.731853485107422, 30.785165786743164, 31.838478088378906, 32.89179229736328, 33.945106506347656, 34.99842071533203, 36.05173110961914, 37.105045318603516]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 8.0, 17.0, 22.0, 26.0, 39.0, 70.0, 105.0, 163.0, 297.0, 467.0, 884.0, 1658.0, 3677.0, 8158.0, 19506.0, 49647.0, 131970.0, 297608.0, 305903.0, 138566.0, 52563.0, 20719.0, 8687.0, 3852.0, 1759.0, 900.0, 475.0, 305.0, 167.0, 109.0, 87.0, 48.0, 35.0, 25.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.953125, -17.392578125, -16.83203125, -16.271484375, -15.7109375, -15.150390625, -14.58984375, -14.029296875, -13.46875, -12.908203125, -12.34765625, -11.787109375, -11.2265625, -10.666015625, -10.10546875, -9.544921875, -8.984375, -8.423828125, -7.86328125, -7.302734375, -6.7421875, -6.181640625, -5.62109375, -5.060546875, -4.5, -3.939453125, -3.37890625, -2.818359375, -2.2578125, -1.697265625, -1.13671875, -0.576171875, -0.015625, 0.544921875, 1.10546875, 1.666015625, 2.2265625, 2.787109375, 3.34765625, 3.908203125, 4.46875, 5.029296875, 5.58984375, 6.150390625, 6.7109375, 7.271484375, 7.83203125, 8.392578125, 8.953125, 9.513671875, 10.07421875, 10.634765625, 11.1953125, 11.755859375, 12.31640625, 12.876953125, 13.4375, 13.998046875, 14.55859375, 15.119140625, 15.6796875, 16.240234375, 16.80078125, 17.361328125, 17.921875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 9.0, 15.0, 10.0, 18.0, 20.0, 16.0, 28.0, 35.0, 40.0, 56.0, 34.0, 52.0, 54.0, 49.0, 53.0, 50.0, 40.0, 47.0, 44.0, 43.0, 40.0, 41.0, 39.0, 22.0, 22.0, 16.0, 24.0, 16.0, 16.0, 9.0, 7.0, 8.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.623046875, -3.495330810546875, -3.36761474609375, -3.239898681640625, -3.1121826171875, -2.984466552734375, -2.85675048828125, -2.729034423828125, -2.601318359375, -2.473602294921875, -2.34588623046875, -2.218170166015625, -2.0904541015625, -1.962738037109375, -1.83502197265625, -1.707305908203125, -1.57958984375, -1.451873779296875, -1.32415771484375, -1.196441650390625, -1.0687255859375, -0.941009521484375, -0.81329345703125, -0.685577392578125, -0.557861328125, -0.430145263671875, -0.30242919921875, -0.174713134765625, -0.0469970703125, 0.080718994140625, 0.20843505859375, 0.336151123046875, 0.4638671875, 0.591583251953125, 0.71929931640625, 0.847015380859375, 0.9747314453125, 1.102447509765625, 1.23016357421875, 1.357879638671875, 1.485595703125, 1.613311767578125, 1.74102783203125, 1.868743896484375, 1.9964599609375, 2.124176025390625, 2.25189208984375, 2.379608154296875, 2.50732421875, 2.635040283203125, 2.76275634765625, 2.890472412109375, 3.0181884765625, 3.145904541015625, 3.27362060546875, 3.401336669921875, 3.529052734375, 3.656768798828125, 3.78448486328125, 3.912200927734375, 4.0399169921875, 4.167633056640625, 4.29534912109375, 4.423065185546875, 4.55078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 6.0, 10.0, 8.0, 12.0, 25.0, 22.0, 31.0, 39.0, 60.0, 91.0, 98.0, 126.0, 158.0, 224.0, 321.0, 448.0, 586.0, 1042.0, 2130.0, 7351.0, 45317.0, 347697.0, 540621.0, 83548.0, 11938.0, 2919.0, 1215.0, 702.0, 472.0, 314.0, 241.0, 186.0, 143.0, 100.0, 77.0, 70.0, 40.0, 32.0, 33.0, 23.0, 18.0, 8.0, 11.0, 11.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-27.0, -26.07373046875, -25.1474609375, -24.22119140625, -23.294921875, -22.36865234375, -21.4423828125, -20.51611328125, -19.58984375, -18.66357421875, -17.7373046875, -16.81103515625, -15.884765625, -14.95849609375, -14.0322265625, -13.10595703125, -12.1796875, -11.25341796875, -10.3271484375, -9.40087890625, -8.474609375, -7.54833984375, -6.6220703125, -5.69580078125, -4.76953125, -3.84326171875, -2.9169921875, -1.99072265625, -1.064453125, -0.13818359375, 0.7880859375, 1.71435546875, 2.640625, 3.56689453125, 4.4931640625, 5.41943359375, 6.345703125, 7.27197265625, 8.1982421875, 9.12451171875, 10.05078125, 10.97705078125, 11.9033203125, 12.82958984375, 13.755859375, 14.68212890625, 15.6083984375, 16.53466796875, 17.4609375, 18.38720703125, 19.3134765625, 20.23974609375, 21.166015625, 22.09228515625, 23.0185546875, 23.94482421875, 24.87109375, 25.79736328125, 26.7236328125, 27.64990234375, 28.576171875, 29.50244140625, 30.4287109375, 31.35498046875, 32.28125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 23.0, 9.0, 22.0, 27.0, 27.0, 35.0, 46.0, 38.0, 42.0, 50.0, 66.0, 58.0, 53.0, 56.0, 47.0, 67.0, 64.0, 45.0, 36.0, 31.0, 33.0, 28.0, 24.0, 17.0, 9.0, 12.0, 10.0, 3.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.75, -25.01025390625, -24.2705078125, -23.53076171875, -22.791015625, -22.05126953125, -21.3115234375, -20.57177734375, -19.83203125, -19.09228515625, -18.3525390625, -17.61279296875, -16.873046875, -16.13330078125, -15.3935546875, -14.65380859375, -13.9140625, -13.17431640625, -12.4345703125, -11.69482421875, -10.955078125, -10.21533203125, -9.4755859375, -8.73583984375, -7.99609375, -7.25634765625, -6.5166015625, -5.77685546875, -5.037109375, -4.29736328125, -3.5576171875, -2.81787109375, -2.078125, -1.33837890625, -0.5986328125, 0.14111328125, 0.880859375, 1.62060546875, 2.3603515625, 3.10009765625, 3.83984375, 4.57958984375, 5.3193359375, 6.05908203125, 6.798828125, 7.53857421875, 8.2783203125, 9.01806640625, 9.7578125, 10.49755859375, 11.2373046875, 11.97705078125, 12.716796875, 13.45654296875, 14.1962890625, 14.93603515625, 15.67578125, 16.41552734375, 17.1552734375, 17.89501953125, 18.634765625, 19.37451171875, 20.1142578125, 20.85400390625, 21.59375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 12.0, 14.0, 26.0, 46.0, 59.0, 90.0, 128.0, 261.0, 439.0, 850.0, 1679.0, 3776.0, 10965.0, 38648.0, 163986.0, 467383.0, 267621.0, 65540.0, 16848.0, 5444.0, 2209.0, 1117.0, 558.0, 321.0, 190.0, 121.0, 74.0, 43.0, 27.0, 25.0, 7.0, 12.0, 13.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.140625, -9.8564453125, -9.572265625, -9.2880859375, -9.00390625, -8.7197265625, -8.435546875, -8.1513671875, -7.8671875, -7.5830078125, -7.298828125, -7.0146484375, -6.73046875, -6.4462890625, -6.162109375, -5.8779296875, -5.59375, -5.3095703125, -5.025390625, -4.7412109375, -4.45703125, -4.1728515625, -3.888671875, -3.6044921875, -3.3203125, -3.0361328125, -2.751953125, -2.4677734375, -2.18359375, -1.8994140625, -1.615234375, -1.3310546875, -1.046875, -0.7626953125, -0.478515625, -0.1943359375, 0.08984375, 0.3740234375, 0.658203125, 0.9423828125, 1.2265625, 1.5107421875, 1.794921875, 2.0791015625, 2.36328125, 2.6474609375, 2.931640625, 3.2158203125, 3.5, 3.7841796875, 4.068359375, 4.3525390625, 4.63671875, 4.9208984375, 5.205078125, 5.4892578125, 5.7734375, 6.0576171875, 6.341796875, 6.6259765625, 6.91015625, 7.1943359375, 7.478515625, 7.7626953125, 8.046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 6.0, 13.0, 19.0, 26.0, 29.0, 40.0, 71.0, 66.0, 91.0, 104.0, 108.0, 93.0, 83.0, 56.0, 59.0, 31.0, 31.0, 25.0, 14.0, 10.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002105712890625, -0.002047628164291382, -0.0019895434379577637, -0.0019314587116241455, -0.0018733739852905273, -0.0018152892589569092, -0.001757204532623291, -0.0016991198062896729, -0.0016410350799560547, -0.0015829503536224365, -0.0015248656272888184, -0.0014667809009552002, -0.001408696174621582, -0.0013506114482879639, -0.0012925267219543457, -0.0012344419956207275, -0.0011763572692871094, -0.0011182725429534912, -0.001060187816619873, -0.0010021030902862549, -0.0009440183639526367, -0.0008859336376190186, -0.0008278489112854004, -0.0007697641849517822, -0.0007116794586181641, -0.0006535947322845459, -0.0005955100059509277, -0.0005374252796173096, -0.0004793405532836914, -0.00042125582695007324, -0.0003631711006164551, -0.0003050863742828369, -0.00024700164794921875, -0.00018891692161560059, -0.00013083219528198242, -7.274746894836426e-05, -1.4662742614746094e-05, 4.342198371887207e-05, 0.00010150671005249023, 0.0001595914363861084, 0.00021767616271972656, 0.0002757608890533447, 0.0003338456153869629, 0.00039193034172058105, 0.0004500150680541992, 0.0005080997943878174, 0.0005661845207214355, 0.0006242692470550537, 0.0006823539733886719, 0.00074043869972229, 0.0007985234260559082, 0.0008566081523895264, 0.0009146928787231445, 0.0009727776050567627, 0.0010308623313903809, 0.001088947057723999, 0.0011470317840576172, 0.0012051165103912354, 0.0012632012367248535, 0.0013212859630584717, 0.0013793706893920898, 0.001437455415725708, 0.0014955401420593262, 0.0015536248683929443, 0.0016117095947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 5.0, 8.0, 5.0, 8.0, 13.0, 24.0, 27.0, 34.0, 52.0, 78.0, 110.0, 223.0, 378.0, 854.0, 2113.0, 9537.0, 125627.0, 767934.0, 127877.0, 9627.0, 2170.0, 796.0, 446.0, 234.0, 149.0, 69.0, 59.0, 25.0, 16.0, 15.0, 18.0, 9.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.359375, -16.790283203125, -16.22119140625, -15.652099609375, -15.0830078125, -14.513916015625, -13.94482421875, -13.375732421875, -12.806640625, -12.237548828125, -11.66845703125, -11.099365234375, -10.5302734375, -9.961181640625, -9.39208984375, -8.822998046875, -8.25390625, -7.684814453125, -7.11572265625, -6.546630859375, -5.9775390625, -5.408447265625, -4.83935546875, -4.270263671875, -3.701171875, -3.132080078125, -2.56298828125, -1.993896484375, -1.4248046875, -0.855712890625, -0.28662109375, 0.282470703125, 0.8515625, 1.420654296875, 1.98974609375, 2.558837890625, 3.1279296875, 3.697021484375, 4.26611328125, 4.835205078125, 5.404296875, 5.973388671875, 6.54248046875, 7.111572265625, 7.6806640625, 8.249755859375, 8.81884765625, 9.387939453125, 9.95703125, 10.526123046875, 11.09521484375, 11.664306640625, 12.2333984375, 12.802490234375, 13.37158203125, 13.940673828125, 14.509765625, 15.078857421875, 15.64794921875, 16.217041015625, 16.7861328125, 17.355224609375, 17.92431640625, 18.493408203125, 19.0625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 6.0, 11.0, 11.0, 11.0, 15.0, 29.0, 35.0, 54.0, 62.0, 91.0, 74.0, 117.0, 84.0, 82.0, 68.0, 49.0, 46.0, 33.0, 18.0, 26.0, 13.0, 9.0, 7.0, 7.0, 9.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4296875, -9.126220703125, -8.82275390625, -8.519287109375, -8.2158203125, -7.912353515625, -7.60888671875, -7.305419921875, -7.001953125, -6.698486328125, -6.39501953125, -6.091552734375, -5.7880859375, -5.484619140625, -5.18115234375, -4.877685546875, -4.57421875, -4.270751953125, -3.96728515625, -3.663818359375, -3.3603515625, -3.056884765625, -2.75341796875, -2.449951171875, -2.146484375, -1.843017578125, -1.53955078125, -1.236083984375, -0.9326171875, -0.629150390625, -0.32568359375, -0.022216796875, 0.28125, 0.584716796875, 0.88818359375, 1.191650390625, 1.4951171875, 1.798583984375, 2.10205078125, 2.405517578125, 2.708984375, 3.012451171875, 3.31591796875, 3.619384765625, 3.9228515625, 4.226318359375, 4.52978515625, 4.833251953125, 5.13671875, 5.440185546875, 5.74365234375, 6.047119140625, 6.3505859375, 6.654052734375, 6.95751953125, 7.260986328125, 7.564453125, 7.867919921875, 8.17138671875, 8.474853515625, 8.7783203125, 9.081787109375, 9.38525390625, 9.688720703125, 9.9921875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 10.0, 32.0, 42.0, 82.0, 103.0, 142.0, 161.0, 163.0, 116.0, 77.0, 34.0, 22.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-240.88356018066406, -234.98587036132812, -229.08819580078125, -223.1905059814453, -217.29281616210938, -211.3951416015625, -205.49745178222656, -199.59976196289062, -193.70208740234375, -187.8043975830078, -181.90672302246094, -176.009033203125, -170.11134338378906, -164.21365356445312, -158.31597900390625, -152.4182891845703, -146.52059936523438, -140.62290954589844, -134.72523498535156, -128.82754516601562, -122.92985534667969, -117.03217315673828, -111.13449096679688, -105.23680114746094, -99.33911895751953, -93.44143676757812, -87.54374694824219, -81.64606475830078, -75.74838256835938, -69.85069274902344, -63.95301055908203, -58.05532455444336, -52.15763854980469, -46.259952545166016, -40.362266540527344, -34.46458435058594, -28.566898345947266, -22.669212341308594, -16.771530151367188, -10.873844146728516, -4.976158142089844, 0.9215269088745117, 6.819211959838867, 12.716896057128906, 18.614582061767578, 24.51226806640625, 30.409950256347656, 36.30763626098633, 42.205322265625, 48.10300827026367, 54.000694274902344, 59.89837646484375, 65.79606628417969, 71.6937484741211, 77.5914306640625, 83.48912048339844, 89.38680267333984, 95.28448486328125, 101.18217468261719, 107.0798568725586, 112.9775390625, 118.87522888183594, 124.77291107177734, 130.67059326171875, 136.5682830810547]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 5.0, 6.0, 16.0, 8.0, 19.0, 20.0, 21.0, 33.0, 41.0, 39.0, 28.0, 34.0, 34.0, 43.0, 38.0, 48.0, 37.0, 40.0, 42.0, 49.0, 40.0, 38.0, 33.0, 37.0, 26.0, 25.0, 22.0, 26.0, 24.0, 22.0, 20.0, 16.0, 16.0, 11.0, 2.0, 6.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.13624572753906, -86.36341094970703, -83.59058380126953, -80.8177490234375, -78.04491424560547, -75.27207946777344, -72.49925231933594, -69.7264175415039, -66.95358276367188, -64.18074798583984, -61.40791702270508, -58.63508605957031, -55.86225128173828, -53.089420318603516, -50.31658935546875, -47.54375457763672, -44.77092361450195, -41.99809265136719, -39.225257873535156, -36.45242691040039, -33.67959213256836, -30.906761169433594, -28.133928298950195, -25.361095428466797, -22.5882625579834, -19.8154296875, -17.0425968170166, -14.26976490020752, -11.496932029724121, -8.724099159240723, -5.951267242431641, -3.178434371948242, -0.40560150146484375, 2.3672311305999756, 5.140063762664795, 7.912896156311035, 10.685729026794434, 13.458561897277832, 16.231393814086914, 19.004226684570312, 21.77705955505371, 24.54989242553711, 27.322725296020508, 30.095558166503906, 32.86838912963867, 35.6412239074707, 38.41405487060547, 41.1868896484375, 43.959720611572266, 46.73255157470703, 49.50538635253906, 52.27821731567383, 55.05105209350586, 57.823883056640625, 60.596717834472656, 63.36954879760742, 66.14237976074219, 68.91521453857422, 71.68804168701172, 74.46087646484375, 77.23371124267578, 80.00654602050781, 82.77937316894531, 85.55220794677734, 88.32504272460938]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 7.0, 11.0, 10.0, 24.0, 22.0, 41.0, 76.0, 132.0, 242.0, 457.0, 1119.0, 3500.0, 16445.0, 741719.0, 3407528.0, 17047.0, 3650.0, 1150.0, 509.0, 238.0, 138.0, 76.0, 35.0, 36.0, 18.0, 20.0, 7.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5625, -50.97021484375, -49.3779296875, -47.78564453125, -46.193359375, -44.60107421875, -43.0087890625, -41.41650390625, -39.82421875, -38.23193359375, -36.6396484375, -35.04736328125, -33.455078125, -31.86279296875, -30.2705078125, -28.67822265625, -27.0859375, -25.49365234375, -23.9013671875, -22.30908203125, -20.716796875, -19.12451171875, -17.5322265625, -15.93994140625, -14.34765625, -12.75537109375, -11.1630859375, -9.57080078125, -7.978515625, -6.38623046875, -4.7939453125, -3.20166015625, -1.609375, -0.01708984375, 1.5751953125, 3.16748046875, 4.759765625, 6.35205078125, 7.9443359375, 9.53662109375, 11.12890625, 12.72119140625, 14.3134765625, 15.90576171875, 17.498046875, 19.09033203125, 20.6826171875, 22.27490234375, 23.8671875, 25.45947265625, 27.0517578125, 28.64404296875, 30.236328125, 31.82861328125, 33.4208984375, 35.01318359375, 36.60546875, 38.19775390625, 39.7900390625, 41.38232421875, 42.974609375, 44.56689453125, 46.1591796875, 47.75146484375, 49.34375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 12.0, 12.0, 18.0, 23.0, 21.0, 22.0, 29.0, 35.0, 34.0, 46.0, 42.0, 53.0, 41.0, 60.0, 51.0, 42.0, 44.0, 33.0, 40.0, 48.0, 38.0, 39.0, 35.0, 34.0, 27.0, 27.0, 14.0, 12.0, 12.0, 9.0, 11.0, 6.0, 4.0, 4.0, 2.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91796875, -3.783935546875, -3.64990234375, -3.515869140625, -3.3818359375, -3.247802734375, -3.11376953125, -2.979736328125, -2.845703125, -2.711669921875, -2.57763671875, -2.443603515625, -2.3095703125, -2.175537109375, -2.04150390625, -1.907470703125, -1.7734375, -1.639404296875, -1.50537109375, -1.371337890625, -1.2373046875, -1.103271484375, -0.96923828125, -0.835205078125, -0.701171875, -0.567138671875, -0.43310546875, -0.299072265625, -0.1650390625, -0.031005859375, 0.10302734375, 0.237060546875, 0.37109375, 0.505126953125, 0.63916015625, 0.773193359375, 0.9072265625, 1.041259765625, 1.17529296875, 1.309326171875, 1.443359375, 1.577392578125, 1.71142578125, 1.845458984375, 1.9794921875, 2.113525390625, 2.24755859375, 2.381591796875, 2.515625, 2.649658203125, 2.78369140625, 2.917724609375, 3.0517578125, 3.185791015625, 3.31982421875, 3.453857421875, 3.587890625, 3.721923828125, 3.85595703125, 3.989990234375, 4.1240234375, 4.258056640625, 4.39208984375, 4.526123046875, 4.66015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 16.0, 12.0, 13.0, 17.0, 26.0, 34.0, 38.0, 85.0, 114.0, 161.0, 208.0, 327.0, 454.0, 746.0, 1208.0, 2242.0, 4430.0, 9498.0, 26059.0, 104286.0, 3612036.0, 352300.0, 49885.0, 15682.0, 6571.0, 3183.0, 1684.0, 986.0, 642.0, 410.0, 274.0, 181.0, 134.0, 107.0, 70.0, 42.0, 48.0, 17.0, 15.0, 7.0, 15.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.5484619140625, -13.042236328125, -12.5360107421875, -12.02978515625, -11.5235595703125, -11.017333984375, -10.5111083984375, -10.0048828125, -9.4986572265625, -8.992431640625, -8.4862060546875, -7.97998046875, -7.4737548828125, -6.967529296875, -6.4613037109375, -5.955078125, -5.4488525390625, -4.942626953125, -4.4364013671875, -3.93017578125, -3.4239501953125, -2.917724609375, -2.4114990234375, -1.9052734375, -1.3990478515625, -0.892822265625, -0.3865966796875, 0.11962890625, 0.6258544921875, 1.132080078125, 1.6383056640625, 2.14453125, 2.6507568359375, 3.156982421875, 3.6632080078125, 4.16943359375, 4.6756591796875, 5.181884765625, 5.6881103515625, 6.1943359375, 6.7005615234375, 7.206787109375, 7.7130126953125, 8.21923828125, 8.7254638671875, 9.231689453125, 9.7379150390625, 10.244140625, 10.7503662109375, 11.256591796875, 11.7628173828125, 12.26904296875, 12.7752685546875, 13.281494140625, 13.7877197265625, 14.2939453125, 14.8001708984375, 15.306396484375, 15.8126220703125, 16.31884765625, 16.8250732421875, 17.331298828125, 17.8375244140625, 18.34375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 13.0, 12.0, 15.0, 30.0, 30.0, 69.0, 130.0, 267.0, 2630.0, 468.0, 170.0, 66.0, 49.0, 29.0, 18.0, 8.0, 13.0, 10.0, 9.0, 5.0, 3.0, 1.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.156341552734375, -4.04315185546875, -3.929962158203125, -3.8167724609375, -3.703582763671875, -3.59039306640625, -3.477203369140625, -3.364013671875, -3.250823974609375, -3.13763427734375, -3.024444580078125, -2.9112548828125, -2.798065185546875, -2.68487548828125, -2.571685791015625, -2.45849609375, -2.345306396484375, -2.23211669921875, -2.118927001953125, -2.0057373046875, -1.892547607421875, -1.77935791015625, -1.666168212890625, -1.552978515625, -1.439788818359375, -1.32659912109375, -1.213409423828125, -1.1002197265625, -0.987030029296875, -0.87384033203125, -0.760650634765625, -0.6474609375, -0.534271240234375, -0.42108154296875, -0.307891845703125, -0.1947021484375, -0.081512451171875, 0.03167724609375, 0.144866943359375, 0.258056640625, 0.371246337890625, 0.48443603515625, 0.597625732421875, 0.7108154296875, 0.824005126953125, 0.93719482421875, 1.050384521484375, 1.16357421875, 1.276763916015625, 1.38995361328125, 1.503143310546875, 1.6163330078125, 1.729522705078125, 1.84271240234375, 1.955902099609375, 2.069091796875, 2.182281494140625, 2.29547119140625, 2.408660888671875, 2.5218505859375, 2.635040283203125, 2.74822998046875, 2.861419677734375, 2.974609375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 9.0, 11.0, 11.0, 19.0, 16.0, 28.0, 28.0, 31.0, 50.0, 67.0, 72.0, 82.0, 72.0, 73.0, 79.0, 80.0, 65.0, 50.0, 39.0, 30.0, 28.0, 21.0, 13.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.861871719360352, -11.460796356201172, -11.059720993041992, -10.658645629882812, -10.257570266723633, -9.856494903564453, -9.45542049407959, -9.05434513092041, -8.65326976776123, -8.25219440460205, -7.851119041442871, -7.45004415512085, -7.04896879196167, -6.64789342880249, -6.246818542480469, -5.845743179321289, -5.444667816162109, -5.04359245300293, -4.64251708984375, -4.2414422035217285, -3.840366840362549, -3.439291477203369, -3.0382163524627686, -2.637141227722168, -2.2360658645629883, -1.8349906206130981, -1.433915376663208, -1.0328401327133179, -0.6317648887634277, -0.23068952560424805, 0.17038559913635254, 0.5714607238769531, 0.9725360870361328, 1.373611330986023, 1.774686574935913, 2.1757616996765137, 2.5768370628356934, 2.977912425994873, 3.3789875507354736, 3.780062675476074, 4.181138038635254, 4.582213401794434, 4.983288764953613, 5.384363651275635, 5.7854390144348145, 6.186514377593994, 6.587589263916016, 6.988664627075195, 7.389739990234375, 7.790815353393555, 8.191890716552734, 8.592966079711914, 8.994041442871094, 9.395116806030273, 9.796191215515137, 10.197266578674316, 10.598341941833496, 10.999417304992676, 11.400492668151855, 11.801568031311035, 12.202642440795898, 12.603717803955078, 13.004793167114258, 13.405868530273438, 13.806943893432617]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 8.0, 4.0, 5.0, 5.0, 9.0, 10.0, 7.0, 16.0, 16.0, 29.0, 27.0, 24.0, 34.0, 39.0, 37.0, 39.0, 31.0, 46.0, 48.0, 37.0, 56.0, 45.0, 53.0, 52.0, 54.0, 41.0, 39.0, 32.0, 24.0, 31.0, 26.0, 10.0, 10.0, 8.0, 15.0, 9.0, 6.0, 4.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.728302955627441, -8.423388481140137, -8.118474006652832, -7.813559055328369, -7.5086445808410645, -7.20373010635376, -6.898815155029297, -6.593900680541992, -6.2889862060546875, -5.984071731567383, -5.679157257080078, -5.374242305755615, -5.0693278312683105, -4.764413356781006, -4.459498405456543, -4.154583930969238, -3.8496694564819336, -3.544754981994629, -3.239840269088745, -2.9349255561828613, -2.6300110816955566, -2.325096607208252, -2.020181894302368, -1.7152671813964844, -1.4103527069091797, -1.1054381132125854, -0.8005235195159912, -0.495608925819397, -0.19069433212280273, 0.1142202615737915, 0.41913485527038574, 0.7240495681762695, 1.0289630889892578, 1.333877682685852, 1.6387922763824463, 1.9437068700790405, 2.2486214637756348, 2.5535359382629395, 2.8584506511688232, 3.163365364074707, 3.4682798385620117, 3.7731943130493164, 4.078108787536621, 4.383023738861084, 4.687938213348389, 4.992852687835693, 5.297767639160156, 5.602682113647461, 5.907596588134766, 6.21251106262207, 6.517425537109375, 6.822340488433838, 7.127254962921143, 7.432169437408447, 7.73708438873291, 8.041998863220215, 8.34691333770752, 8.651827812194824, 8.956742286682129, 9.261656761169434, 9.566572189331055, 9.87148666381836, 10.176401138305664, 10.481315612792969, 10.786230087280273]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 13.0, 12.0, 18.0, 32.0, 39.0, 58.0, 103.0, 136.0, 213.0, 411.0, 654.0, 1123.0, 2011.0, 4014.0, 7756.0, 16571.0, 35815.0, 77533.0, 153954.0, 239985.0, 231307.0, 142797.0, 70560.0, 32981.0, 15201.0, 7037.0, 3635.0, 1935.0, 1070.0, 608.0, 316.0, 229.0, 139.0, 89.0, 66.0, 45.0, 23.0, 17.0, 12.0, 7.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3551025390625, -10.975830078125, -10.5965576171875, -10.21728515625, -9.8380126953125, -9.458740234375, -9.0794677734375, -8.7001953125, -8.3209228515625, -7.941650390625, -7.5623779296875, -7.18310546875, -6.8038330078125, -6.424560546875, -6.0452880859375, -5.666015625, -5.2867431640625, -4.907470703125, -4.5281982421875, -4.14892578125, -3.7696533203125, -3.390380859375, -3.0111083984375, -2.6318359375, -2.2525634765625, -1.873291015625, -1.4940185546875, -1.11474609375, -0.7354736328125, -0.356201171875, 0.0230712890625, 0.40234375, 0.7816162109375, 1.160888671875, 1.5401611328125, 1.91943359375, 2.2987060546875, 2.677978515625, 3.0572509765625, 3.4365234375, 3.8157958984375, 4.195068359375, 4.5743408203125, 4.95361328125, 5.3328857421875, 5.712158203125, 6.0914306640625, 6.470703125, 6.8499755859375, 7.229248046875, 7.6085205078125, 7.98779296875, 8.3670654296875, 8.746337890625, 9.1256103515625, 9.5048828125, 9.8841552734375, 10.263427734375, 10.6427001953125, 11.02197265625, 11.4012451171875, 11.780517578125, 12.1597900390625, 12.5390625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 9.0, 7.0, 6.0, 10.0, 14.0, 19.0, 23.0, 19.0, 26.0, 16.0, 41.0, 37.0, 41.0, 47.0, 46.0, 46.0, 44.0, 53.0, 35.0, 48.0, 52.0, 38.0, 41.0, 36.0, 41.0, 29.0, 37.0, 29.0, 28.0, 19.0, 11.0, 7.0, 10.0, 5.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.27239990234375, -4.1307373046875, -3.98907470703125, -3.847412109375, -3.70574951171875, -3.5640869140625, -3.42242431640625, -3.28076171875, -3.13909912109375, -2.9974365234375, -2.85577392578125, -2.714111328125, -2.57244873046875, -2.4307861328125, -2.28912353515625, -2.1474609375, -2.00579833984375, -1.8641357421875, -1.72247314453125, -1.580810546875, -1.43914794921875, -1.2974853515625, -1.15582275390625, -1.01416015625, -0.87249755859375, -0.7308349609375, -0.58917236328125, -0.447509765625, -0.30584716796875, -0.1641845703125, -0.02252197265625, 0.119140625, 0.26080322265625, 0.4024658203125, 0.54412841796875, 0.685791015625, 0.82745361328125, 0.9691162109375, 1.11077880859375, 1.25244140625, 1.39410400390625, 1.5357666015625, 1.67742919921875, 1.819091796875, 1.96075439453125, 2.1024169921875, 2.24407958984375, 2.3857421875, 2.52740478515625, 2.6690673828125, 2.81072998046875, 2.952392578125, 3.09405517578125, 3.2357177734375, 3.37738037109375, 3.51904296875, 3.66070556640625, 3.8023681640625, 3.94403076171875, 4.085693359375, 4.22735595703125, 4.3690185546875, 4.51068115234375, 4.65234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 9.0, 8.0, 22.0, 13.0, 18.0, 30.0, 50.0, 65.0, 73.0, 107.0, 140.0, 214.0, 240.0, 319.0, 509.0, 792.0, 1201.0, 2366.0, 9063.0, 74688.0, 631130.0, 290679.0, 27531.0, 4454.0, 1621.0, 881.0, 638.0, 458.0, 334.0, 233.0, 163.0, 134.0, 89.0, 71.0, 54.0, 33.0, 29.0, 27.0, 15.0, 13.0, 5.0, 7.0, 7.0, 7.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.96875, -28.027587890625, -27.08642578125, -26.145263671875, -25.2041015625, -24.262939453125, -23.32177734375, -22.380615234375, -21.439453125, -20.498291015625, -19.55712890625, -18.615966796875, -17.6748046875, -16.733642578125, -15.79248046875, -14.851318359375, -13.91015625, -12.968994140625, -12.02783203125, -11.086669921875, -10.1455078125, -9.204345703125, -8.26318359375, -7.322021484375, -6.380859375, -5.439697265625, -4.49853515625, -3.557373046875, -2.6162109375, -1.675048828125, -0.73388671875, 0.207275390625, 1.1484375, 2.089599609375, 3.03076171875, 3.971923828125, 4.9130859375, 5.854248046875, 6.79541015625, 7.736572265625, 8.677734375, 9.618896484375, 10.56005859375, 11.501220703125, 12.4423828125, 13.383544921875, 14.32470703125, 15.265869140625, 16.20703125, 17.148193359375, 18.08935546875, 19.030517578125, 19.9716796875, 20.912841796875, 21.85400390625, 22.795166015625, 23.736328125, 24.677490234375, 25.61865234375, 26.559814453125, 27.5009765625, 28.442138671875, 29.38330078125, 30.324462890625, 31.265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 10.0, 19.0, 16.0, 22.0, 24.0, 30.0, 45.0, 50.0, 57.0, 60.0, 65.0, 68.0, 68.0, 67.0, 56.0, 63.0, 58.0, 46.0, 26.0, 37.0, 32.0, 27.0, 21.0, 10.0, 9.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.59375, -38.689697265625, -37.78564453125, -36.881591796875, -35.9775390625, -35.073486328125, -34.16943359375, -33.265380859375, -32.361328125, -31.457275390625, -30.55322265625, -29.649169921875, -28.7451171875, -27.841064453125, -26.93701171875, -26.032958984375, -25.12890625, -24.224853515625, -23.32080078125, -22.416748046875, -21.5126953125, -20.608642578125, -19.70458984375, -18.800537109375, -17.896484375, -16.992431640625, -16.08837890625, -15.184326171875, -14.2802734375, -13.376220703125, -12.47216796875, -11.568115234375, -10.6640625, -9.760009765625, -8.85595703125, -7.951904296875, -7.0478515625, -6.143798828125, -5.23974609375, -4.335693359375, -3.431640625, -2.527587890625, -1.62353515625, -0.719482421875, 0.1845703125, 1.088623046875, 1.99267578125, 2.896728515625, 3.80078125, 4.704833984375, 5.60888671875, 6.512939453125, 7.4169921875, 8.321044921875, 9.22509765625, 10.129150390625, 11.033203125, 11.937255859375, 12.84130859375, 13.745361328125, 14.6494140625, 15.553466796875, 16.45751953125, 17.361572265625, 18.265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 4.0, 8.0, 17.0, 19.0, 32.0, 30.0, 46.0, 64.0, 118.0, 172.0, 299.0, 549.0, 1125.0, 2232.0, 6220.0, 20764.0, 106445.0, 574049.0, 274360.0, 44071.0, 10883.0, 3623.0, 1571.0, 738.0, 396.0, 237.0, 146.0, 95.0, 61.0, 50.0, 38.0, 16.0, 14.0, 12.0, 9.0, 9.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.96875, -11.56640625, -11.1640625, -10.76171875, -10.359375, -9.95703125, -9.5546875, -9.15234375, -8.75, -8.34765625, -7.9453125, -7.54296875, -7.140625, -6.73828125, -6.3359375, -5.93359375, -5.53125, -5.12890625, -4.7265625, -4.32421875, -3.921875, -3.51953125, -3.1171875, -2.71484375, -2.3125, -1.91015625, -1.5078125, -1.10546875, -0.703125, -0.30078125, 0.1015625, 0.50390625, 0.90625, 1.30859375, 1.7109375, 2.11328125, 2.515625, 2.91796875, 3.3203125, 3.72265625, 4.125, 4.52734375, 4.9296875, 5.33203125, 5.734375, 6.13671875, 6.5390625, 6.94140625, 7.34375, 7.74609375, 8.1484375, 8.55078125, 8.953125, 9.35546875, 9.7578125, 10.16015625, 10.5625, 10.96484375, 11.3671875, 11.76953125, 12.171875, 12.57421875, 12.9765625, 13.37890625, 13.78125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 10.0, 8.0, 20.0, 19.0, 29.0, 43.0, 52.0, 54.0, 86.0, 87.0, 106.0, 95.0, 87.0, 89.0, 53.0, 39.0, 39.0, 25.0, 10.0, 8.0, 5.0, 3.0, 2.0, 7.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00232696533203125, -0.0022652000188827515, -0.002203434705734253, -0.0021416693925857544, -0.002079904079437256, -0.0020181387662887573, -0.001956373453140259, -0.0018946081399917603, -0.0018328428268432617, -0.0017710775136947632, -0.0017093122005462646, -0.0016475468873977661, -0.0015857815742492676, -0.001524016261100769, -0.0014622509479522705, -0.001400485634803772, -0.0013387203216552734, -0.001276955008506775, -0.0012151896953582764, -0.0011534243822097778, -0.0010916590690612793, -0.0010298937559127808, -0.0009681284427642822, -0.0009063631296157837, -0.0008445978164672852, -0.0007828325033187866, -0.0007210671901702881, -0.0006593018770217896, -0.000597536563873291, -0.0005357712507247925, -0.00047400593757629395, -0.0004122406244277954, -0.0003504753112792969, -0.00028870999813079834, -0.0002269446849822998, -0.00016517937183380127, -0.00010341405868530273, -4.16487455368042e-05, 2.0116567611694336e-05, 8.188188076019287e-05, 0.0001436471939086914, 0.00020541250705718994, 0.0002671778202056885, 0.000328943133354187, 0.00039070844650268555, 0.0004524737596511841, 0.0005142390727996826, 0.0005760043859481812, 0.0006377696990966797, 0.0006995350122451782, 0.0007613003253936768, 0.0008230656385421753, 0.0008848309516906738, 0.0009465962648391724, 0.001008361577987671, 0.0010701268911361694, 0.001131892204284668, 0.0011936575174331665, 0.001255422830581665, 0.0013171881437301636, 0.0013789534568786621, 0.0014407187700271606, 0.0015024840831756592, 0.0015642493963241577, 0.0016260147094726562]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 14.0, 13.0, 16.0, 32.0, 55.0, 94.0, 240.0, 500.0, 1552.0, 7867.0, 184862.0, 826295.0, 22564.0, 2976.0, 817.0, 302.0, 160.0, 85.0, 39.0, 21.0, 10.0, 10.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.40625, -33.456298828125, -32.50634765625, -31.556396484375, -30.6064453125, -29.656494140625, -28.70654296875, -27.756591796875, -26.806640625, -25.856689453125, -24.90673828125, -23.956787109375, -23.0068359375, -22.056884765625, -21.10693359375, -20.156982421875, -19.20703125, -18.257080078125, -17.30712890625, -16.357177734375, -15.4072265625, -14.457275390625, -13.50732421875, -12.557373046875, -11.607421875, -10.657470703125, -9.70751953125, -8.757568359375, -7.8076171875, -6.857666015625, -5.90771484375, -4.957763671875, -4.0078125, -3.057861328125, -2.10791015625, -1.157958984375, -0.2080078125, 0.741943359375, 1.69189453125, 2.641845703125, 3.591796875, 4.541748046875, 5.49169921875, 6.441650390625, 7.3916015625, 8.341552734375, 9.29150390625, 10.241455078125, 11.19140625, 12.141357421875, 13.09130859375, 14.041259765625, 14.9912109375, 15.941162109375, 16.89111328125, 17.841064453125, 18.791015625, 19.740966796875, 20.69091796875, 21.640869140625, 22.5908203125, 23.540771484375, 24.49072265625, 25.440673828125, 26.390625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 11.0, 12.0, 27.0, 43.0, 59.0, 72.0, 103.0, 134.0, 131.0, 128.0, 92.0, 55.0, 44.0, 22.0, 16.0, 17.0, 15.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.78125, -13.210205078125, -12.63916015625, -12.068115234375, -11.4970703125, -10.926025390625, -10.35498046875, -9.783935546875, -9.212890625, -8.641845703125, -8.07080078125, -7.499755859375, -6.9287109375, -6.357666015625, -5.78662109375, -5.215576171875, -4.64453125, -4.073486328125, -3.50244140625, -2.931396484375, -2.3603515625, -1.789306640625, -1.21826171875, -0.647216796875, -0.076171875, 0.494873046875, 1.06591796875, 1.636962890625, 2.2080078125, 2.779052734375, 3.35009765625, 3.921142578125, 4.4921875, 5.063232421875, 5.63427734375, 6.205322265625, 6.7763671875, 7.347412109375, 7.91845703125, 8.489501953125, 9.060546875, 9.631591796875, 10.20263671875, 10.773681640625, 11.3447265625, 11.915771484375, 12.48681640625, 13.057861328125, 13.62890625, 14.199951171875, 14.77099609375, 15.342041015625, 15.9130859375, 16.484130859375, 17.05517578125, 17.626220703125, 18.197265625, 18.768310546875, 19.33935546875, 19.910400390625, 20.4814453125, 21.052490234375, 21.62353515625, 22.194580078125, 22.765625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 36.0, 165.0, 378.0, 283.0, 105.0, 26.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-695.87353515625, -679.59033203125, -663.3070678710938, -647.0238647460938, -630.7406005859375, -614.4573974609375, -598.1741943359375, -581.8909301757812, -565.6077270507812, -549.3245239257812, -533.041259765625, -516.758056640625, -500.4748229980469, -484.19158935546875, -467.90838623046875, -451.6251525878906, -435.3419189453125, -419.0586853027344, -402.77545166015625, -386.49224853515625, -370.2090148925781, -353.92578125, -337.642578125, -321.3593444824219, -305.07611083984375, -288.7928771972656, -272.5096435546875, -256.2264404296875, -239.94320678710938, -223.65997314453125, -207.3767547607422, -191.09353637695312, -174.81024169921875, -158.52700805664062, -142.24378967285156, -125.96056365966797, -109.67733764648438, -93.39411163330078, -77.11088562011719, -60.827659606933594, -44.54443359375, -28.261207580566406, -11.977981567382812, 4.305244445800781, 20.588470458984375, 36.87169647216797, 53.15492248535156, 69.43814849853516, 85.72137451171875, 102.00460052490234, 118.28782653808594, 134.571044921875, 150.85427856445312, 167.13751220703125, 183.4207305908203, 199.70394897460938, 215.9871826171875, 232.27041625976562, 248.5536346435547, 264.83685302734375, 281.1200866699219, 297.4033203125, 313.6865234375, 329.9697570800781, 346.25299072265625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 4.0, 4.0, 9.0, 10.0, 6.0, 15.0, 12.0, 13.0, 22.0, 16.0, 25.0, 25.0, 52.0, 29.0, 42.0, 41.0, 47.0, 45.0, 48.0, 49.0, 67.0, 34.0, 35.0, 45.0, 42.0, 41.0, 27.0, 32.0, 23.0, 16.0, 30.0, 12.0, 12.0, 13.0, 11.0, 6.0, 10.0, 9.0, 6.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-104.74134826660156, -101.6285171508789, -98.51568603515625, -95.40284729003906, -92.2900161743164, -89.17718505859375, -86.06434631347656, -82.9515151977539, -79.83868408203125, -76.7258529663086, -73.61302185058594, -70.50018310546875, -67.3873519897461, -64.27452087402344, -61.161685943603516, -58.048851013183594, -54.93601989746094, -51.82318878173828, -48.71035385131836, -45.59751892089844, -42.48468780517578, -39.371856689453125, -36.2590217590332, -33.14618682861328, -30.033355712890625, -26.920522689819336, -23.807689666748047, -20.694856643676758, -17.58202362060547, -14.46919059753418, -11.35635757446289, -8.243524551391602, -5.1306915283203125, -2.0178585052490234, 1.0949745178222656, 4.207807540893555, 7.320640563964844, 10.433473587036133, 13.546306610107422, 16.65913963317871, 19.77197265625, 22.88480567932129, 25.997638702392578, 29.110471725463867, 32.223304748535156, 35.33613586425781, 38.448970794677734, 41.561805725097656, 44.67463684082031, 47.78746795654297, 50.90030288696289, 54.01313781738281, 57.12596893310547, 60.238800048828125, 63.35163497924805, 66.46446990966797, 69.57730102539062, 72.69013214111328, 75.80296325683594, 78.91580200195312, 82.02863311767578, 85.14146423339844, 88.25430297851562, 91.36713409423828, 94.47996520996094]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 10.0, 10.0, 9.0, 21.0, 35.0, 41.0, 60.0, 105.0, 210.0, 361.0, 784.0, 1935.0, 5577.0, 24944.0, 465784.0, 3650697.0, 32645.0, 6889.0, 2220.0, 914.0, 388.0, 244.0, 132.0, 72.0, 62.0, 46.0, 21.0, 15.0, 12.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.125, -33.02685546875, -31.9287109375, -30.83056640625, -29.732421875, -28.63427734375, -27.5361328125, -26.43798828125, -25.33984375, -24.24169921875, -23.1435546875, -22.04541015625, -20.947265625, -19.84912109375, -18.7509765625, -17.65283203125, -16.5546875, -15.45654296875, -14.3583984375, -13.26025390625, -12.162109375, -11.06396484375, -9.9658203125, -8.86767578125, -7.76953125, -6.67138671875, -5.5732421875, -4.47509765625, -3.376953125, -2.27880859375, -1.1806640625, -0.08251953125, 1.015625, 2.11376953125, 3.2119140625, 4.31005859375, 5.408203125, 6.50634765625, 7.6044921875, 8.70263671875, 9.80078125, 10.89892578125, 11.9970703125, 13.09521484375, 14.193359375, 15.29150390625, 16.3896484375, 17.48779296875, 18.5859375, 19.68408203125, 20.7822265625, 21.88037109375, 22.978515625, 24.07666015625, 25.1748046875, 26.27294921875, 27.37109375, 28.46923828125, 29.5673828125, 30.66552734375, 31.763671875, 32.86181640625, 33.9599609375, 35.05810546875, 36.15625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 3.0, 7.0, 10.0, 14.0, 8.0, 14.0, 13.0, 17.0, 19.0, 31.0, 41.0, 40.0, 32.0, 40.0, 35.0, 50.0, 60.0, 51.0, 51.0, 43.0, 47.0, 43.0, 39.0, 42.0, 37.0, 35.0, 28.0, 27.0, 22.0, 18.0, 9.0, 8.0, 12.0, 14.0, 10.0, 4.0, 4.0, 2.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.978515625, -3.843414306640625, -3.70831298828125, -3.573211669921875, -3.4381103515625, -3.303009033203125, -3.16790771484375, -3.032806396484375, -2.897705078125, -2.762603759765625, -2.62750244140625, -2.492401123046875, -2.3572998046875, -2.222198486328125, -2.08709716796875, -1.951995849609375, -1.81689453125, -1.681793212890625, -1.54669189453125, -1.411590576171875, -1.2764892578125, -1.141387939453125, -1.00628662109375, -0.871185302734375, -0.736083984375, -0.600982666015625, -0.46588134765625, -0.330780029296875, -0.1956787109375, -0.060577392578125, 0.07452392578125, 0.209625244140625, 0.3447265625, 0.479827880859375, 0.61492919921875, 0.750030517578125, 0.8851318359375, 1.020233154296875, 1.15533447265625, 1.290435791015625, 1.425537109375, 1.560638427734375, 1.69573974609375, 1.830841064453125, 1.9659423828125, 2.101043701171875, 2.23614501953125, 2.371246337890625, 2.50634765625, 2.641448974609375, 2.77655029296875, 2.911651611328125, 3.0467529296875, 3.181854248046875, 3.31695556640625, 3.452056884765625, 3.587158203125, 3.722259521484375, 3.85736083984375, 3.992462158203125, 4.1275634765625, 4.262664794921875, 4.39776611328125, 4.532867431640625, 4.66796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 6.0, 17.0, 27.0, 31.0, 47.0, 65.0, 99.0, 156.0, 210.0, 277.0, 427.0, 660.0, 996.0, 1423.0, 2486.0, 4067.0, 7324.0, 15124.0, 38313.0, 141681.0, 3428633.0, 433769.0, 69858.0, 23873.0, 10347.0, 5655.0, 3080.0, 1902.0, 1228.0, 872.0, 478.0, 341.0, 217.0, 174.0, 138.0, 84.0, 60.0, 34.0, 29.0, 23.0, 13.0, 11.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -11.9818115234375, -11.565185546875, -11.1485595703125, -10.73193359375, -10.3153076171875, -9.898681640625, -9.4820556640625, -9.0654296875, -8.6488037109375, -8.232177734375, -7.8155517578125, -7.39892578125, -6.9822998046875, -6.565673828125, -6.1490478515625, -5.732421875, -5.3157958984375, -4.899169921875, -4.4825439453125, -4.06591796875, -3.6492919921875, -3.232666015625, -2.8160400390625, -2.3994140625, -1.9827880859375, -1.566162109375, -1.1495361328125, -0.73291015625, -0.3162841796875, 0.100341796875, 0.5169677734375, 0.93359375, 1.3502197265625, 1.766845703125, 2.1834716796875, 2.60009765625, 3.0167236328125, 3.433349609375, 3.8499755859375, 4.2666015625, 4.6832275390625, 5.099853515625, 5.5164794921875, 5.93310546875, 6.3497314453125, 6.766357421875, 7.1829833984375, 7.599609375, 8.0162353515625, 8.432861328125, 8.8494873046875, 9.26611328125, 9.6827392578125, 10.099365234375, 10.5159912109375, 10.9326171875, 11.3492431640625, 11.765869140625, 12.1824951171875, 12.59912109375, 13.0157470703125, 13.432373046875, 13.8489990234375, 14.265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 6.0, 11.0, 11.0, 14.0, 23.0, 39.0, 46.0, 75.0, 151.0, 323.0, 2387.0, 478.0, 199.0, 95.0, 58.0, 41.0, 26.0, 16.0, 13.0, 8.0, 10.0, 4.0, 8.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.01446533203125, -2.8922119140625, -2.76995849609375, -2.647705078125, -2.52545166015625, -2.4031982421875, -2.28094482421875, -2.15869140625, -2.03643798828125, -1.9141845703125, -1.79193115234375, -1.669677734375, -1.54742431640625, -1.4251708984375, -1.30291748046875, -1.1806640625, -1.05841064453125, -0.9361572265625, -0.81390380859375, -0.691650390625, -0.56939697265625, -0.4471435546875, -0.32489013671875, -0.20263671875, -0.08038330078125, 0.0418701171875, 0.16412353515625, 0.286376953125, 0.40863037109375, 0.5308837890625, 0.65313720703125, 0.775390625, 0.89764404296875, 1.0198974609375, 1.14215087890625, 1.264404296875, 1.38665771484375, 1.5089111328125, 1.63116455078125, 1.75341796875, 1.87567138671875, 1.9979248046875, 2.12017822265625, 2.242431640625, 2.36468505859375, 2.4869384765625, 2.60919189453125, 2.7314453125, 2.85369873046875, 2.9759521484375, 3.09820556640625, 3.220458984375, 3.34271240234375, 3.4649658203125, 3.58721923828125, 3.70947265625, 3.83172607421875, 3.9539794921875, 4.07623291015625, 4.198486328125, 4.32073974609375, 4.4429931640625, 4.56524658203125, 4.6875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 36.0, 125.0, 266.0, 280.0, 190.0, 66.0, 24.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.20384216308594, -31.24742317199707, -29.291004180908203, -27.334583282470703, -25.378164291381836, -23.42174530029297, -21.46532440185547, -19.5089054107666, -17.552486419677734, -15.596067428588867, -13.639647483825684, -11.6832275390625, -9.726808547973633, -7.770389556884766, -5.813969612121582, -3.8575496673583984, -1.9011306762695312, 0.05528879165649414, 2.0117082595825195, 3.968127727508545, 5.92454719543457, 7.8809661865234375, 9.837386131286621, 11.793806076049805, 13.750225067138672, 15.706644058227539, 17.663063049316406, 19.619483947753906, 21.575902938842773, 23.53232192993164, 25.48874282836914, 27.445161819458008, 29.401580810546875, 31.357999801635742, 33.31441879272461, 35.27083969116211, 37.227256774902344, 39.183677673339844, 41.140098571777344, 43.096519470214844, 45.05293655395508, 47.00935745239258, 48.96577453613281, 50.92219543457031, 52.87861633300781, 54.83503341674805, 56.79145431518555, 58.74787139892578, 60.70429229736328, 62.66071319580078, 64.61713409423828, 66.57354736328125, 68.52996826171875, 70.48638916015625, 72.44281005859375, 74.39923095703125, 76.35565185546875, 78.31207275390625, 80.26849365234375, 82.22490692138672, 84.18132781982422, 86.13774871826172, 88.09416961669922, 90.05059051513672, 92.00700378417969]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 1.0, 1.0, 6.0, 4.0, 8.0, 7.0, 10.0, 9.0, 19.0, 19.0, 20.0, 23.0, 21.0, 33.0, 31.0, 27.0, 37.0, 29.0, 35.0, 43.0, 42.0, 30.0, 47.0, 44.0, 46.0, 49.0, 34.0, 32.0, 22.0, 35.0, 31.0, 17.0, 38.0, 21.0, 19.0, 19.0, 13.0, 16.0, 16.0, 11.0, 9.0, 7.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.307706832885742, -10.970895767211914, -10.634084701538086, -10.297273635864258, -9.960461616516113, -9.623650550842285, -9.286839485168457, -8.950028419494629, -8.613216400146484, -8.276405334472656, -7.93959379196167, -7.602782726287842, -7.2659711837768555, -6.929160118103027, -6.592349052429199, -6.255537986755371, -5.918726921081543, -5.581915855407715, -5.2451043128967285, -4.9082932472229, -4.571481704711914, -4.234670639038086, -3.897859573364258, -3.5610482692718506, -3.2242369651794434, -2.887425661087036, -2.550614356994629, -2.213803291320801, -1.8769919872283936, -1.5401806831359863, -1.2033696174621582, -0.866558313369751, -0.5297470092773438, -0.1929357647895813, 0.14387547969818115, 0.48068666458129883, 0.817497968673706, 1.1543092727661133, 1.4911203384399414, 1.8279316425323486, 2.164742946624756, 2.501554250717163, 2.8383655548095703, 3.1751766204833984, 3.5119879245758057, 3.848799228668213, 4.185610294342041, 4.522421836853027, 4.8592329025268555, 5.196043968200684, 5.53285551071167, 5.869666576385498, 6.206478118896484, 6.5432891845703125, 6.880100250244141, 7.216911315917969, 7.553722858428955, 7.890533924102783, 8.22734546661377, 8.564156532287598, 8.900967597961426, 9.23777961730957, 9.574590682983398, 9.911401748657227, 10.248212814331055]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 8.0, 16.0, 26.0, 39.0, 39.0, 73.0, 107.0, 170.0, 249.0, 385.0, 564.0, 959.0, 1681.0, 2932.0, 5498.0, 10842.0, 22879.0, 49054.0, 103132.0, 191439.0, 251251.0, 198055.0, 108452.0, 51971.0, 24042.0, 11424.0, 5673.0, 3116.0, 1691.0, 1032.0, 662.0, 348.0, 260.0, 153.0, 108.0, 79.0, 50.0, 31.0, 18.0, 5.0, 3.0, 13.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.390625, -9.110595703125, -8.83056640625, -8.550537109375, -8.2705078125, -7.990478515625, -7.71044921875, -7.430419921875, -7.150390625, -6.870361328125, -6.59033203125, -6.310302734375, -6.0302734375, -5.750244140625, -5.47021484375, -5.190185546875, -4.91015625, -4.630126953125, -4.35009765625, -4.070068359375, -3.7900390625, -3.510009765625, -3.22998046875, -2.949951171875, -2.669921875, -2.389892578125, -2.10986328125, -1.829833984375, -1.5498046875, -1.269775390625, -0.98974609375, -0.709716796875, -0.4296875, -0.149658203125, 0.13037109375, 0.410400390625, 0.6904296875, 0.970458984375, 1.25048828125, 1.530517578125, 1.810546875, 2.090576171875, 2.37060546875, 2.650634765625, 2.9306640625, 3.210693359375, 3.49072265625, 3.770751953125, 4.05078125, 4.330810546875, 4.61083984375, 4.890869140625, 5.1708984375, 5.450927734375, 5.73095703125, 6.010986328125, 6.291015625, 6.571044921875, 6.85107421875, 7.131103515625, 7.4111328125, 7.691162109375, 7.97119140625, 8.251220703125, 8.53125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 9.0, 12.0, 12.0, 16.0, 16.0, 17.0, 24.0, 23.0, 34.0, 31.0, 33.0, 38.0, 35.0, 32.0, 50.0, 55.0, 56.0, 59.0, 39.0, 38.0, 49.0, 34.0, 35.0, 37.0, 28.0, 28.0, 21.0, 16.0, 16.0, 16.0, 12.0, 16.0, 11.0, 8.0, 6.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.994140625, -3.856597900390625, -3.71905517578125, -3.581512451171875, -3.4439697265625, -3.306427001953125, -3.16888427734375, -3.031341552734375, -2.893798828125, -2.756256103515625, -2.61871337890625, -2.481170654296875, -2.3436279296875, -2.206085205078125, -2.06854248046875, -1.930999755859375, -1.79345703125, -1.655914306640625, -1.51837158203125, -1.380828857421875, -1.2432861328125, -1.105743408203125, -0.96820068359375, -0.830657958984375, -0.693115234375, -0.555572509765625, -0.41802978515625, -0.280487060546875, -0.1429443359375, -0.005401611328125, 0.13214111328125, 0.269683837890625, 0.4072265625, 0.544769287109375, 0.68231201171875, 0.819854736328125, 0.9573974609375, 1.094940185546875, 1.23248291015625, 1.370025634765625, 1.507568359375, 1.645111083984375, 1.78265380859375, 1.920196533203125, 2.0577392578125, 2.195281982421875, 2.33282470703125, 2.470367431640625, 2.60791015625, 2.745452880859375, 2.88299560546875, 3.020538330078125, 3.1580810546875, 3.295623779296875, 3.43316650390625, 3.570709228515625, 3.708251953125, 3.845794677734375, 3.98333740234375, 4.120880126953125, 4.2584228515625, 4.395965576171875, 4.53350830078125, 4.671051025390625, 4.80859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 6.0, 16.0, 11.0, 14.0, 30.0, 29.0, 39.0, 69.0, 77.0, 107.0, 146.0, 196.0, 283.0, 333.0, 484.0, 697.0, 1107.0, 1845.0, 5059.0, 31541.0, 387526.0, 557290.0, 48966.0, 6628.0, 2050.0, 1191.0, 719.0, 532.0, 382.0, 273.0, 231.0, 174.0, 136.0, 98.0, 69.0, 58.0, 32.0, 28.0, 16.0, 17.0, 13.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-23.84375, -23.076904296875, -22.31005859375, -21.543212890625, -20.7763671875, -20.009521484375, -19.24267578125, -18.475830078125, -17.708984375, -16.942138671875, -16.17529296875, -15.408447265625, -14.6416015625, -13.874755859375, -13.10791015625, -12.341064453125, -11.57421875, -10.807373046875, -10.04052734375, -9.273681640625, -8.5068359375, -7.739990234375, -6.97314453125, -6.206298828125, -5.439453125, -4.672607421875, -3.90576171875, -3.138916015625, -2.3720703125, -1.605224609375, -0.83837890625, -0.071533203125, 0.6953125, 1.462158203125, 2.22900390625, 2.995849609375, 3.7626953125, 4.529541015625, 5.29638671875, 6.063232421875, 6.830078125, 7.596923828125, 8.36376953125, 9.130615234375, 9.8974609375, 10.664306640625, 11.43115234375, 12.197998046875, 12.96484375, 13.731689453125, 14.49853515625, 15.265380859375, 16.0322265625, 16.799072265625, 17.56591796875, 18.332763671875, 19.099609375, 19.866455078125, 20.63330078125, 21.400146484375, 22.1669921875, 22.933837890625, 23.70068359375, 24.467529296875, 25.234375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 6.0, 11.0, 14.0, 14.0, 11.0, 17.0, 17.0, 14.0, 23.0, 19.0, 24.0, 32.0, 42.0, 34.0, 32.0, 42.0, 48.0, 41.0, 49.0, 39.0, 57.0, 40.0, 44.0, 40.0, 38.0, 28.0, 37.0, 26.0, 23.0, 20.0, 16.0, 20.0, 13.0, 13.0, 7.0, 5.0, 4.0, 5.0, 6.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.4375, -19.834228515625, -19.23095703125, -18.627685546875, -18.0244140625, -17.421142578125, -16.81787109375, -16.214599609375, -15.611328125, -15.008056640625, -14.40478515625, -13.801513671875, -13.1982421875, -12.594970703125, -11.99169921875, -11.388427734375, -10.78515625, -10.181884765625, -9.57861328125, -8.975341796875, -8.3720703125, -7.768798828125, -7.16552734375, -6.562255859375, -5.958984375, -5.355712890625, -4.75244140625, -4.149169921875, -3.5458984375, -2.942626953125, -2.33935546875, -1.736083984375, -1.1328125, -0.529541015625, 0.07373046875, 0.677001953125, 1.2802734375, 1.883544921875, 2.48681640625, 3.090087890625, 3.693359375, 4.296630859375, 4.89990234375, 5.503173828125, 6.1064453125, 6.709716796875, 7.31298828125, 7.916259765625, 8.51953125, 9.122802734375, 9.72607421875, 10.329345703125, 10.9326171875, 11.535888671875, 12.13916015625, 12.742431640625, 13.345703125, 13.948974609375, 14.55224609375, 15.155517578125, 15.7587890625, 16.362060546875, 16.96533203125, 17.568603515625, 18.171875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 8.0, 18.0, 32.0, 55.0, 105.0, 183.0, 374.0, 1083.0, 7161.0, 727211.0, 306399.0, 4311.0, 865.0, 378.0, 179.0, 68.0, 44.0, 25.0, 20.0, 5.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.555419921875, -31.67333984375, -30.791259765625, -29.9091796875, -29.027099609375, -28.14501953125, -27.262939453125, -26.380859375, -25.498779296875, -24.61669921875, -23.734619140625, -22.8525390625, -21.970458984375, -21.08837890625, -20.206298828125, -19.32421875, -18.442138671875, -17.56005859375, -16.677978515625, -15.7958984375, -14.913818359375, -14.03173828125, -13.149658203125, -12.267578125, -11.385498046875, -10.50341796875, -9.621337890625, -8.7392578125, -7.857177734375, -6.97509765625, -6.093017578125, -5.2109375, -4.328857421875, -3.44677734375, -2.564697265625, -1.6826171875, -0.800537109375, 0.08154296875, 0.963623046875, 1.845703125, 2.727783203125, 3.60986328125, 4.491943359375, 5.3740234375, 6.256103515625, 7.13818359375, 8.020263671875, 8.90234375, 9.784423828125, 10.66650390625, 11.548583984375, 12.4306640625, 13.312744140625, 14.19482421875, 15.076904296875, 15.958984375, 16.841064453125, 17.72314453125, 18.605224609375, 19.4873046875, 20.369384765625, 21.25146484375, 22.133544921875, 23.015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 5.0, 4.0, 8.0, 13.0, 19.0, 21.0, 40.0, 64.0, 68.0, 119.0, 119.0, 153.0, 88.0, 82.0, 62.0, 43.0, 26.0, 21.0, 12.0, 6.0, 8.0, 6.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.002300262451171875, -0.0022467374801635742, -0.0021932125091552734, -0.0021396875381469727, -0.002086162567138672, -0.002032637596130371, -0.0019791126251220703, -0.0019255876541137695, -0.0018720626831054688, -0.001818537712097168, -0.0017650127410888672, -0.0017114877700805664, -0.0016579627990722656, -0.0016044378280639648, -0.001550912857055664, -0.0014973878860473633, -0.0014438629150390625, -0.0013903379440307617, -0.001336812973022461, -0.0012832880020141602, -0.0012297630310058594, -0.0011762380599975586, -0.0011227130889892578, -0.001069188117980957, -0.0010156631469726562, -0.0009621381759643555, -0.0009086132049560547, -0.0008550882339477539, -0.0008015632629394531, -0.0007480382919311523, -0.0006945133209228516, -0.0006409883499145508, -0.00058746337890625, -0.0005339384078979492, -0.00048041343688964844, -0.00042688846588134766, -0.0003733634948730469, -0.0003198385238647461, -0.0002663135528564453, -0.00021278858184814453, -0.00015926361083984375, -0.00010573863983154297, -5.221366882324219e-05, 1.3113021850585938e-06, 5.4836273193359375e-05, 0.00010836124420166016, 0.00016188621520996094, 0.00021541118621826172, 0.0002689361572265625, 0.0003224611282348633, 0.00037598609924316406, 0.00042951107025146484, 0.0004830360412597656, 0.0005365610122680664, 0.0005900859832763672, 0.000643610954284668, 0.0006971359252929688, 0.0007506608963012695, 0.0008041858673095703, 0.0008577108383178711, 0.0009112358093261719, 0.0009647607803344727, 0.0010182857513427734, 0.0010718107223510742, 0.001125335693359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 19.0, 21.0, 40.0, 99.0, 228.0, 806.0, 5583.0, 932535.0, 106097.0, 2314.0, 447.0, 178.0, 91.0, 39.0, 19.0, 18.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.625, -42.208984375, -40.79296875, -39.376953125, -37.9609375, -36.544921875, -35.12890625, -33.712890625, -32.296875, -30.880859375, -29.46484375, -28.048828125, -26.6328125, -25.216796875, -23.80078125, -22.384765625, -20.96875, -19.552734375, -18.13671875, -16.720703125, -15.3046875, -13.888671875, -12.47265625, -11.056640625, -9.640625, -8.224609375, -6.80859375, -5.392578125, -3.9765625, -2.560546875, -1.14453125, 0.271484375, 1.6875, 3.103515625, 4.51953125, 5.935546875, 7.3515625, 8.767578125, 10.18359375, 11.599609375, 13.015625, 14.431640625, 15.84765625, 17.263671875, 18.6796875, 20.095703125, 21.51171875, 22.927734375, 24.34375, 25.759765625, 27.17578125, 28.591796875, 30.0078125, 31.423828125, 32.83984375, 34.255859375, 35.671875, 37.087890625, 38.50390625, 39.919921875, 41.3359375, 42.751953125, 44.16796875, 45.583984375, 47.0]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 20.0, 25.0, 55.0, 87.0, 160.0, 209.0, 211.0, 117.0, 53.0, 27.0, 13.0, 9.0, 6.0, 5.0, 2.0, 2.0], "bins": [-41.21875, -40.4508056640625, -39.682861328125, -38.9149169921875, -38.14697265625, -37.3790283203125, -36.611083984375, -35.8431396484375, -35.0751953125, -34.3072509765625, -33.539306640625, -32.7713623046875, -32.00341796875, -31.2354736328125, -30.467529296875, -29.6995849609375, -28.931640625, -28.1636962890625, -27.395751953125, -26.6278076171875, -25.85986328125, -25.0919189453125, -24.323974609375, -23.5560302734375, -22.7880859375, -22.0201416015625, -21.252197265625, -20.4842529296875, -19.71630859375, -18.9483642578125, -18.180419921875, -17.4124755859375, -16.64453125, -15.8765869140625, -15.108642578125, -14.3406982421875, -13.57275390625, -12.8048095703125, -12.036865234375, -11.2689208984375, -10.5009765625, -9.7330322265625, -8.965087890625, -8.1971435546875, -7.42919921875, -6.6612548828125, -5.893310546875, -5.1253662109375, -4.357421875, -3.5894775390625, -2.821533203125, -2.0535888671875, -1.28564453125, -0.5177001953125, 0.250244140625, 1.0181884765625, 1.7861328125, 2.5540771484375, 3.322021484375, 4.0899658203125, 4.85791015625, 5.6258544921875, 6.393798828125, 7.1617431640625, 7.9296875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 23.0, 112.0, 613.0, 233.0, 23.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-711.9569702148438, -688.7424926757812, -665.5280151367188, -642.3134765625, -619.0989990234375, -595.884521484375, -572.6700439453125, -549.45556640625, -526.2410888671875, -503.026611328125, -479.8121032714844, -456.5976257324219, -433.38311767578125, -410.16864013671875, -386.95416259765625, -363.73968505859375, -340.525146484375, -317.3106689453125, -294.0961608886719, -270.8816833496094, -247.6671905517578, -224.45269775390625, -201.23822021484375, -178.0237274169922, -154.80923461914062, -131.59474182128906, -108.38025665283203, -85.165771484375, -61.95127868652344, -38.736785888671875, -15.522308349609375, 7.6921844482421875, 30.9066162109375, 54.1211051940918, 77.3355941772461, 100.55007934570312, 123.76457214355469, 146.97906494140625, 170.19354248046875, 193.4080352783203, 216.62252807617188, 239.83702087402344, 263.051513671875, 286.2659912109375, 309.48046875, 332.6949768066406, 355.9094543457031, 379.12396240234375, 402.33843994140625, 425.55291748046875, 448.7674255371094, 471.9819030761719, 495.1964111328125, 518.410888671875, 541.6253662109375, 564.83984375, 588.0543212890625, 611.268798828125, 634.4832763671875, 657.69775390625, 680.9122924804688, 704.1267700195312, 727.3412475585938, 750.5557250976562, 773.770263671875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 2.0, 6.0, 3.0, 6.0, 12.0, 11.0, 13.0, 16.0, 12.0, 19.0, 22.0, 23.0, 26.0, 28.0, 42.0, 41.0, 45.0, 46.0, 50.0, 52.0, 54.0, 52.0, 56.0, 44.0, 40.0, 46.0, 36.0, 34.0, 20.0, 29.0, 28.0, 18.0, 13.0, 13.0, 12.0, 5.0, 4.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-121.19415283203125, -117.8420181274414, -114.48988342285156, -111.13775634765625, -107.7856216430664, -104.43348693847656, -101.08135223388672, -97.72921752929688, -94.37709045410156, -91.02495574951172, -87.67282104492188, -84.32069396972656, -80.96855926513672, -77.61642456054688, -74.26428985595703, -70.91215515136719, -67.56002044677734, -64.2078857421875, -60.85575485229492, -57.50362014770508, -54.1514892578125, -50.799354553222656, -47.44721984863281, -44.09508514404297, -40.74295425415039, -37.39081954956055, -34.03868865966797, -30.686553955078125, -27.334421157836914, -23.982288360595703, -20.63015365600586, -17.27802085876465, -13.925888061523438, -10.573755264282227, -7.221621513366699, -3.869487762451172, -0.5173549652099609, 2.83477783203125, 6.186912536621094, 9.539045333862305, 12.891178131103516, 16.243310928344727, 19.595443725585938, 22.94757843017578, 26.299711227416992, 29.651844024658203, 33.00397872924805, 36.356109619140625, 39.70824432373047, 43.06037902832031, 46.41250991821289, 49.764644622802734, 53.11677551269531, 56.468910217285156, 59.821044921875, 63.173179626464844, 66.52531433105469, 69.87744903564453, 73.22958374023438, 76.58171081542969, 79.93384552001953, 83.28598022460938, 86.63811492919922, 89.99024963378906, 93.34237670898438]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 6.0, 13.0, 19.0, 35.0, 60.0, 94.0, 129.0, 197.0, 376.0, 664.0, 1215.0, 2896.0, 8312.0, 40211.0, 4025306.0, 93984.0, 13036.0, 4050.0, 1685.0, 797.0, 481.0, 254.0, 179.0, 102.0, 57.0, 43.0, 28.0, 10.0, 12.0, 10.0, 3.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.1875, -26.271240234375, -25.35498046875, -24.438720703125, -23.5224609375, -22.606201171875, -21.68994140625, -20.773681640625, -19.857421875, -18.941162109375, -18.02490234375, -17.108642578125, -16.1923828125, -15.276123046875, -14.35986328125, -13.443603515625, -12.52734375, -11.611083984375, -10.69482421875, -9.778564453125, -8.8623046875, -7.946044921875, -7.02978515625, -6.113525390625, -5.197265625, -4.281005859375, -3.36474609375, -2.448486328125, -1.5322265625, -0.615966796875, 0.30029296875, 1.216552734375, 2.1328125, 3.049072265625, 3.96533203125, 4.881591796875, 5.7978515625, 6.714111328125, 7.63037109375, 8.546630859375, 9.462890625, 10.379150390625, 11.29541015625, 12.211669921875, 13.1279296875, 14.044189453125, 14.96044921875, 15.876708984375, 16.79296875, 17.709228515625, 18.62548828125, 19.541748046875, 20.4580078125, 21.374267578125, 22.29052734375, 23.206787109375, 24.123046875, 25.039306640625, 25.95556640625, 26.871826171875, 27.7880859375, 28.704345703125, 29.62060546875, 30.536865234375, 31.453125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 5.0, 4.0, 3.0, 13.0, 12.0, 22.0, 16.0, 30.0, 27.0, 49.0, 27.0, 48.0, 45.0, 53.0, 57.0, 69.0, 60.0, 54.0, 58.0, 40.0, 41.0, 44.0, 35.0, 34.0, 30.0, 26.0, 21.0, 13.0, 14.0, 9.0, 12.0, 5.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.4453125, -6.26812744140625, -6.0909423828125, -5.91375732421875, -5.736572265625, -5.55938720703125, -5.3822021484375, -5.20501708984375, -5.02783203125, -4.85064697265625, -4.6734619140625, -4.49627685546875, -4.319091796875, -4.14190673828125, -3.9647216796875, -3.78753662109375, -3.6103515625, -3.43316650390625, -3.2559814453125, -3.07879638671875, -2.901611328125, -2.72442626953125, -2.5472412109375, -2.37005615234375, -2.19287109375, -2.01568603515625, -1.8385009765625, -1.66131591796875, -1.484130859375, -1.30694580078125, -1.1297607421875, -0.95257568359375, -0.775390625, -0.59820556640625, -0.4210205078125, -0.24383544921875, -0.066650390625, 0.11053466796875, 0.2877197265625, 0.46490478515625, 0.64208984375, 0.81927490234375, 0.9964599609375, 1.17364501953125, 1.350830078125, 1.52801513671875, 1.7052001953125, 1.88238525390625, 2.0595703125, 2.23675537109375, 2.4139404296875, 2.59112548828125, 2.768310546875, 2.94549560546875, 3.1226806640625, 3.29986572265625, 3.47705078125, 3.65423583984375, 3.8314208984375, 4.00860595703125, 4.185791015625, 4.36297607421875, 4.5401611328125, 4.71734619140625, 4.89453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 9.0, 13.0, 16.0, 18.0, 22.0, 49.0, 48.0, 73.0, 87.0, 135.0, 174.0, 232.0, 339.0, 476.0, 742.0, 1121.0, 1824.0, 3351.0, 6936.0, 20008.0, 106971.0, 3938167.0, 82046.0, 17133.0, 6257.0, 3034.0, 1644.0, 1018.0, 716.0, 486.0, 314.0, 241.0, 159.0, 119.0, 86.0, 62.0, 51.0, 39.0, 20.0, 13.0, 13.0, 7.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.546875, -16.970458984375, -16.39404296875, -15.817626953125, -15.2412109375, -14.664794921875, -14.08837890625, -13.511962890625, -12.935546875, -12.359130859375, -11.78271484375, -11.206298828125, -10.6298828125, -10.053466796875, -9.47705078125, -8.900634765625, -8.32421875, -7.747802734375, -7.17138671875, -6.594970703125, -6.0185546875, -5.442138671875, -4.86572265625, -4.289306640625, -3.712890625, -3.136474609375, -2.56005859375, -1.983642578125, -1.4072265625, -0.830810546875, -0.25439453125, 0.322021484375, 0.8984375, 1.474853515625, 2.05126953125, 2.627685546875, 3.2041015625, 3.780517578125, 4.35693359375, 4.933349609375, 5.509765625, 6.086181640625, 6.66259765625, 7.239013671875, 7.8154296875, 8.391845703125, 8.96826171875, 9.544677734375, 10.12109375, 10.697509765625, 11.27392578125, 11.850341796875, 12.4267578125, 13.003173828125, 13.57958984375, 14.156005859375, 14.732421875, 15.308837890625, 15.88525390625, 16.461669921875, 17.0380859375, 17.614501953125, 18.19091796875, 18.767333984375, 19.34375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 4.0, 8.0, 7.0, 16.0, 19.0, 35.0, 79.0, 253.0, 3338.0, 169.0, 69.0, 28.0, 23.0, 9.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76171875, -5.578125, -5.39453125, -5.2109375, -5.02734375, -4.84375, -4.66015625, -4.4765625, -4.29296875, -4.109375, -3.92578125, -3.7421875, -3.55859375, -3.375, -3.19140625, -3.0078125, -2.82421875, -2.640625, -2.45703125, -2.2734375, -2.08984375, -1.90625, -1.72265625, -1.5390625, -1.35546875, -1.171875, -0.98828125, -0.8046875, -0.62109375, -0.4375, -0.25390625, -0.0703125, 0.11328125, 0.296875, 0.48046875, 0.6640625, 0.84765625, 1.03125, 1.21484375, 1.3984375, 1.58203125, 1.765625, 1.94921875, 2.1328125, 2.31640625, 2.5, 2.68359375, 2.8671875, 3.05078125, 3.234375, 3.41796875, 3.6015625, 3.78515625, 3.96875, 4.15234375, 4.3359375, 4.51953125, 4.703125, 4.88671875, 5.0703125, 5.25390625, 5.4375, 5.62109375, 5.8046875, 5.98828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 10.0, 35.0, 78.0, 192.0, 302.0, 229.0, 112.0, 23.0, 12.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.132436752319336, -24.480453491210938, -22.828472137451172, -21.176488876342773, -19.524505615234375, -17.872522354125977, -16.220539093017578, -14.568557739257812, -12.916574478149414, -11.264591217041016, -9.612608909606934, -7.960626125335693, -6.308643341064453, -4.656660079956055, -3.0046777725219727, -1.3526954650878906, 0.2992877960205078, 1.951270580291748, 3.6032533645629883, 5.2552361488342285, 6.907218933105469, 8.559202194213867, 10.21118450164795, 11.863166809082031, 13.51515007019043, 15.167133331298828, 16.819114685058594, 18.471097946166992, 20.12308120727539, 21.77506446838379, 23.427047729492188, 25.079029083251953, 26.73101043701172, 28.382993698120117, 30.034976959228516, 31.68695831298828, 33.33894348144531, 34.99092483520508, 36.642906188964844, 38.294891357421875, 39.94687271118164, 41.598854064941406, 43.25083923339844, 44.9028205871582, 46.55480194091797, 48.206787109375, 49.858768463134766, 51.51074981689453, 53.16273498535156, 54.81471633911133, 56.46670150756836, 58.118682861328125, 59.770668029785156, 61.42264938354492, 63.07463073730469, 64.72661590576172, 66.37860107421875, 68.03058624267578, 69.68256378173828, 71.33454895019531, 72.98653411865234, 74.63851928710938, 76.29049682617188, 77.9424819946289, 79.5944595336914]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 11.0, 16.0, 14.0, 12.0, 23.0, 9.0, 14.0, 16.0, 23.0, 21.0, 24.0, 22.0, 29.0, 36.0, 37.0, 45.0, 41.0, 42.0, 44.0, 38.0, 33.0, 55.0, 39.0, 35.0, 27.0, 29.0, 38.0, 32.0, 20.0, 21.0, 26.0, 14.0, 25.0, 25.0, 15.0, 12.0, 13.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.527572631835938, -11.191959381103516, -10.856346130371094, -10.520732879638672, -10.18511962890625, -9.849506378173828, -9.513893127441406, -9.178279876708984, -8.842666625976562, -8.50705337524414, -8.171440124511719, -7.835826873779297, -7.500213623046875, -7.164600372314453, -6.828987121582031, -6.493373870849609, -6.157760143280029, -5.822146892547607, -5.4865336418151855, -5.150920391082764, -4.815307140350342, -4.47969388961792, -4.14408016204834, -3.808467149734497, -3.472853899002075, -3.1372406482696533, -2.8016273975372314, -2.4660139083862305, -2.1304006576538086, -1.7947875261306763, -1.4591741561889648, -1.123560905456543, -0.7879476547241211, -0.45233437418937683, -0.11672109365463257, 0.21889221668243408, 0.554505467414856, 0.8901187181472778, 1.2257320880889893, 1.5613453388214111, 1.896958589553833, 2.232571840286255, 2.5681850910186768, 2.9037985801696777, 3.2394118309020996, 3.5750250816345215, 3.9106383323669434, 4.246251583099365, 4.581864833831787, 4.917478084564209, 5.253091335296631, 5.588704586029053, 5.924317836761475, 6.2599310874938965, 6.595544815063477, 6.931158065795898, 7.26677131652832, 7.602384567260742, 7.937997817993164, 8.273611068725586, 8.609224319458008, 8.94483757019043, 9.280450820922852, 9.616064071655273, 9.951677322387695]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 7.0, 4.0, 17.0, 21.0, 41.0, 47.0, 81.0, 160.0, 251.0, 461.0, 1019.0, 2788.0, 8815.0, 33563.0, 142130.0, 447799.0, 307244.0, 76930.0, 18460.0, 5159.0, 1854.0, 809.0, 357.0, 196.0, 108.0, 66.0, 41.0, 38.0, 31.0, 22.0, 5.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.6474609375, -14.138671875, -13.6298828125, -13.12109375, -12.6123046875, -12.103515625, -11.5947265625, -11.0859375, -10.5771484375, -10.068359375, -9.5595703125, -9.05078125, -8.5419921875, -8.033203125, -7.5244140625, -7.015625, -6.5068359375, -5.998046875, -5.4892578125, -4.98046875, -4.4716796875, -3.962890625, -3.4541015625, -2.9453125, -2.4365234375, -1.927734375, -1.4189453125, -0.91015625, -0.4013671875, 0.107421875, 0.6162109375, 1.125, 1.6337890625, 2.142578125, 2.6513671875, 3.16015625, 3.6689453125, 4.177734375, 4.6865234375, 5.1953125, 5.7041015625, 6.212890625, 6.7216796875, 7.23046875, 7.7392578125, 8.248046875, 8.7568359375, 9.265625, 9.7744140625, 10.283203125, 10.7919921875, 11.30078125, 11.8095703125, 12.318359375, 12.8271484375, 13.3359375, 13.8447265625, 14.353515625, 14.8623046875, 15.37109375, 15.8798828125, 16.388671875, 16.8974609375, 17.40625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 8.0, 7.0, 3.0, 7.0, 13.0, 6.0, 19.0, 19.0, 33.0, 37.0, 30.0, 42.0, 33.0, 45.0, 61.0, 47.0, 55.0, 59.0, 57.0, 48.0, 45.0, 37.0, 45.0, 43.0, 33.0, 23.0, 33.0, 18.0, 22.0, 15.0, 16.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0], "bins": [-6.5546875, -6.37615966796875, -6.1976318359375, -6.01910400390625, -5.840576171875, -5.66204833984375, -5.4835205078125, -5.30499267578125, -5.12646484375, -4.94793701171875, -4.7694091796875, -4.59088134765625, -4.412353515625, -4.23382568359375, -4.0552978515625, -3.87677001953125, -3.6982421875, -3.51971435546875, -3.3411865234375, -3.16265869140625, -2.984130859375, -2.80560302734375, -2.6270751953125, -2.44854736328125, -2.27001953125, -2.09149169921875, -1.9129638671875, -1.73443603515625, -1.555908203125, -1.37738037109375, -1.1988525390625, -1.02032470703125, -0.841796875, -0.66326904296875, -0.4847412109375, -0.30621337890625, -0.127685546875, 0.05084228515625, 0.2293701171875, 0.40789794921875, 0.58642578125, 0.76495361328125, 0.9434814453125, 1.12200927734375, 1.300537109375, 1.47906494140625, 1.6575927734375, 1.83612060546875, 2.0146484375, 2.19317626953125, 2.3717041015625, 2.55023193359375, 2.728759765625, 2.90728759765625, 3.0858154296875, 3.26434326171875, 3.44287109375, 3.62139892578125, 3.7999267578125, 3.97845458984375, 4.156982421875, 4.33551025390625, 4.5140380859375, 4.69256591796875, 4.87109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 6.0, 10.0, 16.0, 17.0, 19.0, 42.0, 52.0, 79.0, 117.0, 161.0, 216.0, 286.0, 452.0, 664.0, 1201.0, 2790.0, 13694.0, 189636.0, 769256.0, 58729.0, 6528.0, 1866.0, 899.0, 590.0, 357.0, 252.0, 162.0, 143.0, 89.0, 69.0, 43.0, 38.0, 25.0, 11.0, 17.0, 10.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.125, -21.25048828125, -20.3759765625, -19.50146484375, -18.626953125, -17.75244140625, -16.8779296875, -16.00341796875, -15.12890625, -14.25439453125, -13.3798828125, -12.50537109375, -11.630859375, -10.75634765625, -9.8818359375, -9.00732421875, -8.1328125, -7.25830078125, -6.3837890625, -5.50927734375, -4.634765625, -3.76025390625, -2.8857421875, -2.01123046875, -1.13671875, -0.26220703125, 0.6123046875, 1.48681640625, 2.361328125, 3.23583984375, 4.1103515625, 4.98486328125, 5.859375, 6.73388671875, 7.6083984375, 8.48291015625, 9.357421875, 10.23193359375, 11.1064453125, 11.98095703125, 12.85546875, 13.72998046875, 14.6044921875, 15.47900390625, 16.353515625, 17.22802734375, 18.1025390625, 18.97705078125, 19.8515625, 20.72607421875, 21.6005859375, 22.47509765625, 23.349609375, 24.22412109375, 25.0986328125, 25.97314453125, 26.84765625, 27.72216796875, 28.5966796875, 29.47119140625, 30.345703125, 31.22021484375, 32.0947265625, 32.96923828125, 33.84375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 3.0, 5.0, 9.0, 17.0, 14.0, 22.0, 23.0, 16.0, 28.0, 29.0, 36.0, 38.0, 44.0, 43.0, 64.0, 40.0, 46.0, 42.0, 51.0, 52.0, 44.0, 38.0, 43.0, 38.0, 25.0, 30.0, 27.0, 22.0, 14.0, 17.0, 16.0, 13.0, 8.0, 6.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-23.515625, -22.7724609375, -22.029296875, -21.2861328125, -20.54296875, -19.7998046875, -19.056640625, -18.3134765625, -17.5703125, -16.8271484375, -16.083984375, -15.3408203125, -14.59765625, -13.8544921875, -13.111328125, -12.3681640625, -11.625, -10.8818359375, -10.138671875, -9.3955078125, -8.65234375, -7.9091796875, -7.166015625, -6.4228515625, -5.6796875, -4.9365234375, -4.193359375, -3.4501953125, -2.70703125, -1.9638671875, -1.220703125, -0.4775390625, 0.265625, 1.0087890625, 1.751953125, 2.4951171875, 3.23828125, 3.9814453125, 4.724609375, 5.4677734375, 6.2109375, 6.9541015625, 7.697265625, 8.4404296875, 9.18359375, 9.9267578125, 10.669921875, 11.4130859375, 12.15625, 12.8994140625, 13.642578125, 14.3857421875, 15.12890625, 15.8720703125, 16.615234375, 17.3583984375, 18.1015625, 18.8447265625, 19.587890625, 20.3310546875, 21.07421875, 21.8173828125, 22.560546875, 23.3037109375, 24.046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 6.0, 3.0, 3.0, 10.0, 9.0, 7.0, 8.0, 9.0, 16.0, 16.0, 17.0, 20.0, 38.0, 56.0, 104.0, 185.0, 357.0, 803.0, 4056.0, 126993.0, 897667.0, 15387.0, 1637.0, 526.0, 209.0, 123.0, 79.0, 56.0, 38.0, 30.0, 14.0, 14.0, 16.0, 10.0, 4.0, 6.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.484375, -24.694091796875, -23.90380859375, -23.113525390625, -22.3232421875, -21.532958984375, -20.74267578125, -19.952392578125, -19.162109375, -18.371826171875, -17.58154296875, -16.791259765625, -16.0009765625, -15.210693359375, -14.42041015625, -13.630126953125, -12.83984375, -12.049560546875, -11.25927734375, -10.468994140625, -9.6787109375, -8.888427734375, -8.09814453125, -7.307861328125, -6.517578125, -5.727294921875, -4.93701171875, -4.146728515625, -3.3564453125, -2.566162109375, -1.77587890625, -0.985595703125, -0.1953125, 0.594970703125, 1.38525390625, 2.175537109375, 2.9658203125, 3.756103515625, 4.54638671875, 5.336669921875, 6.126953125, 6.917236328125, 7.70751953125, 8.497802734375, 9.2880859375, 10.078369140625, 10.86865234375, 11.658935546875, 12.44921875, 13.239501953125, 14.02978515625, 14.820068359375, 15.6103515625, 16.400634765625, 17.19091796875, 17.981201171875, 18.771484375, 19.561767578125, 20.35205078125, 21.142333984375, 21.9326171875, 22.722900390625, 23.51318359375, 24.303466796875, 25.09375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 9.0, 4.0, 3.0, 21.0, 19.0, 27.0, 24.0, 30.0, 40.0, 57.0, 71.0, 100.0, 93.0, 89.0, 75.0, 61.0, 39.0, 35.0, 31.0, 31.0, 18.0, 19.0, 13.0, 20.0, 10.0, 12.0, 1.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.0012960433959960938, -0.0012586414813995361, -0.0012212395668029785, -0.001183837652206421, -0.0011464357376098633, -0.0011090338230133057, -0.001071631908416748, -0.0010342299938201904, -0.0009968280792236328, -0.0009594261646270752, -0.0009220242500305176, -0.00088462233543396, -0.0008472204208374023, -0.0008098185062408447, -0.0007724165916442871, -0.0007350146770477295, -0.0006976127624511719, -0.0006602108478546143, -0.0006228089332580566, -0.000585407018661499, -0.0005480051040649414, -0.0005106031894683838, -0.00047320127487182617, -0.00043579936027526855, -0.00039839744567871094, -0.0003609955310821533, -0.0003235936164855957, -0.0002861917018890381, -0.00024878978729248047, -0.00021138787269592285, -0.00017398595809936523, -0.00013658404350280762, -9.918212890625e-05, -6.178021430969238e-05, -2.4378299713134766e-05, 1.3023614883422852e-05, 5.042552947998047e-05, 8.782744407653809e-05, 0.0001252293586730957, 0.00016263127326965332, 0.00020003318786621094, 0.00023743510246276855, 0.00027483701705932617, 0.0003122389316558838, 0.0003496408462524414, 0.000387042760848999, 0.00042444467544555664, 0.00046184659004211426, 0.0004992485046386719, 0.0005366504192352295, 0.0005740523338317871, 0.0006114542484283447, 0.0006488561630249023, 0.00068625807762146, 0.0007236599922180176, 0.0007610619068145752, 0.0007984638214111328, 0.0008358657360076904, 0.000873267650604248, 0.0009106695652008057, 0.0009480714797973633, 0.000985473394393921, 0.0010228753089904785, 0.0010602772235870361, 0.0010976791381835938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 3.0, 10.0, 14.0, 25.0, 36.0, 46.0, 98.0, 165.0, 297.0, 562.0, 1311.0, 4644.0, 43848.0, 851379.0, 133982.0, 8484.0, 1951.0, 804.0, 367.0, 200.0, 117.0, 76.0, 36.0, 22.0, 15.0, 12.0, 12.0, 6.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.734375, -21.125, -20.515625, -19.90625, -19.296875, -18.6875, -18.078125, -17.46875, -16.859375, -16.25, -15.640625, -15.03125, -14.421875, -13.8125, -13.203125, -12.59375, -11.984375, -11.375, -10.765625, -10.15625, -9.546875, -8.9375, -8.328125, -7.71875, -7.109375, -6.5, -5.890625, -5.28125, -4.671875, -4.0625, -3.453125, -2.84375, -2.234375, -1.625, -1.015625, -0.40625, 0.203125, 0.8125, 1.421875, 2.03125, 2.640625, 3.25, 3.859375, 4.46875, 5.078125, 5.6875, 6.296875, 6.90625, 7.515625, 8.125, 8.734375, 9.34375, 9.953125, 10.5625, 11.171875, 11.78125, 12.390625, 13.0, 13.609375, 14.21875, 14.828125, 15.4375, 16.046875, 16.65625, 17.265625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 10.0, 16.0, 27.0, 34.0, 51.0, 60.0, 123.0, 158.0, 168.0, 124.0, 78.0, 47.0, 36.0, 23.0, 16.0, 11.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.59375, -13.053466796875, -12.51318359375, -11.972900390625, -11.4326171875, -10.892333984375, -10.35205078125, -9.811767578125, -9.271484375, -8.731201171875, -8.19091796875, -7.650634765625, -7.1103515625, -6.570068359375, -6.02978515625, -5.489501953125, -4.94921875, -4.408935546875, -3.86865234375, -3.328369140625, -2.7880859375, -2.247802734375, -1.70751953125, -1.167236328125, -0.626953125, -0.086669921875, 0.45361328125, 0.993896484375, 1.5341796875, 2.074462890625, 2.61474609375, 3.155029296875, 3.6953125, 4.235595703125, 4.77587890625, 5.316162109375, 5.8564453125, 6.396728515625, 6.93701171875, 7.477294921875, 8.017578125, 8.557861328125, 9.09814453125, 9.638427734375, 10.1787109375, 10.718994140625, 11.25927734375, 11.799560546875, 12.33984375, 12.880126953125, 13.42041015625, 13.960693359375, 14.5009765625, 15.041259765625, 15.58154296875, 16.121826171875, 16.662109375, 17.202392578125, 17.74267578125, 18.282958984375, 18.8232421875, 19.363525390625, 19.90380859375, 20.444091796875, 20.984375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 42.0, 196.0, 406.0, 268.0, 63.0, 9.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-594.6671142578125, -580.3751831054688, -566.083251953125, -551.791259765625, -537.4993286132812, -523.2073974609375, -508.91546630859375, -494.6235046386719, -480.33154296875, -466.03961181640625, -451.7476501464844, -437.4557189941406, -423.16375732421875, -408.871826171875, -394.57989501953125, -380.2879333496094, -365.9960021972656, -351.7040710449219, -337.412109375, -323.12017822265625, -308.8282165527344, -294.5362854003906, -280.24432373046875, -265.952392578125, -251.6604461669922, -237.36849975585938, -223.07655334472656, -208.78460693359375, -194.49267578125, -180.20071411132812, -165.90878295898438, -151.61683654785156, -137.32485961914062, -123.03291320800781, -108.740966796875, -94.44902801513672, -80.1570816040039, -65.8651351928711, -51.57319641113281, -37.28125, -22.989303588867188, -8.697359085083008, 5.594585418701172, 19.88652801513672, 34.17847442626953, 48.470420837402344, 62.762359619140625, 77.05430603027344, 91.34625244140625, 105.63819885253906, 119.93014526367188, 134.22207641601562, 148.5140380859375, 162.80596923828125, 177.09791564941406, 191.38986206054688, 205.6818084716797, 219.9737548828125, 234.2657012939453, 248.55764770507812, 262.8495788574219, 277.14154052734375, 291.4334716796875, 305.72540283203125, 320.0173645019531]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 12.0, 16.0, 17.0, 12.0, 13.0, 25.0, 20.0, 31.0, 35.0, 24.0, 40.0, 44.0, 41.0, 38.0, 45.0, 41.0, 52.0, 50.0, 36.0, 48.0, 33.0, 43.0, 43.0, 32.0, 25.0, 23.0, 25.0, 21.0, 20.0, 13.0, 9.0, 8.0, 12.0, 3.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.62222290039062, -95.3524169921875, -92.08261108398438, -88.81279754638672, -85.5429916381836, -82.27318572998047, -79.00337982177734, -75.73356628417969, -72.46376037597656, -69.19395446777344, -65.92414855957031, -62.65433883666992, -59.38452911376953, -56.114723205566406, -52.84491729736328, -49.57510757446289, -46.305301666259766, -43.03549575805664, -39.76568603515625, -36.495880126953125, -33.226070404052734, -29.95626449584961, -26.68645668029785, -23.416648864746094, -20.146841049194336, -16.877033233642578, -13.60722541809082, -10.337418556213379, -7.067610740661621, -3.7978038787841797, -0.5279960632324219, 2.741811752319336, 6.011619567871094, 9.281427383422852, 12.55123519897461, 15.82104206085205, 19.090850830078125, 22.36065673828125, 25.630464553833008, 28.900272369384766, 32.170082092285156, 35.43988800048828, 38.70969772338867, 41.9795036315918, 45.24931335449219, 48.51911926269531, 51.78892517089844, 55.05873489379883, 58.32854080200195, 61.59834671020508, 64.86815643310547, 68.1379623413086, 71.40776824951172, 74.67758178710938, 77.9473876953125, 81.21719360351562, 84.48699951171875, 87.75680541992188, 91.026611328125, 94.29642486572266, 97.56623077392578, 100.8360366821289, 104.10584259033203, 107.37565612792969, 110.64546203613281]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 11.0, 13.0, 16.0, 31.0, 44.0, 73.0, 123.0, 208.0, 368.0, 684.0, 1526.0, 3486.0, 9732.0, 43435.0, 3771377.0, 324038.0, 26608.0, 7176.0, 2696.0, 1208.0, 591.0, 317.0, 203.0, 104.0, 69.0, 44.0, 31.0, 13.0, 15.0, 12.0, 9.0, 2.0, 6.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.078125, -24.31494140625, -23.5517578125, -22.78857421875, -22.025390625, -21.26220703125, -20.4990234375, -19.73583984375, -18.97265625, -18.20947265625, -17.4462890625, -16.68310546875, -15.919921875, -15.15673828125, -14.3935546875, -13.63037109375, -12.8671875, -12.10400390625, -11.3408203125, -10.57763671875, -9.814453125, -9.05126953125, -8.2880859375, -7.52490234375, -6.76171875, -5.99853515625, -5.2353515625, -4.47216796875, -3.708984375, -2.94580078125, -2.1826171875, -1.41943359375, -0.65625, 0.10693359375, 0.8701171875, 1.63330078125, 2.396484375, 3.15966796875, 3.9228515625, 4.68603515625, 5.44921875, 6.21240234375, 6.9755859375, 7.73876953125, 8.501953125, 9.26513671875, 10.0283203125, 10.79150390625, 11.5546875, 12.31787109375, 13.0810546875, 13.84423828125, 14.607421875, 15.37060546875, 16.1337890625, 16.89697265625, 17.66015625, 18.42333984375, 19.1865234375, 19.94970703125, 20.712890625, 21.47607421875, 22.2392578125, 23.00244140625, 23.765625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 11.0, 10.0, 14.0, 18.0, 30.0, 37.0, 53.0, 50.0, 62.0, 72.0, 74.0, 82.0, 72.0, 78.0, 65.0, 53.0, 49.0, 47.0, 26.0, 17.0, 22.0, 12.0, 12.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.36566162109375, -7.1180419921875, -6.87042236328125, -6.622802734375, -6.37518310546875, -6.1275634765625, -5.87994384765625, -5.63232421875, -5.38470458984375, -5.1370849609375, -4.88946533203125, -4.641845703125, -4.39422607421875, -4.1466064453125, -3.89898681640625, -3.6513671875, -3.40374755859375, -3.1561279296875, -2.90850830078125, -2.660888671875, -2.41326904296875, -2.1656494140625, -1.91802978515625, -1.67041015625, -1.42279052734375, -1.1751708984375, -0.92755126953125, -0.679931640625, -0.43231201171875, -0.1846923828125, 0.06292724609375, 0.310546875, 0.55816650390625, 0.8057861328125, 1.05340576171875, 1.301025390625, 1.54864501953125, 1.7962646484375, 2.04388427734375, 2.29150390625, 2.53912353515625, 2.7867431640625, 3.03436279296875, 3.281982421875, 3.52960205078125, 3.7772216796875, 4.02484130859375, 4.2724609375, 4.52008056640625, 4.7677001953125, 5.01531982421875, 5.262939453125, 5.51055908203125, 5.7581787109375, 6.00579833984375, 6.25341796875, 6.50103759765625, 6.7486572265625, 6.99627685546875, 7.243896484375, 7.49151611328125, 7.7391357421875, 7.98675537109375, 8.234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 11.0, 12.0, 13.0, 10.0, 33.0, 37.0, 63.0, 98.0, 124.0, 202.0, 324.0, 470.0, 725.0, 1270.0, 2251.0, 4501.0, 9980.0, 27988.0, 131674.0, 3771402.0, 187312.0, 33414.0, 11329.0, 4914.0, 2395.0, 1456.0, 829.0, 488.0, 324.0, 203.0, 113.0, 89.0, 74.0, 46.0, 28.0, 25.0, 13.0, 11.0, 13.0, 10.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.46142578125, -12.0400390625, -11.61865234375, -11.197265625, -10.77587890625, -10.3544921875, -9.93310546875, -9.51171875, -9.09033203125, -8.6689453125, -8.24755859375, -7.826171875, -7.40478515625, -6.9833984375, -6.56201171875, -6.140625, -5.71923828125, -5.2978515625, -4.87646484375, -4.455078125, -4.03369140625, -3.6123046875, -3.19091796875, -2.76953125, -2.34814453125, -1.9267578125, -1.50537109375, -1.083984375, -0.66259765625, -0.2412109375, 0.18017578125, 0.6015625, 1.02294921875, 1.4443359375, 1.86572265625, 2.287109375, 2.70849609375, 3.1298828125, 3.55126953125, 3.97265625, 4.39404296875, 4.8154296875, 5.23681640625, 5.658203125, 6.07958984375, 6.5009765625, 6.92236328125, 7.34375, 7.76513671875, 8.1865234375, 8.60791015625, 9.029296875, 9.45068359375, 9.8720703125, 10.29345703125, 10.71484375, 11.13623046875, 11.5576171875, 11.97900390625, 12.400390625, 12.82177734375, 13.2431640625, 13.66455078125, 14.0859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 13.0, 19.0, 28.0, 33.0, 87.0, 248.0, 2590.0, 675.0, 168.0, 63.0, 52.0, 26.0, 21.0, 14.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.00390625, -6.76104736328125, -6.5181884765625, -6.27532958984375, -6.032470703125, -5.78961181640625, -5.5467529296875, -5.30389404296875, -5.06103515625, -4.81817626953125, -4.5753173828125, -4.33245849609375, -4.089599609375, -3.84674072265625, -3.6038818359375, -3.36102294921875, -3.1181640625, -2.87530517578125, -2.6324462890625, -2.38958740234375, -2.146728515625, -1.90386962890625, -1.6610107421875, -1.41815185546875, -1.17529296875, -0.93243408203125, -0.6895751953125, -0.44671630859375, -0.203857421875, 0.03900146484375, 0.2818603515625, 0.52471923828125, 0.767578125, 1.01043701171875, 1.2532958984375, 1.49615478515625, 1.739013671875, 1.98187255859375, 2.2247314453125, 2.46759033203125, 2.71044921875, 2.95330810546875, 3.1961669921875, 3.43902587890625, 3.681884765625, 3.92474365234375, 4.1676025390625, 4.41046142578125, 4.6533203125, 4.89617919921875, 5.1390380859375, 5.38189697265625, 5.624755859375, 5.86761474609375, 6.1104736328125, 6.35333251953125, 6.59619140625, 6.83905029296875, 7.0819091796875, 7.32476806640625, 7.567626953125, 7.81048583984375, 8.0533447265625, 8.29620361328125, 8.5390625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 7.0, 4.0, 5.0, 13.0, 23.0, 37.0, 68.0, 82.0, 101.0, 127.0, 153.0, 100.0, 101.0, 59.0, 39.0, 30.0, 21.0, 14.0, 6.0, 9.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.00275421142578, -17.037540435791016, -16.07232666015625, -15.1071138381958, -14.141900062561035, -13.17668628692627, -12.21147346496582, -11.246259689331055, -10.281045913696289, -9.315832138061523, -8.350618362426758, -7.385405540466309, -6.420191764831543, -5.454977989196777, -4.48976469039917, -3.5245513916015625, -2.559337615966797, -1.5941240787506104, -0.6289105415344238, 0.3363029956817627, 1.3015165328979492, 2.266730308532715, 3.2319436073303223, 4.19715690612793, 5.162370681762695, 6.127584457397461, 7.092797756195068, 8.058011054992676, 9.023224830627441, 9.988438606262207, 10.953651428222656, 11.918865203857422, 12.884078979492188, 13.849292755126953, 14.814506530761719, 15.779719352722168, 16.74493408203125, 17.710147857666016, 18.67535972595215, 19.640573501586914, 20.60578727722168, 21.571001052856445, 22.53621482849121, 23.501428604125977, 24.46664047241211, 25.431854248046875, 26.39706802368164, 27.362281799316406, 28.327495574951172, 29.292709350585938, 30.257923126220703, 31.22313690185547, 32.188350677490234, 33.153564453125, 34.118778228759766, 35.08399200439453, 36.04920196533203, 37.0144157409668, 37.97962951660156, 38.94484329223633, 39.910057067871094, 40.87527084350586, 41.840484619140625, 42.805694580078125, 43.770912170410156]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 2.0, 5.0, 9.0, 4.0, 9.0, 13.0, 23.0, 18.0, 24.0, 15.0, 33.0, 25.0, 33.0, 30.0, 37.0, 32.0, 30.0, 25.0, 40.0, 53.0, 56.0, 50.0, 42.0, 41.0, 48.0, 35.0, 29.0, 21.0, 24.0, 24.0, 24.0, 27.0, 21.0, 23.0, 13.0, 17.0, 10.0, 7.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.932306289672852, -12.515914916992188, -12.099523544311523, -11.68313217163086, -11.266739845275879, -10.850348472595215, -10.43395709991455, -10.017565727233887, -9.601173400878906, -9.184782028198242, -8.768390655517578, -8.351999282836914, -7.935606956481934, -7.5192155838012695, -7.1028242111206055, -6.686432838439941, -6.270041465759277, -5.853650093078613, -5.437258243560791, -5.020866870880127, -4.604475021362305, -4.188083648681641, -3.7716922760009766, -3.3553006649017334, -2.9389090538024902, -2.522517442703247, -2.106125831604004, -1.6897344589233398, -1.2733428478240967, -0.8569512367248535, -0.44055986404418945, -0.02416825294494629, 0.3922233581542969, 0.8086149096488953, 1.2250064611434937, 1.6413979530334473, 2.0577895641326904, 2.4741811752319336, 2.8905725479125977, 3.306964159011841, 3.723355770111084, 4.139747142791748, 4.55613899230957, 4.972530364990234, 5.388921737670898, 5.805313587188721, 6.221704959869385, 6.638096809387207, 7.054488182067871, 7.470879554748535, 7.887271404266357, 8.30366325378418, 8.720054626464844, 9.136445999145508, 9.552837371826172, 9.969228744506836, 10.3856201171875, 10.802011489868164, 11.218402862548828, 11.634794235229492, 12.051186561584473, 12.467577934265137, 12.8839693069458, 13.300360679626465, 13.716753005981445]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 10.0, 11.0, 15.0, 18.0, 20.0, 51.0, 90.0, 121.0, 244.0, 411.0, 792.0, 1816.0, 4240.0, 11600.0, 37067.0, 129310.0, 406521.0, 319418.0, 94755.0, 27179.0, 8660.0, 3298.0, 1367.0, 682.0, 372.0, 192.0, 104.0, 73.0, 42.0, 30.0, 13.0, 7.0, 11.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4140625, -14.8404541015625, -14.266845703125, -13.6932373046875, -13.11962890625, -12.5460205078125, -11.972412109375, -11.3988037109375, -10.8251953125, -10.2515869140625, -9.677978515625, -9.1043701171875, -8.53076171875, -7.9571533203125, -7.383544921875, -6.8099365234375, -6.236328125, -5.6627197265625, -5.089111328125, -4.5155029296875, -3.94189453125, -3.3682861328125, -2.794677734375, -2.2210693359375, -1.6474609375, -1.0738525390625, -0.500244140625, 0.0733642578125, 0.64697265625, 1.2205810546875, 1.794189453125, 2.3677978515625, 2.94140625, 3.5150146484375, 4.088623046875, 4.6622314453125, 5.23583984375, 5.8094482421875, 6.383056640625, 6.9566650390625, 7.5302734375, 8.1038818359375, 8.677490234375, 9.2510986328125, 9.82470703125, 10.3983154296875, 10.971923828125, 11.5455322265625, 12.119140625, 12.6927490234375, 13.266357421875, 13.8399658203125, 14.41357421875, 14.9871826171875, 15.560791015625, 16.1343994140625, 16.7080078125, 17.2816162109375, 17.855224609375, 18.4288330078125, 19.00244140625, 19.5760498046875, 20.149658203125, 20.7232666015625, 21.296875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 2.0, 8.0, 10.0, 6.0, 17.0, 33.0, 34.0, 51.0, 47.0, 51.0, 82.0, 75.0, 80.0, 71.0, 76.0, 73.0, 59.0, 47.0, 43.0, 31.0, 31.0, 20.0, 16.0, 9.0, 10.0, 4.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.9854736328125, -7.728759765625, -7.4720458984375, -7.21533203125, -6.9586181640625, -6.701904296875, -6.4451904296875, -6.1884765625, -5.9317626953125, -5.675048828125, -5.4183349609375, -5.16162109375, -4.9049072265625, -4.648193359375, -4.3914794921875, -4.134765625, -3.8780517578125, -3.621337890625, -3.3646240234375, -3.10791015625, -2.8511962890625, -2.594482421875, -2.3377685546875, -2.0810546875, -1.8243408203125, -1.567626953125, -1.3109130859375, -1.05419921875, -0.7974853515625, -0.540771484375, -0.2840576171875, -0.02734375, 0.2293701171875, 0.486083984375, 0.7427978515625, 0.99951171875, 1.2562255859375, 1.512939453125, 1.7696533203125, 2.0263671875, 2.2830810546875, 2.539794921875, 2.7965087890625, 3.05322265625, 3.3099365234375, 3.566650390625, 3.8233642578125, 4.080078125, 4.3367919921875, 4.593505859375, 4.8502197265625, 5.10693359375, 5.3636474609375, 5.620361328125, 5.8770751953125, 6.1337890625, 6.3905029296875, 6.647216796875, 6.9039306640625, 7.16064453125, 7.4173583984375, 7.674072265625, 7.9307861328125, 8.1875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 18.0, 11.0, 28.0, 41.0, 69.0, 89.0, 137.0, 285.0, 615.0, 1597.0, 7916.0, 354026.0, 669276.0, 11116.0, 1836.0, 685.0, 337.0, 200.0, 92.0, 67.0, 22.0, 26.0, 17.0, 14.0, 7.0, 6.0, 3.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.25, -65.57177734375, -63.8935546875, -62.21533203125, -60.537109375, -58.85888671875, -57.1806640625, -55.50244140625, -53.82421875, -52.14599609375, -50.4677734375, -48.78955078125, -47.111328125, -45.43310546875, -43.7548828125, -42.07666015625, -40.3984375, -38.72021484375, -37.0419921875, -35.36376953125, -33.685546875, -32.00732421875, -30.3291015625, -28.65087890625, -26.97265625, -25.29443359375, -23.6162109375, -21.93798828125, -20.259765625, -18.58154296875, -16.9033203125, -15.22509765625, -13.546875, -11.86865234375, -10.1904296875, -8.51220703125, -6.833984375, -5.15576171875, -3.4775390625, -1.79931640625, -0.12109375, 1.55712890625, 3.2353515625, 4.91357421875, 6.591796875, 8.27001953125, 9.9482421875, 11.62646484375, 13.3046875, 14.98291015625, 16.6611328125, 18.33935546875, 20.017578125, 21.69580078125, 23.3740234375, 25.05224609375, 26.73046875, 28.40869140625, 30.0869140625, 31.76513671875, 33.443359375, 35.12158203125, 36.7998046875, 38.47802734375, 40.15625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 9.0, 10.0, 7.0, 10.0, 11.0, 15.0, 18.0, 27.0, 22.0, 45.0, 40.0, 52.0, 46.0, 58.0, 61.0, 59.0, 45.0, 62.0, 46.0, 64.0, 44.0, 47.0, 31.0, 38.0, 32.0, 18.0, 20.0, 10.0, 13.0, 8.0, 11.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.390625, -24.551513671875, -23.71240234375, -22.873291015625, -22.0341796875, -21.195068359375, -20.35595703125, -19.516845703125, -18.677734375, -17.838623046875, -16.99951171875, -16.160400390625, -15.3212890625, -14.482177734375, -13.64306640625, -12.803955078125, -11.96484375, -11.125732421875, -10.28662109375, -9.447509765625, -8.6083984375, -7.769287109375, -6.93017578125, -6.091064453125, -5.251953125, -4.412841796875, -3.57373046875, -2.734619140625, -1.8955078125, -1.056396484375, -0.21728515625, 0.621826171875, 1.4609375, 2.300048828125, 3.13916015625, 3.978271484375, 4.8173828125, 5.656494140625, 6.49560546875, 7.334716796875, 8.173828125, 9.012939453125, 9.85205078125, 10.691162109375, 11.5302734375, 12.369384765625, 13.20849609375, 14.047607421875, 14.88671875, 15.725830078125, 16.56494140625, 17.404052734375, 18.2431640625, 19.082275390625, 19.92138671875, 20.760498046875, 21.599609375, 22.438720703125, 23.27783203125, 24.116943359375, 24.9560546875, 25.795166015625, 26.63427734375, 27.473388671875, 28.3125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 9.0, 17.0, 24.0, 55.0, 95.0, 227.0, 520.0, 1627.0, 8040.0, 118375.0, 861153.0, 51678.0, 4831.0, 1169.0, 385.0, 171.0, 75.0, 42.0, 29.0, 15.0, 14.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.625, -9.128173828125, -8.63134765625, -8.134521484375, -7.6376953125, -7.140869140625, -6.64404296875, -6.147216796875, -5.650390625, -5.153564453125, -4.65673828125, -4.159912109375, -3.6630859375, -3.166259765625, -2.66943359375, -2.172607421875, -1.67578125, -1.178955078125, -0.68212890625, -0.185302734375, 0.3115234375, 0.808349609375, 1.30517578125, 1.802001953125, 2.298828125, 2.795654296875, 3.29248046875, 3.789306640625, 4.2861328125, 4.782958984375, 5.27978515625, 5.776611328125, 6.2734375, 6.770263671875, 7.26708984375, 7.763916015625, 8.2607421875, 8.757568359375, 9.25439453125, 9.751220703125, 10.248046875, 10.744873046875, 11.24169921875, 11.738525390625, 12.2353515625, 12.732177734375, 13.22900390625, 13.725830078125, 14.22265625, 14.719482421875, 15.21630859375, 15.713134765625, 16.2099609375, 16.706787109375, 17.20361328125, 17.700439453125, 18.197265625, 18.694091796875, 19.19091796875, 19.687744140625, 20.1845703125, 20.681396484375, 21.17822265625, 21.675048828125, 22.171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 22.0, 25.0, 30.0, 65.0, 92.0, 168.0, 220.0, 142.0, 96.0, 50.0, 29.0, 17.0, 14.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002590179443359375, -0.0024915337562561035, -0.002392888069152832, -0.0022942423820495605, -0.002195596694946289, -0.0020969510078430176, -0.001998305320739746, -0.0018996596336364746, -0.0018010139465332031, -0.0017023682594299316, -0.0016037225723266602, -0.0015050768852233887, -0.0014064311981201172, -0.0013077855110168457, -0.0012091398239135742, -0.0011104941368103027, -0.0010118484497070312, -0.0009132027626037598, -0.0008145570755004883, -0.0007159113883972168, -0.0006172657012939453, -0.0005186200141906738, -0.00041997432708740234, -0.00032132863998413086, -0.00022268295288085938, -0.0001240372657775879, -2.5391578674316406e-05, 7.325410842895508e-05, 0.00017189979553222656, 0.00027054548263549805, 0.00036919116973876953, 0.000467836856842041, 0.0005664825439453125, 0.000665128231048584, 0.0007637739181518555, 0.000862419605255127, 0.0009610652923583984, 0.00105971097946167, 0.0011583566665649414, 0.0012570023536682129, 0.0013556480407714844, 0.0014542937278747559, 0.0015529394149780273, 0.0016515851020812988, 0.0017502307891845703, 0.0018488764762878418, 0.0019475221633911133, 0.0020461678504943848, 0.0021448135375976562, 0.0022434592247009277, 0.0023421049118041992, 0.0024407505989074707, 0.002539396286010742, 0.0026380419731140137, 0.002736687660217285, 0.0028353333473205566, 0.002933979034423828, 0.0030326247215270996, 0.003131270408630371, 0.0032299160957336426, 0.003328561782836914, 0.0034272074699401855, 0.003525853157043457, 0.0036244988441467285, 0.00372314453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 0.0, 2.0, 6.0, 13.0, 16.0, 9.0, 23.0, 42.0, 50.0, 90.0, 118.0, 227.0, 410.0, 876.0, 2545.0, 12340.0, 151381.0, 808073.0, 61994.0, 6967.0, 1810.0, 711.0, 326.0, 176.0, 102.0, 70.0, 59.0, 39.0, 20.0, 12.0, 10.0, 7.0, 8.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0703125, -12.625, -12.1796875, -11.734375, -11.2890625, -10.84375, -10.3984375, -9.953125, -9.5078125, -9.0625, -8.6171875, -8.171875, -7.7265625, -7.28125, -6.8359375, -6.390625, -5.9453125, -5.5, -5.0546875, -4.609375, -4.1640625, -3.71875, -3.2734375, -2.828125, -2.3828125, -1.9375, -1.4921875, -1.046875, -0.6015625, -0.15625, 0.2890625, 0.734375, 1.1796875, 1.625, 2.0703125, 2.515625, 2.9609375, 3.40625, 3.8515625, 4.296875, 4.7421875, 5.1875, 5.6328125, 6.078125, 6.5234375, 6.96875, 7.4140625, 7.859375, 8.3046875, 8.75, 9.1953125, 9.640625, 10.0859375, 10.53125, 10.9765625, 11.421875, 11.8671875, 12.3125, 12.7578125, 13.203125, 13.6484375, 14.09375, 14.5390625, 14.984375, 15.4296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 7.0, 4.0, 3.0, 4.0, 7.0, 14.0, 12.0, 11.0, 17.0, 27.0, 21.0, 37.0, 41.0, 42.0, 67.0, 96.0, 90.0, 103.0, 80.0, 73.0, 49.0, 41.0, 30.0, 26.0, 24.0, 17.0, 11.0, 13.0, 5.0, 9.0, 12.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.68731689453125, -5.4410400390625, -5.19476318359375, -4.948486328125, -4.70220947265625, -4.4559326171875, -4.20965576171875, -3.96337890625, -3.71710205078125, -3.4708251953125, -3.22454833984375, -2.978271484375, -2.73199462890625, -2.4857177734375, -2.23944091796875, -1.9931640625, -1.74688720703125, -1.5006103515625, -1.25433349609375, -1.008056640625, -0.76177978515625, -0.5155029296875, -0.26922607421875, -0.02294921875, 0.22332763671875, 0.4696044921875, 0.71588134765625, 0.962158203125, 1.20843505859375, 1.4547119140625, 1.70098876953125, 1.947265625, 2.19354248046875, 2.4398193359375, 2.68609619140625, 2.932373046875, 3.17864990234375, 3.4249267578125, 3.67120361328125, 3.91748046875, 4.16375732421875, 4.4100341796875, 4.65631103515625, 4.902587890625, 5.14886474609375, 5.3951416015625, 5.64141845703125, 5.8876953125, 6.13397216796875, 6.3802490234375, 6.62652587890625, 6.872802734375, 7.11907958984375, 7.3653564453125, 7.61163330078125, 7.85791015625, 8.10418701171875, 8.3504638671875, 8.59674072265625, 8.843017578125, 9.08929443359375, 9.3355712890625, 9.58184814453125, 9.828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 7.0, 12.0, 16.0, 36.0, 60.0, 111.0, 159.0, 161.0, 157.0, 129.0, 74.0, 28.0, 20.0, 17.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.7603759765625, -159.92202758789062, -154.08367919921875, -148.24534606933594, -142.40699768066406, -136.5686492919922, -130.7303009033203, -124.89196014404297, -119.05361938476562, -113.21527099609375, -107.3769302368164, -101.53858184814453, -95.70024108886719, -89.86189270019531, -84.02354431152344, -78.1852035522461, -72.34685516357422, -66.50850677490234, -60.670166015625, -54.831817626953125, -48.99347686767578, -43.155128479003906, -37.3167839050293, -31.478439331054688, -25.640094757080078, -19.80175018310547, -13.963404655456543, -8.125059127807617, -2.286714553833008, 3.5516300201416016, 9.389976501464844, 15.228321075439453, 21.066665649414062, 26.905010223388672, 32.74335479736328, 38.581703186035156, 44.4200439453125, 50.258392333984375, 56.096736907958984, 61.935081481933594, 67.77342224121094, 73.61177062988281, 79.45011138916016, 85.28845977783203, 91.12680053710938, 96.96514892578125, 102.80349731445312, 108.64183807373047, 114.48018646240234, 120.31853485107422, 126.15687561035156, 131.99522399902344, 137.8335723876953, 143.67190551757812, 149.51025390625, 155.34860229492188, 161.18695068359375, 167.02529907226562, 172.8636474609375, 178.7019805908203, 184.5403289794922, 190.37867736816406, 196.21702575683594, 202.05535888671875, 207.89370727539062]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 7.0, 13.0, 8.0, 17.0, 18.0, 14.0, 14.0, 15.0, 36.0, 23.0, 31.0, 33.0, 42.0, 27.0, 37.0, 61.0, 44.0, 48.0, 59.0, 39.0, 48.0, 46.0, 42.0, 31.0, 36.0, 26.0, 26.0, 21.0, 21.0, 23.0, 14.0, 8.0, 8.0, 10.0, 8.0, 9.0, 9.0, 5.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.928466796875, -86.89380645751953, -83.85914611816406, -80.8244857788086, -77.78982543945312, -74.75516510009766, -71.72050476074219, -68.68584442138672, -65.65118408203125, -62.61652374267578, -59.58186340332031, -56.547203063964844, -53.512542724609375, -50.477882385253906, -47.44322204589844, -44.40856170654297, -41.373905181884766, -38.3392448425293, -35.30458450317383, -32.26992416381836, -29.23526382446289, -26.200603485107422, -23.165945053100586, -20.131284713745117, -17.09662437438965, -14.06196403503418, -11.027303695678711, -7.992644309997559, -4.95798397064209, -1.923323631286621, 1.1113357543945312, 4.14599609375, 7.180656433105469, 10.215316772460938, 13.249977111816406, 16.284637451171875, 19.319297790527344, 22.353958129882812, 25.38861656188965, 28.423276901245117, 31.457937240600586, 34.49259567260742, 37.52725601196289, 40.56191635131836, 43.59657669067383, 46.6312370300293, 49.665897369384766, 52.700557708740234, 55.7352180480957, 58.76987838745117, 61.80453872680664, 64.83919525146484, 67.87385559082031, 70.90851593017578, 73.94317626953125, 76.97783660888672, 80.01249694824219, 83.04715728759766, 86.08181762695312, 89.1164779663086, 92.15113830566406, 95.18579864501953, 98.220458984375, 101.25511932373047, 104.28977966308594]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 6.0, 7.0, 9.0, 16.0, 23.0, 32.0, 41.0, 59.0, 77.0, 141.0, 210.0, 358.0, 592.0, 998.0, 1724.0, 3194.0, 6415.0, 14281.0, 36363.0, 120781.0, 807056.0, 2760203.0, 326489.0, 70209.0, 24095.0, 10104.0, 4705.0, 2523.0, 1371.0, 788.0, 488.0, 311.0, 191.0, 119.0, 86.0, 59.0, 38.0, 32.0, 20.0, 13.0, 6.0, 15.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-9.390625, -9.0806884765625, -8.770751953125, -8.4608154296875, -8.15087890625, -7.8409423828125, -7.531005859375, -7.2210693359375, -6.9111328125, -6.6011962890625, -6.291259765625, -5.9813232421875, -5.67138671875, -5.3614501953125, -5.051513671875, -4.7415771484375, -4.431640625, -4.1217041015625, -3.811767578125, -3.5018310546875, -3.19189453125, -2.8819580078125, -2.572021484375, -2.2620849609375, -1.9521484375, -1.6422119140625, -1.332275390625, -1.0223388671875, -0.71240234375, -0.4024658203125, -0.092529296875, 0.2174072265625, 0.52734375, 0.8372802734375, 1.147216796875, 1.4571533203125, 1.76708984375, 2.0770263671875, 2.386962890625, 2.6968994140625, 3.0068359375, 3.3167724609375, 3.626708984375, 3.9366455078125, 4.24658203125, 4.5565185546875, 4.866455078125, 5.1763916015625, 5.486328125, 5.7962646484375, 6.106201171875, 6.4161376953125, 6.72607421875, 7.0360107421875, 7.345947265625, 7.6558837890625, 7.9658203125, 8.2757568359375, 8.585693359375, 8.8956298828125, 9.20556640625, 9.5155029296875, 9.825439453125, 10.1353759765625, 10.4453125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 12.0, 7.0, 8.0, 10.0, 20.0, 22.0, 23.0, 27.0, 31.0, 49.0, 56.0, 44.0, 52.0, 58.0, 62.0, 62.0, 69.0, 47.0, 56.0, 42.0, 35.0, 36.0, 32.0, 24.0, 29.0, 15.0, 15.0, 8.0, 10.0, 4.0, 8.0, 9.0, 7.0, 0.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.88671875, -5.6990966796875, -5.511474609375, -5.3238525390625, -5.13623046875, -4.9486083984375, -4.760986328125, -4.5733642578125, -4.3857421875, -4.1981201171875, -4.010498046875, -3.8228759765625, -3.63525390625, -3.4476318359375, -3.260009765625, -3.0723876953125, -2.884765625, -2.6971435546875, -2.509521484375, -2.3218994140625, -2.13427734375, -1.9466552734375, -1.759033203125, -1.5714111328125, -1.3837890625, -1.1961669921875, -1.008544921875, -0.8209228515625, -0.63330078125, -0.4456787109375, -0.258056640625, -0.0704345703125, 0.1171875, 0.3048095703125, 0.492431640625, 0.6800537109375, 0.86767578125, 1.0552978515625, 1.242919921875, 1.4305419921875, 1.6181640625, 1.8057861328125, 1.993408203125, 2.1810302734375, 2.36865234375, 2.5562744140625, 2.743896484375, 2.9315185546875, 3.119140625, 3.3067626953125, 3.494384765625, 3.6820068359375, 3.86962890625, 4.0572509765625, 4.244873046875, 4.4324951171875, 4.6201171875, 4.8077392578125, 4.995361328125, 5.1829833984375, 5.37060546875, 5.5582275390625, 5.745849609375, 5.9334716796875, 6.12109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 7.0, 8.0, 8.0, 15.0, 17.0, 44.0, 53.0, 90.0, 190.0, 421.0, 1279.0, 4323.0, 18795.0, 142568.0, 3637602.0, 346968.0, 32064.0, 6854.0, 1888.0, 591.0, 237.0, 99.0, 64.0, 38.0, 15.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1875, -18.517578125, -17.84765625, -17.177734375, -16.5078125, -15.837890625, -15.16796875, -14.498046875, -13.828125, -13.158203125, -12.48828125, -11.818359375, -11.1484375, -10.478515625, -9.80859375, -9.138671875, -8.46875, -7.798828125, -7.12890625, -6.458984375, -5.7890625, -5.119140625, -4.44921875, -3.779296875, -3.109375, -2.439453125, -1.76953125, -1.099609375, -0.4296875, 0.240234375, 0.91015625, 1.580078125, 2.25, 2.919921875, 3.58984375, 4.259765625, 4.9296875, 5.599609375, 6.26953125, 6.939453125, 7.609375, 8.279296875, 8.94921875, 9.619140625, 10.2890625, 10.958984375, 11.62890625, 12.298828125, 12.96875, 13.638671875, 14.30859375, 14.978515625, 15.6484375, 16.318359375, 16.98828125, 17.658203125, 18.328125, 18.998046875, 19.66796875, 20.337890625, 21.0078125, 21.677734375, 22.34765625, 23.017578125, 23.6875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 5.0, 15.0, 13.0, 12.0, 27.0, 29.0, 52.0, 72.0, 123.0, 203.0, 354.0, 658.0, 875.0, 596.0, 342.0, 200.0, 141.0, 90.0, 46.0, 49.0, 29.0, 25.0, 22.0, 11.0, 13.0, 12.0, 6.0, 3.0, 9.0, 7.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-13.953125, -13.5479736328125, -13.142822265625, -12.7376708984375, -12.33251953125, -11.9273681640625, -11.522216796875, -11.1170654296875, -10.7119140625, -10.3067626953125, -9.901611328125, -9.4964599609375, -9.09130859375, -8.6861572265625, -8.281005859375, -7.8758544921875, -7.470703125, -7.0655517578125, -6.660400390625, -6.2552490234375, -5.85009765625, -5.4449462890625, -5.039794921875, -4.6346435546875, -4.2294921875, -3.8243408203125, -3.419189453125, -3.0140380859375, -2.60888671875, -2.2037353515625, -1.798583984375, -1.3934326171875, -0.98828125, -0.5831298828125, -0.177978515625, 0.2271728515625, 0.63232421875, 1.0374755859375, 1.442626953125, 1.8477783203125, 2.2529296875, 2.6580810546875, 3.063232421875, 3.4683837890625, 3.87353515625, 4.2786865234375, 4.683837890625, 5.0889892578125, 5.494140625, 5.8992919921875, 6.304443359375, 6.7095947265625, 7.11474609375, 7.5198974609375, 7.925048828125, 8.3302001953125, 8.7353515625, 9.1405029296875, 9.545654296875, 9.9508056640625, 10.35595703125, 10.7611083984375, 11.166259765625, 11.5714111328125, 11.9765625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 23.0, 86.0, 251.0, 318.0, 187.0, 79.0, 24.0, 14.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.29956817626953, -98.4058609008789, -89.51216125488281, -80.61845397949219, -71.72474670410156, -62.83104705810547, -53.937339782714844, -45.043636322021484, -36.149932861328125, -27.256229400634766, -18.362524032592773, -9.468818664550781, -0.5751152038574219, 8.318588256835938, 17.212295532226562, 26.105998992919922, 34.99970245361328, 43.89340591430664, 52.787109375, 61.680816650390625, 70.57452392578125, 79.46822357177734, 88.36193084716797, 97.25563049316406, 106.14933776855469, 115.04304504394531, 123.9367446899414, 132.8304443359375, 141.72415161132812, 150.61785888671875, 159.51156616210938, 168.4052734375, 177.29898071289062, 186.19268798828125, 195.08639526367188, 203.9801025390625, 212.87379455566406, 221.7675018310547, 230.6612091064453, 239.55491638183594, 248.4486083984375, 257.3423156738281, 266.23602294921875, 275.1297302246094, 284.0234375, 292.9171142578125, 301.81085205078125, 310.70452880859375, 319.5982666015625, 328.4919738769531, 337.38568115234375, 346.2793884277344, 355.173095703125, 364.0667724609375, 372.96051025390625, 381.85418701171875, 390.7478942871094, 399.6416015625, 408.5353088378906, 417.42901611328125, 426.3227233886719, 435.2164306640625, 444.110107421875, 453.0038146972656, 461.89752197265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 7.0, 2.0, 9.0, 15.0, 30.0, 24.0, 29.0, 29.0, 45.0, 44.0, 43.0, 42.0, 53.0, 43.0, 65.0, 54.0, 57.0, 58.0, 48.0, 46.0, 48.0, 34.0, 36.0, 29.0, 18.0, 17.0, 16.0, 20.0, 8.0, 7.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.30931091308594, -65.72479248046875, -63.14027404785156, -60.555755615234375, -57.97124099731445, -55.386722564697266, -52.80220413208008, -50.217689514160156, -47.63317108154297, -45.04865264892578, -42.464134216308594, -39.879615783691406, -37.295101165771484, -34.7105827331543, -32.12606430053711, -29.541547775268555, -26.957027435302734, -24.372509002685547, -21.787992477416992, -19.203474044799805, -16.61895751953125, -14.034439086914062, -11.449920654296875, -8.86540412902832, -6.280885696411133, -3.6963679790496826, -1.1118502616882324, 1.4726676940917969, 4.057185173034668, 6.641702651977539, 9.226221084594727, 11.810737609863281, 14.395256042480469, 16.979774475097656, 19.56429100036621, 22.1488094329834, 24.733325958251953, 27.31784439086914, 29.902362823486328, 32.48687744140625, 35.07139587402344, 37.655914306640625, 40.24043273925781, 42.824951171875, 45.40946578979492, 47.99398422241211, 50.5785026550293, 53.16301727294922, 55.74753952026367, 58.33205795288086, 60.91657638549805, 63.50109100341797, 66.08560943603516, 68.67012786865234, 71.25464630126953, 73.83916473388672, 76.4236831665039, 79.0082015991211, 81.59272003173828, 84.17723846435547, 86.76175689697266, 89.34626770019531, 91.9307861328125, 94.51530456542969, 97.09982299804688]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 8.0, 8.0, 19.0, 25.0, 26.0, 33.0, 75.0, 129.0, 174.0, 277.0, 428.0, 704.0, 998.0, 1930.0, 3369.0, 6166.0, 12047.0, 24929.0, 52666.0, 121172.0, 296287.0, 299336.0, 123068.0, 53084.0, 24996.0, 12180.0, 6215.0, 3347.0, 1846.0, 1122.0, 701.0, 416.0, 276.0, 164.0, 114.0, 64.0, 41.0, 32.0, 33.0, 8.0, 14.0, 11.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.765625, -9.428955078125, -9.09228515625, -8.755615234375, -8.4189453125, -8.082275390625, -7.74560546875, -7.408935546875, -7.072265625, -6.735595703125, -6.39892578125, -6.062255859375, -5.7255859375, -5.388916015625, -5.05224609375, -4.715576171875, -4.37890625, -4.042236328125, -3.70556640625, -3.368896484375, -3.0322265625, -2.695556640625, -2.35888671875, -2.022216796875, -1.685546875, -1.348876953125, -1.01220703125, -0.675537109375, -0.3388671875, -0.002197265625, 0.33447265625, 0.671142578125, 1.0078125, 1.344482421875, 1.68115234375, 2.017822265625, 2.3544921875, 2.691162109375, 3.02783203125, 3.364501953125, 3.701171875, 4.037841796875, 4.37451171875, 4.711181640625, 5.0478515625, 5.384521484375, 5.72119140625, 6.057861328125, 6.39453125, 6.731201171875, 7.06787109375, 7.404541015625, 7.7412109375, 8.077880859375, 8.41455078125, 8.751220703125, 9.087890625, 9.424560546875, 9.76123046875, 10.097900390625, 10.4345703125, 10.771240234375, 11.10791015625, 11.444580078125, 11.78125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 2.0, 2.0, 14.0, 6.0, 11.0, 19.0, 17.0, 25.0, 32.0, 30.0, 31.0, 39.0, 54.0, 43.0, 46.0, 46.0, 53.0, 53.0, 37.0, 47.0, 51.0, 44.0, 31.0, 55.0, 23.0, 36.0, 22.0, 21.0, 25.0, 20.0, 10.0, 5.0, 11.0, 9.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.828125, -4.65985107421875, -4.4915771484375, -4.32330322265625, -4.155029296875, -3.98675537109375, -3.8184814453125, -3.65020751953125, -3.48193359375, -3.31365966796875, -3.1453857421875, -2.97711181640625, -2.808837890625, -2.64056396484375, -2.4722900390625, -2.30401611328125, -2.1357421875, -1.96746826171875, -1.7991943359375, -1.63092041015625, -1.462646484375, -1.29437255859375, -1.1260986328125, -0.95782470703125, -0.78955078125, -0.62127685546875, -0.4530029296875, -0.28472900390625, -0.116455078125, 0.05181884765625, 0.2200927734375, 0.38836669921875, 0.556640625, 0.72491455078125, 0.8931884765625, 1.06146240234375, 1.229736328125, 1.39801025390625, 1.5662841796875, 1.73455810546875, 1.90283203125, 2.07110595703125, 2.2393798828125, 2.40765380859375, 2.575927734375, 2.74420166015625, 2.9124755859375, 3.08074951171875, 3.2490234375, 3.41729736328125, 3.5855712890625, 3.75384521484375, 3.922119140625, 4.09039306640625, 4.2586669921875, 4.42694091796875, 4.59521484375, 4.76348876953125, 4.9317626953125, 5.10003662109375, 5.268310546875, 5.43658447265625, 5.6048583984375, 5.77313232421875, 5.94140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 9.0, 8.0, 11.0, 12.0, 28.0, 36.0, 57.0, 64.0, 108.0, 185.0, 351.0, 688.0, 1750.0, 8350.0, 168364.0, 837132.0, 25841.0, 3349.0, 1076.0, 476.0, 239.0, 165.0, 71.0, 50.0, 30.0, 31.0, 19.0, 14.0, 7.0, 5.0, 9.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-43.0625, -41.68359375, -40.3046875, -38.92578125, -37.546875, -36.16796875, -34.7890625, -33.41015625, -32.03125, -30.65234375, -29.2734375, -27.89453125, -26.515625, -25.13671875, -23.7578125, -22.37890625, -21.0, -19.62109375, -18.2421875, -16.86328125, -15.484375, -14.10546875, -12.7265625, -11.34765625, -9.96875, -8.58984375, -7.2109375, -5.83203125, -4.453125, -3.07421875, -1.6953125, -0.31640625, 1.0625, 2.44140625, 3.8203125, 5.19921875, 6.578125, 7.95703125, 9.3359375, 10.71484375, 12.09375, 13.47265625, 14.8515625, 16.23046875, 17.609375, 18.98828125, 20.3671875, 21.74609375, 23.125, 24.50390625, 25.8828125, 27.26171875, 28.640625, 30.01953125, 31.3984375, 32.77734375, 34.15625, 35.53515625, 36.9140625, 38.29296875, 39.671875, 41.05078125, 42.4296875, 43.80859375, 45.1875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 1.0, 7.0, 8.0, 11.0, 15.0, 12.0, 16.0, 18.0, 25.0, 25.0, 23.0, 39.0, 32.0, 51.0, 50.0, 63.0, 58.0, 58.0, 63.0, 71.0, 48.0, 49.0, 47.0, 38.0, 25.0, 30.0, 25.0, 20.0, 8.0, 12.0, 15.0, 8.0, 1.0, 8.0, 0.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-24.09375, -23.235107421875, -22.37646484375, -21.517822265625, -20.6591796875, -19.800537109375, -18.94189453125, -18.083251953125, -17.224609375, -16.365966796875, -15.50732421875, -14.648681640625, -13.7900390625, -12.931396484375, -12.07275390625, -11.214111328125, -10.35546875, -9.496826171875, -8.63818359375, -7.779541015625, -6.9208984375, -6.062255859375, -5.20361328125, -4.344970703125, -3.486328125, -2.627685546875, -1.76904296875, -0.910400390625, -0.0517578125, 0.806884765625, 1.66552734375, 2.524169921875, 3.3828125, 4.241455078125, 5.10009765625, 5.958740234375, 6.8173828125, 7.676025390625, 8.53466796875, 9.393310546875, 10.251953125, 11.110595703125, 11.96923828125, 12.827880859375, 13.6865234375, 14.545166015625, 15.40380859375, 16.262451171875, 17.12109375, 17.979736328125, 18.83837890625, 19.697021484375, 20.5556640625, 21.414306640625, 22.27294921875, 23.131591796875, 23.990234375, 24.848876953125, 25.70751953125, 26.566162109375, 27.4248046875, 28.283447265625, 29.14208984375, 30.000732421875, 30.859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 14.0, 14.0, 15.0, 29.0, 33.0, 45.0, 69.0, 109.0, 197.0, 387.0, 917.0, 2615.0, 13813.0, 205774.0, 780736.0, 36310.0, 4888.0, 1325.0, 535.0, 276.0, 126.0, 108.0, 54.0, 36.0, 26.0, 21.0, 21.0, 9.0, 5.0, 3.0, 6.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.1875, -12.7509765625, -12.314453125, -11.8779296875, -11.44140625, -11.0048828125, -10.568359375, -10.1318359375, -9.6953125, -9.2587890625, -8.822265625, -8.3857421875, -7.94921875, -7.5126953125, -7.076171875, -6.6396484375, -6.203125, -5.7666015625, -5.330078125, -4.8935546875, -4.45703125, -4.0205078125, -3.583984375, -3.1474609375, -2.7109375, -2.2744140625, -1.837890625, -1.4013671875, -0.96484375, -0.5283203125, -0.091796875, 0.3447265625, 0.78125, 1.2177734375, 1.654296875, 2.0908203125, 2.52734375, 2.9638671875, 3.400390625, 3.8369140625, 4.2734375, 4.7099609375, 5.146484375, 5.5830078125, 6.01953125, 6.4560546875, 6.892578125, 7.3291015625, 7.765625, 8.2021484375, 8.638671875, 9.0751953125, 9.51171875, 9.9482421875, 10.384765625, 10.8212890625, 11.2578125, 11.6943359375, 12.130859375, 12.5673828125, 13.00390625, 13.4404296875, 13.876953125, 14.3134765625, 14.75]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 12.0, 12.0, 15.0, 23.0, 23.0, 31.0, 55.0, 95.0, 136.0, 183.0, 125.0, 80.0, 59.0, 28.0, 35.0, 20.0, 21.0, 10.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00276947021484375, -0.0026991814374923706, -0.002628892660140991, -0.002558603882789612, -0.0024883151054382324, -0.002418026328086853, -0.0023477375507354736, -0.0022774487733840942, -0.002207159996032715, -0.0021368712186813354, -0.002066582441329956, -0.0019962936639785767, -0.0019260048866271973, -0.0018557161092758179, -0.0017854273319244385, -0.001715138554573059, -0.0016448497772216797, -0.0015745609998703003, -0.001504272222518921, -0.0014339834451675415, -0.0013636946678161621, -0.0012934058904647827, -0.0012231171131134033, -0.001152828335762024, -0.0010825395584106445, -0.0010122507810592651, -0.0009419620037078857, -0.0008716732263565063, -0.000801384449005127, -0.0007310956716537476, -0.0006608068943023682, -0.0005905181169509888, -0.0005202293395996094, -0.00044994056224823, -0.0003796517848968506, -0.0003093630075454712, -0.0002390742301940918, -0.0001687854528427124, -9.849667549133301e-05, -2.8207898139953613e-05, 4.208087921142578e-05, 0.00011236965656280518, 0.00018265843391418457, 0.00025294721126556396, 0.00032323598861694336, 0.00039352476596832275, 0.00046381354331970215, 0.0005341023206710815, 0.0006043910980224609, 0.0006746798753738403, 0.0007449686527252197, 0.0008152574300765991, 0.0008855462074279785, 0.0009558349847793579, 0.0010261237621307373, 0.0010964125394821167, 0.001166701316833496, 0.0012369900941848755, 0.0013072788715362549, 0.0013775676488876343, 0.0014478564262390137, 0.001518145203590393, 0.0015884339809417725, 0.0016587227582931519, 0.0017290115356445312]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 7.0, 8.0, 15.0, 16.0, 9.0, 22.0, 30.0, 33.0, 82.0, 107.0, 147.0, 276.0, 480.0, 1009.0, 2084.0, 6492.0, 35878.0, 579863.0, 384504.0, 28029.0, 5598.0, 1877.0, 809.0, 420.0, 261.0, 150.0, 108.0, 60.0, 39.0, 26.0, 25.0, 18.0, 14.0, 12.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.796875, -10.423828125, -10.05078125, -9.677734375, -9.3046875, -8.931640625, -8.55859375, -8.185546875, -7.8125, -7.439453125, -7.06640625, -6.693359375, -6.3203125, -5.947265625, -5.57421875, -5.201171875, -4.828125, -4.455078125, -4.08203125, -3.708984375, -3.3359375, -2.962890625, -2.58984375, -2.216796875, -1.84375, -1.470703125, -1.09765625, -0.724609375, -0.3515625, 0.021484375, 0.39453125, 0.767578125, 1.140625, 1.513671875, 1.88671875, 2.259765625, 2.6328125, 3.005859375, 3.37890625, 3.751953125, 4.125, 4.498046875, 4.87109375, 5.244140625, 5.6171875, 5.990234375, 6.36328125, 6.736328125, 7.109375, 7.482421875, 7.85546875, 8.228515625, 8.6015625, 8.974609375, 9.34765625, 9.720703125, 10.09375, 10.466796875, 10.83984375, 11.212890625, 11.5859375, 11.958984375, 12.33203125, 12.705078125, 13.078125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 6.0, 7.0, 2.0, 6.0, 4.0, 5.0, 5.0, 17.0, 17.0, 23.0, 21.0, 29.0, 32.0, 42.0, 69.0, 88.0, 101.0, 105.0, 79.0, 80.0, 47.0, 46.0, 42.0, 22.0, 20.0, 21.0, 13.0, 7.0, 7.0, 5.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.51708984375, -8.2685546875, -8.02001953125, -7.771484375, -7.52294921875, -7.2744140625, -7.02587890625, -6.77734375, -6.52880859375, -6.2802734375, -6.03173828125, -5.783203125, -5.53466796875, -5.2861328125, -5.03759765625, -4.7890625, -4.54052734375, -4.2919921875, -4.04345703125, -3.794921875, -3.54638671875, -3.2978515625, -3.04931640625, -2.80078125, -2.55224609375, -2.3037109375, -2.05517578125, -1.806640625, -1.55810546875, -1.3095703125, -1.06103515625, -0.8125, -0.56396484375, -0.3154296875, -0.06689453125, 0.181640625, 0.43017578125, 0.6787109375, 0.92724609375, 1.17578125, 1.42431640625, 1.6728515625, 1.92138671875, 2.169921875, 2.41845703125, 2.6669921875, 2.91552734375, 3.1640625, 3.41259765625, 3.6611328125, 3.90966796875, 4.158203125, 4.40673828125, 4.6552734375, 4.90380859375, 5.15234375, 5.40087890625, 5.6494140625, 5.89794921875, 6.146484375, 6.39501953125, 6.6435546875, 6.89208984375, 7.140625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 21.0, 72.0, 228.0, 357.0, 209.0, 64.0, 23.0, 7.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-225.30621337890625, -214.85260009765625, -204.39898681640625, -193.94537353515625, -183.49176025390625, -173.03814697265625, -162.58453369140625, -152.13092041015625, -141.67730712890625, -131.22369384765625, -120.77008056640625, -110.31646728515625, -99.86285400390625, -89.40924072265625, -78.95561981201172, -68.50200653076172, -58.04838562011719, -47.59477233886719, -37.14115905761719, -26.687541961669922, -16.233928680419922, -5.780315399169922, 4.673301696777344, 15.126914978027344, 25.580528259277344, 36.034141540527344, 46.487754821777344, 56.94137191772461, 67.39498901367188, 77.84860229492188, 88.30221557617188, 98.75582885742188, 109.20944213867188, 119.66305541992188, 130.11666870117188, 140.57028198242188, 151.02389526367188, 161.47750854492188, 171.93112182617188, 182.38473510742188, 192.83834838867188, 203.29196166992188, 213.74557495117188, 224.19918823242188, 234.65280151367188, 245.10641479492188, 255.56002807617188, 266.0136413574219, 276.46728515625, 286.9208984375, 297.37451171875, 307.828125, 318.28173828125, 328.7353515625, 339.18896484375, 349.642578125, 360.09619140625, 370.5498046875, 381.00341796875, 391.45703125, 401.91064453125, 412.3642578125, 422.81787109375, 433.271484375, 443.72509765625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 8.0, 9.0, 9.0, 10.0, 15.0, 18.0, 18.0, 11.0, 23.0, 25.0, 18.0, 36.0, 29.0, 32.0, 35.0, 41.0, 54.0, 56.0, 52.0, 54.0, 57.0, 50.0, 39.0, 37.0, 30.0, 29.0, 25.0, 32.0, 27.0, 26.0, 15.0, 17.0, 17.0, 14.0, 8.0, 13.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-100.84375, -97.78082275390625, -94.7178955078125, -91.65496826171875, -88.592041015625, -85.52912139892578, -82.46619415283203, -79.40326690673828, -76.34033966064453, -73.27741241455078, -70.21448516845703, -67.15155792236328, -64.08863830566406, -61.02570724487305, -57.96278381347656, -54.89985656738281, -51.83692932128906, -48.77400207519531, -45.71107482910156, -42.64815139770508, -39.58522415161133, -36.52229690551758, -33.459373474121094, -30.396446228027344, -27.333518981933594, -24.270591735839844, -21.207666397094727, -18.14474105834961, -15.08181381225586, -12.018887519836426, -8.955961227416992, -5.893035888671875, -2.8301162719726562, 0.23281002044677734, 3.295736312866211, 6.3586626052856445, 9.421588897705078, 12.484515190124512, 15.547441482543945, 18.610366821289062, 21.673294067382812, 24.736221313476562, 27.79914665222168, 30.862071990966797, 33.92499923706055, 36.9879264831543, 40.05084991455078, 43.11377716064453, 46.17670440673828, 49.23963165283203, 52.30255889892578, 55.365482330322266, 58.428409576416016, 61.491336822509766, 64.55426025390625, 67.6171875, 70.68011474609375, 73.7430419921875, 76.80596923828125, 79.868896484375, 82.93182373046875, 85.99474334716797, 89.05767059326172, 92.12059783935547, 95.18352508544922]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 17.0, 33.0, 47.0, 75.0, 134.0, 276.0, 1533.0, 4142497.0, 48625.0, 548.0, 206.0, 109.0, 80.0, 42.0, 12.0, 14.0, 9.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.9375, -85.73828125, -82.5390625, -79.33984375, -76.140625, -72.94140625, -69.7421875, -66.54296875, -63.34375, -60.14453125, -56.9453125, -53.74609375, -50.546875, -47.34765625, -44.1484375, -40.94921875, -37.75, -34.55078125, -31.3515625, -28.15234375, -24.953125, -21.75390625, -18.5546875, -15.35546875, -12.15625, -8.95703125, -5.7578125, -2.55859375, 0.640625, 3.83984375, 7.0390625, 10.23828125, 13.4375, 16.63671875, 19.8359375, 23.03515625, 26.234375, 29.43359375, 32.6328125, 35.83203125, 39.03125, 42.23046875, 45.4296875, 48.62890625, 51.828125, 55.02734375, 58.2265625, 61.42578125, 64.625, 67.82421875, 71.0234375, 74.22265625, 77.421875, 80.62109375, 83.8203125, 87.01953125, 90.21875, 93.41796875, 96.6171875, 99.81640625, 103.015625, 106.21484375, 109.4140625, 112.61328125, 115.8125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 14.0, 6.0, 23.0, 32.0, 27.0, 39.0, 60.0, 61.0, 71.0, 83.0, 75.0, 76.0, 73.0, 79.0, 56.0, 53.0, 40.0, 33.0, 24.0, 23.0, 14.0, 11.0, 8.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.87994384765625, -7.6348876953125, -7.38983154296875, -7.144775390625, -6.89971923828125, -6.6546630859375, -6.40960693359375, -6.16455078125, -5.91949462890625, -5.6744384765625, -5.42938232421875, -5.184326171875, -4.93927001953125, -4.6942138671875, -4.44915771484375, -4.2041015625, -3.95904541015625, -3.7139892578125, -3.46893310546875, -3.223876953125, -2.97882080078125, -2.7337646484375, -2.48870849609375, -2.24365234375, -1.99859619140625, -1.7535400390625, -1.50848388671875, -1.263427734375, -1.01837158203125, -0.7733154296875, -0.52825927734375, -0.283203125, -0.03814697265625, 0.2069091796875, 0.45196533203125, 0.697021484375, 0.94207763671875, 1.1871337890625, 1.43218994140625, 1.67724609375, 1.92230224609375, 2.1673583984375, 2.41241455078125, 2.657470703125, 2.90252685546875, 3.1475830078125, 3.39263916015625, 3.6376953125, 3.88275146484375, 4.1278076171875, 4.37286376953125, 4.617919921875, 4.86297607421875, 5.1080322265625, 5.35308837890625, 5.59814453125, 5.84320068359375, 6.0882568359375, 6.33331298828125, 6.578369140625, 6.82342529296875, 7.0684814453125, 7.31353759765625, 7.55859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 6.0, 8.0, 17.0, 17.0, 18.0, 61.0, 89.0, 187.0, 339.0, 746.0, 1488.0, 3316.0, 7818.0, 20905.0, 78085.0, 738732.0, 3063094.0, 213607.0, 41030.0, 13418.0, 5756.0, 2690.0, 1338.0, 704.0, 396.0, 184.0, 96.0, 52.0, 35.0, 21.0, 8.0, 5.0, 8.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.015625, -10.6517333984375, -10.287841796875, -9.9239501953125, -9.56005859375, -9.1961669921875, -8.832275390625, -8.4683837890625, -8.1044921875, -7.7406005859375, -7.376708984375, -7.0128173828125, -6.64892578125, -6.2850341796875, -5.921142578125, -5.5572509765625, -5.193359375, -4.8294677734375, -4.465576171875, -4.1016845703125, -3.73779296875, -3.3739013671875, -3.010009765625, -2.6461181640625, -2.2822265625, -1.9183349609375, -1.554443359375, -1.1905517578125, -0.82666015625, -0.4627685546875, -0.098876953125, 0.2650146484375, 0.62890625, 0.9927978515625, 1.356689453125, 1.7205810546875, 2.08447265625, 2.4483642578125, 2.812255859375, 3.1761474609375, 3.5400390625, 3.9039306640625, 4.267822265625, 4.6317138671875, 4.99560546875, 5.3594970703125, 5.723388671875, 6.0872802734375, 6.451171875, 6.8150634765625, 7.178955078125, 7.5428466796875, 7.90673828125, 8.2706298828125, 8.634521484375, 8.9984130859375, 9.3623046875, 9.7261962890625, 10.090087890625, 10.4539794921875, 10.81787109375, 11.1817626953125, 11.545654296875, 11.9095458984375, 12.2734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 12.0, 11.0, 15.0, 26.0, 24.0, 37.0, 72.0, 91.0, 142.0, 243.0, 469.0, 799.0, 800.0, 503.0, 292.0, 159.0, 98.0, 67.0, 42.0, 33.0, 24.0, 18.0, 18.0, 13.0, 8.0, 5.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-9.390625, -9.0677490234375, -8.744873046875, -8.4219970703125, -8.09912109375, -7.7762451171875, -7.453369140625, -7.1304931640625, -6.8076171875, -6.4847412109375, -6.161865234375, -5.8389892578125, -5.51611328125, -5.1932373046875, -4.870361328125, -4.5474853515625, -4.224609375, -3.9017333984375, -3.578857421875, -3.2559814453125, -2.93310546875, -2.6102294921875, -2.287353515625, -1.9644775390625, -1.6416015625, -1.3187255859375, -0.995849609375, -0.6729736328125, -0.35009765625, -0.0272216796875, 0.295654296875, 0.6185302734375, 0.94140625, 1.2642822265625, 1.587158203125, 1.9100341796875, 2.23291015625, 2.5557861328125, 2.878662109375, 3.2015380859375, 3.5244140625, 3.8472900390625, 4.170166015625, 4.4930419921875, 4.81591796875, 5.1387939453125, 5.461669921875, 5.7845458984375, 6.107421875, 6.4302978515625, 6.753173828125, 7.0760498046875, 7.39892578125, 7.7218017578125, 8.044677734375, 8.3675537109375, 8.6904296875, 9.0133056640625, 9.336181640625, 9.6590576171875, 9.98193359375, 10.3048095703125, 10.627685546875, 10.9505615234375, 11.2734375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 11.0, 14.0, 20.0, 48.0, 68.0, 133.0, 169.0, 163.0, 130.0, 96.0, 53.0, 27.0, 16.0, 17.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.15904235839844, -59.059532165527344, -55.96002197265625, -52.860511779785156, -49.76100158691406, -46.66149139404297, -43.56197738647461, -40.462467193603516, -37.36295700073242, -34.26344680786133, -31.163936614990234, -28.064424514770508, -24.964914321899414, -21.86540412902832, -18.765892028808594, -15.6663818359375, -12.566871643066406, -9.467361450195312, -6.367850303649902, -3.268339157104492, -0.16882896423339844, 2.9306812286376953, 6.030193328857422, 9.129703521728516, 12.22921371459961, 15.328723907470703, 18.428234100341797, 21.527746200561523, 24.627256393432617, 27.72676658630371, 30.826278686523438, 33.92578887939453, 37.025299072265625, 40.12480926513672, 43.22431945800781, 46.323829650878906, 49.42333984375, 52.522850036621094, 55.62236404418945, 58.72187423706055, 61.82138442993164, 64.9208984375, 68.0204086303711, 71.11991882324219, 74.21942901611328, 77.31893920898438, 80.41844940185547, 83.51795959472656, 86.61746978759766, 89.71697998046875, 92.81649017333984, 95.91600036621094, 99.01551055908203, 102.11502075195312, 105.21453857421875, 108.31404113769531, 111.41355895996094, 114.51306915283203, 117.61257934570312, 120.71208953857422, 123.81159973144531, 126.9111099243164, 130.0106201171875, 133.11013793945312, 136.2096405029297]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 11.0, 9.0, 8.0, 17.0, 25.0, 37.0, 38.0, 32.0, 41.0, 38.0, 41.0, 61.0, 66.0, 68.0, 56.0, 42.0, 51.0, 45.0, 38.0, 39.0, 43.0, 40.0, 26.0, 20.0, 17.0, 19.0, 15.0, 14.0, 10.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.64141082763672, -45.89904022216797, -44.15666961669922, -42.41429901123047, -40.67192840576172, -38.92955780029297, -37.18718338012695, -35.4448127746582, -33.70244216918945, -31.960071563720703, -30.217700958251953, -28.47532844543457, -26.73295783996582, -24.99058723449707, -23.248214721679688, -21.505844116210938, -19.763473510742188, -18.021102905273438, -16.278732299804688, -14.536359786987305, -12.793989181518555, -11.051618576049805, -9.309247016906738, -7.566875457763672, -5.824504852294922, -4.082133769989014, -2.3397626876831055, -0.5973916053771973, 1.144979476928711, 2.887350082397461, 4.629721641540527, 6.372093200683594, 8.114459991455078, 9.856830596923828, 11.599202156066895, 13.341573715209961, 15.083944320678711, 16.82631492614746, 18.568687438964844, 20.311058044433594, 22.053428649902344, 23.795799255371094, 25.538169860839844, 27.280542373657227, 29.022912979125977, 30.765283584594727, 32.50765609741211, 34.25002670288086, 35.99239730834961, 37.73476791381836, 39.47713851928711, 41.21950912475586, 42.961883544921875, 44.704254150390625, 46.446624755859375, 48.188995361328125, 49.931365966796875, 51.673736572265625, 53.416107177734375, 55.158477783203125, 56.900848388671875, 58.643218994140625, 60.38559341430664, 62.12796401977539, 63.87033462524414]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 13.0, 21.0, 30.0, 44.0, 66.0, 126.0, 204.0, 342.0, 646.0, 1353.0, 2779.0, 6186.0, 14034.0, 34194.0, 91336.0, 291574.0, 396674.0, 129155.0, 46125.0, 18544.0, 8131.0, 3516.0, 1657.0, 821.0, 370.0, 251.0, 131.0, 79.0, 58.0, 24.0, 24.0, 14.0, 6.0, 3.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-13.3046875, -12.92626953125, -12.5478515625, -12.16943359375, -11.791015625, -11.41259765625, -11.0341796875, -10.65576171875, -10.27734375, -9.89892578125, -9.5205078125, -9.14208984375, -8.763671875, -8.38525390625, -8.0068359375, -7.62841796875, -7.25, -6.87158203125, -6.4931640625, -6.11474609375, -5.736328125, -5.35791015625, -4.9794921875, -4.60107421875, -4.22265625, -3.84423828125, -3.4658203125, -3.08740234375, -2.708984375, -2.33056640625, -1.9521484375, -1.57373046875, -1.1953125, -0.81689453125, -0.4384765625, -0.06005859375, 0.318359375, 0.69677734375, 1.0751953125, 1.45361328125, 1.83203125, 2.21044921875, 2.5888671875, 2.96728515625, 3.345703125, 3.72412109375, 4.1025390625, 4.48095703125, 4.859375, 5.23779296875, 5.6162109375, 5.99462890625, 6.373046875, 6.75146484375, 7.1298828125, 7.50830078125, 7.88671875, 8.26513671875, 8.6435546875, 9.02197265625, 9.400390625, 9.77880859375, 10.1572265625, 10.53564453125, 10.9140625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 12.0, 9.0, 14.0, 14.0, 16.0, 27.0, 33.0, 41.0, 50.0, 54.0, 50.0, 64.0, 57.0, 78.0, 66.0, 73.0, 58.0, 61.0, 37.0, 43.0, 31.0, 27.0, 19.0, 21.0, 17.0, 12.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0859375, -7.87176513671875, -7.6575927734375, -7.44342041015625, -7.229248046875, -7.01507568359375, -6.8009033203125, -6.58673095703125, -6.37255859375, -6.15838623046875, -5.9442138671875, -5.73004150390625, -5.515869140625, -5.30169677734375, -5.0875244140625, -4.87335205078125, -4.6591796875, -4.44500732421875, -4.2308349609375, -4.01666259765625, -3.802490234375, -3.58831787109375, -3.3741455078125, -3.15997314453125, -2.94580078125, -2.73162841796875, -2.5174560546875, -2.30328369140625, -2.089111328125, -1.87493896484375, -1.6607666015625, -1.44659423828125, -1.232421875, -1.01824951171875, -0.8040771484375, -0.58990478515625, -0.375732421875, -0.16156005859375, 0.0526123046875, 0.26678466796875, 0.48095703125, 0.69512939453125, 0.9093017578125, 1.12347412109375, 1.337646484375, 1.55181884765625, 1.7659912109375, 1.98016357421875, 2.1943359375, 2.40850830078125, 2.6226806640625, 2.83685302734375, 3.051025390625, 3.26519775390625, 3.4793701171875, 3.69354248046875, 3.90771484375, 4.12188720703125, 4.3360595703125, 4.55023193359375, 4.764404296875, 4.97857666015625, 5.1927490234375, 5.40692138671875, 5.62109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 11.0, 16.0, 28.0, 40.0, 59.0, 101.0, 174.0, 305.0, 632.0, 1518.0, 5438.0, 34976.0, 545917.0, 420516.0, 31123.0, 5023.0, 1423.0, 556.0, 274.0, 146.0, 84.0, 60.0, 42.0, 35.0, 17.0, 15.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.234375, -25.413818359375, -24.59326171875, -23.772705078125, -22.9521484375, -22.131591796875, -21.31103515625, -20.490478515625, -19.669921875, -18.849365234375, -18.02880859375, -17.208251953125, -16.3876953125, -15.567138671875, -14.74658203125, -13.926025390625, -13.10546875, -12.284912109375, -11.46435546875, -10.643798828125, -9.8232421875, -9.002685546875, -8.18212890625, -7.361572265625, -6.541015625, -5.720458984375, -4.89990234375, -4.079345703125, -3.2587890625, -2.438232421875, -1.61767578125, -0.797119140625, 0.0234375, 0.843994140625, 1.66455078125, 2.485107421875, 3.3056640625, 4.126220703125, 4.94677734375, 5.767333984375, 6.587890625, 7.408447265625, 8.22900390625, 9.049560546875, 9.8701171875, 10.690673828125, 11.51123046875, 12.331787109375, 13.15234375, 13.972900390625, 14.79345703125, 15.614013671875, 16.4345703125, 17.255126953125, 18.07568359375, 18.896240234375, 19.716796875, 20.537353515625, 21.35791015625, 22.178466796875, 22.9990234375, 23.819580078125, 24.64013671875, 25.460693359375, 26.28125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 9.0, 13.0, 13.0, 15.0, 29.0, 33.0, 30.0, 34.0, 39.0, 49.0, 46.0, 57.0, 51.0, 59.0, 55.0, 60.0, 62.0, 58.0, 28.0, 39.0, 35.0, 26.0, 28.0, 27.0, 10.0, 18.0, 12.0, 12.0, 10.0, 9.0, 5.0, 1.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.109375, -19.44091796875, -18.7724609375, -18.10400390625, -17.435546875, -16.76708984375, -16.0986328125, -15.43017578125, -14.76171875, -14.09326171875, -13.4248046875, -12.75634765625, -12.087890625, -11.41943359375, -10.7509765625, -10.08251953125, -9.4140625, -8.74560546875, -8.0771484375, -7.40869140625, -6.740234375, -6.07177734375, -5.4033203125, -4.73486328125, -4.06640625, -3.39794921875, -2.7294921875, -2.06103515625, -1.392578125, -0.72412109375, -0.0556640625, 0.61279296875, 1.28125, 1.94970703125, 2.6181640625, 3.28662109375, 3.955078125, 4.62353515625, 5.2919921875, 5.96044921875, 6.62890625, 7.29736328125, 7.9658203125, 8.63427734375, 9.302734375, 9.97119140625, 10.6396484375, 11.30810546875, 11.9765625, 12.64501953125, 13.3134765625, 13.98193359375, 14.650390625, 15.31884765625, 15.9873046875, 16.65576171875, 17.32421875, 17.99267578125, 18.6611328125, 19.32958984375, 19.998046875, 20.66650390625, 21.3349609375, 22.00341796875, 22.671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 7.0, 8.0, 14.0, 17.0, 23.0, 45.0, 83.0, 165.0, 330.0, 1036.0, 5303.0, 173858.0, 852774.0, 12304.0, 1694.0, 469.0, 183.0, 89.0, 54.0, 29.0, 19.0, 13.0, 4.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.8125, -23.135498046875, -22.45849609375, -21.781494140625, -21.1044921875, -20.427490234375, -19.75048828125, -19.073486328125, -18.396484375, -17.719482421875, -17.04248046875, -16.365478515625, -15.6884765625, -15.011474609375, -14.33447265625, -13.657470703125, -12.98046875, -12.303466796875, -11.62646484375, -10.949462890625, -10.2724609375, -9.595458984375, -8.91845703125, -8.241455078125, -7.564453125, -6.887451171875, -6.21044921875, -5.533447265625, -4.8564453125, -4.179443359375, -3.50244140625, -2.825439453125, -2.1484375, -1.471435546875, -0.79443359375, -0.117431640625, 0.5595703125, 1.236572265625, 1.91357421875, 2.590576171875, 3.267578125, 3.944580078125, 4.62158203125, 5.298583984375, 5.9755859375, 6.652587890625, 7.32958984375, 8.006591796875, 8.68359375, 9.360595703125, 10.03759765625, 10.714599609375, 11.3916015625, 12.068603515625, 12.74560546875, 13.422607421875, 14.099609375, 14.776611328125, 15.45361328125, 16.130615234375, 16.8076171875, 17.484619140625, 18.16162109375, 18.838623046875, 19.515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 11.0, 5.0, 14.0, 7.0, 11.0, 7.0, 12.0, 19.0, 22.0, 14.0, 40.0, 34.0, 56.0, 64.0, 83.0, 118.0, 112.0, 82.0, 49.0, 48.0, 33.0, 28.0, 35.0, 20.0, 17.0, 7.0, 7.0, 6.0, 7.0, 5.0, 4.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0013256072998046875, -0.0012864917516708374, -0.0012473762035369873, -0.0012082606554031372, -0.0011691451072692871, -0.001130029559135437, -0.001090914011001587, -0.0010517984628677368, -0.0010126829147338867, -0.0009735673666000366, -0.0009344518184661865, -0.0008953362703323364, -0.0008562207221984863, -0.0008171051740646362, -0.0007779896259307861, -0.000738874077796936, -0.0006997585296630859, -0.0006606429815292358, -0.0006215274333953857, -0.0005824118852615356, -0.0005432963371276855, -0.0005041807889938354, -0.00046506524085998535, -0.00042594969272613525, -0.00038683414459228516, -0.00034771859645843506, -0.00030860304832458496, -0.00026948750019073486, -0.00023037195205688477, -0.00019125640392303467, -0.00015214085578918457, -0.00011302530765533447, -7.390975952148438e-05, -3.479421138763428e-05, 4.32133674621582e-06, 4.343688488006592e-05, 8.255243301391602e-05, 0.00012166798114776611, 0.0001607835292816162, 0.0001998990774154663, 0.0002390146255493164, 0.0002781301736831665, 0.0003172457218170166, 0.0003563612699508667, 0.0003954768180847168, 0.0004345923662185669, 0.000473707914352417, 0.0005128234624862671, 0.0005519390106201172, 0.0005910545587539673, 0.0006301701068878174, 0.0006692856550216675, 0.0007084012031555176, 0.0007475167512893677, 0.0007866322994232178, 0.0008257478475570679, 0.000864863395690918, 0.0009039789438247681, 0.0009430944919586182, 0.0009822100400924683, 0.0010213255882263184, 0.0010604411363601685, 0.0010995566844940186, 0.0011386722326278687, 0.0011777877807617188]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 9.0, 17.0, 20.0, 42.0, 74.0, 167.0, 387.0, 1019.0, 4143.0, 47402.0, 914051.0, 73900.0, 5253.0, 1256.0, 404.0, 179.0, 104.0, 39.0, 26.0, 19.0, 9.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7578125, -13.2398681640625, -12.721923828125, -12.2039794921875, -11.68603515625, -11.1680908203125, -10.650146484375, -10.1322021484375, -9.6142578125, -9.0963134765625, -8.578369140625, -8.0604248046875, -7.54248046875, -7.0245361328125, -6.506591796875, -5.9886474609375, -5.470703125, -4.9527587890625, -4.434814453125, -3.9168701171875, -3.39892578125, -2.8809814453125, -2.363037109375, -1.8450927734375, -1.3271484375, -0.8092041015625, -0.291259765625, 0.2266845703125, 0.74462890625, 1.2625732421875, 1.780517578125, 2.2984619140625, 2.81640625, 3.3343505859375, 3.852294921875, 4.3702392578125, 4.88818359375, 5.4061279296875, 5.924072265625, 6.4420166015625, 6.9599609375, 7.4779052734375, 7.995849609375, 8.5137939453125, 9.03173828125, 9.5496826171875, 10.067626953125, 10.5855712890625, 11.103515625, 11.6214599609375, 12.139404296875, 12.6573486328125, 13.17529296875, 13.6932373046875, 14.211181640625, 14.7291259765625, 15.2470703125, 15.7650146484375, 16.282958984375, 16.8009033203125, 17.31884765625, 17.8367919921875, 18.354736328125, 18.8726806640625, 19.390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 12.0, 15.0, 27.0, 32.0, 41.0, 53.0, 73.0, 81.0, 116.0, 116.0, 104.0, 84.0, 74.0, 38.0, 33.0, 28.0, 14.0, 11.0, 7.0, 9.0, 3.0, 9.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7109375, -5.4442138671875, -5.177490234375, -4.9107666015625, -4.64404296875, -4.3773193359375, -4.110595703125, -3.8438720703125, -3.5771484375, -3.3104248046875, -3.043701171875, -2.7769775390625, -2.51025390625, -2.2435302734375, -1.976806640625, -1.7100830078125, -1.443359375, -1.1766357421875, -0.909912109375, -0.6431884765625, -0.37646484375, -0.1097412109375, 0.156982421875, 0.4237060546875, 0.6904296875, 0.9571533203125, 1.223876953125, 1.4906005859375, 1.75732421875, 2.0240478515625, 2.290771484375, 2.5574951171875, 2.82421875, 3.0909423828125, 3.357666015625, 3.6243896484375, 3.89111328125, 4.1578369140625, 4.424560546875, 4.6912841796875, 4.9580078125, 5.2247314453125, 5.491455078125, 5.7581787109375, 6.02490234375, 6.2916259765625, 6.558349609375, 6.8250732421875, 7.091796875, 7.3585205078125, 7.625244140625, 7.8919677734375, 8.15869140625, 8.4254150390625, 8.692138671875, 8.9588623046875, 9.2255859375, 9.4923095703125, 9.759033203125, 10.0257568359375, 10.29248046875, 10.5592041015625, 10.825927734375, 11.0926513671875, 11.359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 12.0, 17.0, 49.0, 104.0, 149.0, 250.0, 207.0, 108.0, 45.0, 26.0, 14.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.82061767578125, -161.58380126953125, -156.3470001220703, -151.1101837158203, -145.8733673095703, -140.63656616210938, -135.39974975585938, -130.16293334960938, -124.9261245727539, -119.68931579589844, -114.45249938964844, -109.21569061279297, -103.9788818359375, -98.7420654296875, -93.50525665283203, -88.26844787597656, -83.03163146972656, -77.7948226928711, -72.5580062866211, -67.32119750976562, -62.08438491821289, -56.847572326660156, -51.61076354980469, -46.37395095825195, -41.13713836669922, -35.900325775146484, -30.663515090942383, -25.42670440673828, -20.189891815185547, -14.953079223632812, -9.716268539428711, -4.479457855224609, 0.757354736328125, 5.994166374206543, 11.230978012084961, 16.467788696289062, 21.704601287841797, 26.94141387939453, 32.17822265625, 37.415035247802734, 42.65184783935547, 47.8886604309082, 53.12547302246094, 58.362281799316406, 63.59909439086914, 68.83590698242188, 74.07271575927734, 79.30952453613281, 84.54634094238281, 89.78314971923828, 95.01996612548828, 100.25677490234375, 105.49359130859375, 110.73040008544922, 115.96720886230469, 121.20402526855469, 126.44083404541016, 131.67764282226562, 136.91445922851562, 142.15127563476562, 147.38807678222656, 152.62489318847656, 157.86170959472656, 163.0985107421875, 168.3353271484375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 7.0, 17.0, 13.0, 18.0, 22.0, 21.0, 35.0, 41.0, 45.0, 43.0, 66.0, 79.0, 79.0, 101.0, 82.0, 57.0, 60.0, 30.0, 47.0, 36.0, 19.0, 21.0, 20.0, 15.0, 9.0, 11.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-160.51768493652344, -156.69285583496094, -152.8680419921875, -149.043212890625, -145.21839904785156, -141.39356994628906, -137.56875610351562, -133.74392700195312, -129.91909790039062, -126.09427642822266, -122.26945495605469, -118.44462585449219, -114.61980438232422, -110.79498291015625, -106.97016143798828, -103.14533996582031, -99.32052612304688, -95.4957046508789, -91.67088317871094, -87.84605407714844, -84.02123260498047, -80.1964111328125, -76.37158966064453, -72.54676818847656, -68.72193908691406, -64.8971176147461, -61.07229232788086, -57.24747085571289, -53.42264938354492, -49.59782409667969, -45.77300262451172, -41.94818115234375, -38.12335968017578, -34.29853820800781, -30.47371482849121, -26.64889144897461, -22.82406997680664, -18.99924659729004, -15.174423217773438, -11.349601745605469, -7.524778366088867, -3.699955701828003, 0.12486696243286133, 3.9496898651123047, 7.77451229095459, 11.599334716796875, 15.424158096313477, 19.248979568481445, 23.073802947998047, 26.89862632751465, 30.723447799682617, 34.54827117919922, 38.37309265136719, 42.197914123535156, 46.02273941040039, 49.84756088256836, 53.672386169433594, 57.49720764160156, 61.3220329284668, 65.1468505859375, 68.9716796875, 72.79650115966797, 76.62132263183594, 80.4461441040039, 84.27096557617188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 26.0, 26.0, 41.0, 99.0, 174.0, 365.0, 1067.0, 3576.0, 24636.0, 1001600.0, 3099298.0, 55508.0, 5590.0, 1374.0, 479.0, 210.0, 85.0, 48.0, 25.0, 16.0, 5.0, 8.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.28125, -19.6083984375, -18.935546875, -18.2626953125, -17.58984375, -16.9169921875, -16.244140625, -15.5712890625, -14.8984375, -14.2255859375, -13.552734375, -12.8798828125, -12.20703125, -11.5341796875, -10.861328125, -10.1884765625, -9.515625, -8.8427734375, -8.169921875, -7.4970703125, -6.82421875, -6.1513671875, -5.478515625, -4.8056640625, -4.1328125, -3.4599609375, -2.787109375, -2.1142578125, -1.44140625, -0.7685546875, -0.095703125, 0.5771484375, 1.25, 1.9228515625, 2.595703125, 3.2685546875, 3.94140625, 4.6142578125, 5.287109375, 5.9599609375, 6.6328125, 7.3056640625, 7.978515625, 8.6513671875, 9.32421875, 9.9970703125, 10.669921875, 11.3427734375, 12.015625, 12.6884765625, 13.361328125, 14.0341796875, 14.70703125, 15.3798828125, 16.052734375, 16.7255859375, 17.3984375, 18.0712890625, 18.744140625, 19.4169921875, 20.08984375, 20.7626953125, 21.435546875, 22.1083984375, 22.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 8.0, 2.0, 8.0, 10.0, 12.0, 13.0, 14.0, 24.0, 25.0, 36.0, 47.0, 51.0, 38.0, 49.0, 50.0, 61.0, 67.0, 72.0, 55.0, 48.0, 58.0, 62.0, 38.0, 27.0, 22.0, 28.0, 24.0, 18.0, 10.0, 7.0, 7.0, 8.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.88671875, -6.71258544921875, -6.5384521484375, -6.36431884765625, -6.190185546875, -6.01605224609375, -5.8419189453125, -5.66778564453125, -5.49365234375, -5.31951904296875, -5.1453857421875, -4.97125244140625, -4.797119140625, -4.62298583984375, -4.4488525390625, -4.27471923828125, -4.1005859375, -3.92645263671875, -3.7523193359375, -3.57818603515625, -3.404052734375, -3.22991943359375, -3.0557861328125, -2.88165283203125, -2.70751953125, -2.53338623046875, -2.3592529296875, -2.18511962890625, -2.010986328125, -1.83685302734375, -1.6627197265625, -1.48858642578125, -1.314453125, -1.14031982421875, -0.9661865234375, -0.79205322265625, -0.617919921875, -0.44378662109375, -0.2696533203125, -0.09552001953125, 0.07861328125, 0.25274658203125, 0.4268798828125, 0.60101318359375, 0.775146484375, 0.94927978515625, 1.1234130859375, 1.29754638671875, 1.4716796875, 1.64581298828125, 1.8199462890625, 1.99407958984375, 2.168212890625, 2.34234619140625, 2.5164794921875, 2.69061279296875, 2.86474609375, 3.03887939453125, 3.2130126953125, 3.38714599609375, 3.561279296875, 3.73541259765625, 3.9095458984375, 4.08367919921875, 4.2578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 10.0, 10.0, 12.0, 15.0, 24.0, 36.0, 45.0, 40.0, 86.0, 157.0, 282.0, 603.0, 1486.0, 3395.0, 9498.0, 30531.0, 128485.0, 1171253.0, 2531952.0, 243601.0, 49212.0, 14454.0, 5039.0, 2094.0, 908.0, 462.0, 239.0, 108.0, 95.0, 40.0, 37.0, 27.0, 15.0, 7.0, 7.0, 1.0, 6.0, 3.0, 2.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0625, -10.73876953125, -10.4150390625, -10.09130859375, -9.767578125, -9.44384765625, -9.1201171875, -8.79638671875, -8.47265625, -8.14892578125, -7.8251953125, -7.50146484375, -7.177734375, -6.85400390625, -6.5302734375, -6.20654296875, -5.8828125, -5.55908203125, -5.2353515625, -4.91162109375, -4.587890625, -4.26416015625, -3.9404296875, -3.61669921875, -3.29296875, -2.96923828125, -2.6455078125, -2.32177734375, -1.998046875, -1.67431640625, -1.3505859375, -1.02685546875, -0.703125, -0.37939453125, -0.0556640625, 0.26806640625, 0.591796875, 0.91552734375, 1.2392578125, 1.56298828125, 1.88671875, 2.21044921875, 2.5341796875, 2.85791015625, 3.181640625, 3.50537109375, 3.8291015625, 4.15283203125, 4.4765625, 4.80029296875, 5.1240234375, 5.44775390625, 5.771484375, 6.09521484375, 6.4189453125, 6.74267578125, 7.06640625, 7.39013671875, 7.7138671875, 8.03759765625, 8.361328125, 8.68505859375, 9.0087890625, 9.33251953125, 9.65625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 5.0, 6.0, 12.0, 7.0, 14.0, 13.0, 21.0, 37.0, 30.0, 34.0, 63.0, 101.0, 151.0, 237.0, 308.0, 421.0, 629.0, 590.0, 462.0, 270.0, 201.0, 117.0, 84.0, 68.0, 40.0, 28.0, 27.0, 27.0, 23.0, 13.0, 5.0, 8.0, 2.0, 7.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1484375, -9.7969970703125, -9.445556640625, -9.0941162109375, -8.74267578125, -8.3912353515625, -8.039794921875, -7.6883544921875, -7.3369140625, -6.9854736328125, -6.634033203125, -6.2825927734375, -5.93115234375, -5.5797119140625, -5.228271484375, -4.8768310546875, -4.525390625, -4.1739501953125, -3.822509765625, -3.4710693359375, -3.11962890625, -2.7681884765625, -2.416748046875, -2.0653076171875, -1.7138671875, -1.3624267578125, -1.010986328125, -0.6595458984375, -0.30810546875, 0.0433349609375, 0.394775390625, 0.7462158203125, 1.09765625, 1.4490966796875, 1.800537109375, 2.1519775390625, 2.50341796875, 2.8548583984375, 3.206298828125, 3.5577392578125, 3.9091796875, 4.2606201171875, 4.612060546875, 4.9635009765625, 5.31494140625, 5.6663818359375, 6.017822265625, 6.3692626953125, 6.720703125, 7.0721435546875, 7.423583984375, 7.7750244140625, 8.12646484375, 8.4779052734375, 8.829345703125, 9.1807861328125, 9.5322265625, 9.8836669921875, 10.235107421875, 10.5865478515625, 10.93798828125, 11.2894287109375, 11.640869140625, 11.9923095703125, 12.34375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 30.0, 114.0, 323.0, 322.0, 141.0, 35.0, 15.0, 7.0, 3.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-246.8511962890625, -238.32566833496094, -229.80014038085938, -221.2746124267578, -212.74908447265625, -204.2235565185547, -195.69802856445312, -187.1724853515625, -178.64697265625, -170.12144470214844, -161.59591674804688, -153.0703887939453, -144.54486083984375, -136.0193328857422, -127.4937973022461, -118.96826934814453, -110.44273376464844, -101.91720581054688, -93.39167785644531, -84.86614990234375, -76.34062194824219, -67.81509399414062, -59.28955841064453, -50.76403045654297, -42.238502502441406, -33.712974548339844, -25.18744468688965, -16.661914825439453, -8.13638687133789, 0.3891410827636719, 8.9146728515625, 17.440200805664062, 25.965728759765625, 34.49125671386719, 43.01678466796875, 51.54231643676758, 60.06784439086914, 68.59336853027344, 77.11890411376953, 85.6444320678711, 94.16996002197266, 102.69548797607422, 111.22101593017578, 119.74655151367188, 128.27207946777344, 136.797607421875, 145.32313537597656, 153.84866333007812, 162.3741912841797, 170.89971923828125, 179.4252471923828, 187.95077514648438, 196.47630310058594, 205.0018310546875, 213.52737426757812, 222.05288696289062, 230.57843017578125, 239.1039581298828, 247.62948608398438, 256.155029296875, 264.6805419921875, 273.2060852050781, 281.7315979003906, 290.25714111328125, 298.78265380859375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 11.0, 4.0, 5.0, 17.0, 11.0, 17.0, 9.0, 17.0, 21.0, 20.0, 30.0, 30.0, 26.0, 37.0, 38.0, 33.0, 45.0, 47.0, 42.0, 49.0, 49.0, 43.0, 54.0, 43.0, 39.0, 44.0, 33.0, 27.0, 36.0, 28.0, 14.0, 18.0, 10.0, 7.0, 15.0, 2.0, 11.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-57.165855407714844, -55.31768035888672, -53.469505310058594, -51.62133026123047, -49.773155212402344, -47.92498016357422, -46.076805114746094, -44.22863006591797, -42.380455017089844, -40.53227996826172, -38.684104919433594, -36.83592987060547, -34.987754821777344, -33.13957977294922, -31.29140281677246, -29.443227767944336, -27.595050811767578, -25.746875762939453, -23.898700714111328, -22.050525665283203, -20.202350616455078, -18.354175567626953, -16.505998611450195, -14.65782356262207, -12.809648513793945, -10.96147346496582, -9.113298416137695, -7.265122413635254, -5.416947364807129, -3.568772315979004, -1.7205963134765625, 0.1275787353515625, 1.9757537841796875, 3.8239290714263916, 5.672104358673096, 7.520279884338379, 9.368454933166504, 11.216629981994629, 13.06480598449707, 14.912981033325195, 16.76115608215332, 18.609331130981445, 20.45750617980957, 22.305683135986328, 24.153858184814453, 26.002033233642578, 27.850208282470703, 29.698383331298828, 31.546558380126953, 33.39473342895508, 35.2429084777832, 37.09108352661133, 38.93925857543945, 40.78743362426758, 42.63561248779297, 44.483787536621094, 46.33196258544922, 48.180137634277344, 50.02831268310547, 51.876487731933594, 53.72466278076172, 55.572837829589844, 57.42101287841797, 59.269187927246094, 61.11736297607422]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 10.0, 6.0, 15.0, 23.0, 29.0, 37.0, 63.0, 93.0, 120.0, 244.0, 376.0, 655.0, 1026.0, 1838.0, 3571.0, 7530.0, 16480.0, 38121.0, 91035.0, 220679.0, 351571.0, 181054.0, 75141.0, 31649.0, 13792.0, 6343.0, 3030.0, 1611.0, 908.0, 543.0, 360.0, 200.0, 132.0, 79.0, 44.0, 40.0, 26.0, 20.0, 15.0, 9.0, 8.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.953125, -9.655029296875, -9.35693359375, -9.058837890625, -8.7607421875, -8.462646484375, -8.16455078125, -7.866455078125, -7.568359375, -7.270263671875, -6.97216796875, -6.674072265625, -6.3759765625, -6.077880859375, -5.77978515625, -5.481689453125, -5.18359375, -4.885498046875, -4.58740234375, -4.289306640625, -3.9912109375, -3.693115234375, -3.39501953125, -3.096923828125, -2.798828125, -2.500732421875, -2.20263671875, -1.904541015625, -1.6064453125, -1.308349609375, -1.01025390625, -0.712158203125, -0.4140625, -0.115966796875, 0.18212890625, 0.480224609375, 0.7783203125, 1.076416015625, 1.37451171875, 1.672607421875, 1.970703125, 2.268798828125, 2.56689453125, 2.864990234375, 3.1630859375, 3.461181640625, 3.75927734375, 4.057373046875, 4.35546875, 4.653564453125, 4.95166015625, 5.249755859375, 5.5478515625, 5.845947265625, 6.14404296875, 6.442138671875, 6.740234375, 7.038330078125, 7.33642578125, 7.634521484375, 7.9326171875, 8.230712890625, 8.52880859375, 8.826904296875, 9.125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 10.0, 10.0, 15.0, 17.0, 20.0, 28.0, 32.0, 38.0, 33.0, 47.0, 56.0, 55.0, 42.0, 61.0, 55.0, 63.0, 62.0, 55.0, 48.0, 50.0, 40.0, 27.0, 29.0, 28.0, 16.0, 20.0, 7.0, 11.0, 8.0, 5.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.6875, -6.5133056640625, -6.339111328125, -6.1649169921875, -5.99072265625, -5.8165283203125, -5.642333984375, -5.4681396484375, -5.2939453125, -5.1197509765625, -4.945556640625, -4.7713623046875, -4.59716796875, -4.4229736328125, -4.248779296875, -4.0745849609375, -3.900390625, -3.7261962890625, -3.552001953125, -3.3778076171875, -3.20361328125, -3.0294189453125, -2.855224609375, -2.6810302734375, -2.5068359375, -2.3326416015625, -2.158447265625, -1.9842529296875, -1.81005859375, -1.6358642578125, -1.461669921875, -1.2874755859375, -1.11328125, -0.9390869140625, -0.764892578125, -0.5906982421875, -0.41650390625, -0.2423095703125, -0.068115234375, 0.1060791015625, 0.2802734375, 0.4544677734375, 0.628662109375, 0.8028564453125, 0.97705078125, 1.1512451171875, 1.325439453125, 1.4996337890625, 1.673828125, 1.8480224609375, 2.022216796875, 2.1964111328125, 2.37060546875, 2.5447998046875, 2.718994140625, 2.8931884765625, 3.0673828125, 3.2415771484375, 3.415771484375, 3.5899658203125, 3.76416015625, 3.9383544921875, 4.112548828125, 4.2867431640625, 4.4609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 14.0, 12.0, 18.0, 26.0, 24.0, 42.0, 77.0, 94.0, 139.0, 241.0, 374.0, 688.0, 1407.0, 3458.0, 15355.0, 238245.0, 744950.0, 34085.0, 5227.0, 1859.0, 866.0, 467.0, 286.0, 207.0, 103.0, 74.0, 53.0, 34.0, 31.0, 19.0, 13.0, 16.0, 6.0, 10.0, 7.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.09375, -26.0966796875, -25.099609375, -24.1025390625, -23.10546875, -22.1083984375, -21.111328125, -20.1142578125, -19.1171875, -18.1201171875, -17.123046875, -16.1259765625, -15.12890625, -14.1318359375, -13.134765625, -12.1376953125, -11.140625, -10.1435546875, -9.146484375, -8.1494140625, -7.15234375, -6.1552734375, -5.158203125, -4.1611328125, -3.1640625, -2.1669921875, -1.169921875, -0.1728515625, 0.82421875, 1.8212890625, 2.818359375, 3.8154296875, 4.8125, 5.8095703125, 6.806640625, 7.8037109375, 8.80078125, 9.7978515625, 10.794921875, 11.7919921875, 12.7890625, 13.7861328125, 14.783203125, 15.7802734375, 16.77734375, 17.7744140625, 18.771484375, 19.7685546875, 20.765625, 21.7626953125, 22.759765625, 23.7568359375, 24.75390625, 25.7509765625, 26.748046875, 27.7451171875, 28.7421875, 29.7392578125, 30.736328125, 31.7333984375, 32.73046875, 33.7275390625, 34.724609375, 35.7216796875, 36.71875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 10.0, 14.0, 14.0, 14.0, 22.0, 13.0, 32.0, 27.0, 34.0, 39.0, 35.0, 47.0, 40.0, 40.0, 51.0, 49.0, 48.0, 48.0, 53.0, 39.0, 44.0, 42.0, 44.0, 26.0, 20.0, 30.0, 24.0, 18.0, 16.0, 15.0, 9.0, 11.0, 6.0, 4.0, 9.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-22.859375, -22.209716796875, -21.56005859375, -20.910400390625, -20.2607421875, -19.611083984375, -18.96142578125, -18.311767578125, -17.662109375, -17.012451171875, -16.36279296875, -15.713134765625, -15.0634765625, -14.413818359375, -13.76416015625, -13.114501953125, -12.46484375, -11.815185546875, -11.16552734375, -10.515869140625, -9.8662109375, -9.216552734375, -8.56689453125, -7.917236328125, -7.267578125, -6.617919921875, -5.96826171875, -5.318603515625, -4.6689453125, -4.019287109375, -3.36962890625, -2.719970703125, -2.0703125, -1.420654296875, -0.77099609375, -0.121337890625, 0.5283203125, 1.177978515625, 1.82763671875, 2.477294921875, 3.126953125, 3.776611328125, 4.42626953125, 5.075927734375, 5.7255859375, 6.375244140625, 7.02490234375, 7.674560546875, 8.32421875, 8.973876953125, 9.62353515625, 10.273193359375, 10.9228515625, 11.572509765625, 12.22216796875, 12.871826171875, 13.521484375, 14.171142578125, 14.82080078125, 15.470458984375, 16.1201171875, 16.769775390625, 17.41943359375, 18.069091796875, 18.71875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 10.0, 11.0, 23.0, 22.0, 31.0, 51.0, 77.0, 149.0, 263.0, 527.0, 1732.0, 7142.0, 56543.0, 784221.0, 176974.0, 16054.0, 2977.0, 923.0, 340.0, 186.0, 98.0, 60.0, 29.0, 17.0, 16.0, 17.0, 9.0, 11.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.21875, -10.9046630859375, -10.590576171875, -10.2764892578125, -9.96240234375, -9.6483154296875, -9.334228515625, -9.0201416015625, -8.7060546875, -8.3919677734375, -8.077880859375, -7.7637939453125, -7.44970703125, -7.1356201171875, -6.821533203125, -6.5074462890625, -6.193359375, -5.8792724609375, -5.565185546875, -5.2510986328125, -4.93701171875, -4.6229248046875, -4.308837890625, -3.9947509765625, -3.6806640625, -3.3665771484375, -3.052490234375, -2.7384033203125, -2.42431640625, -2.1102294921875, -1.796142578125, -1.4820556640625, -1.16796875, -0.8538818359375, -0.539794921875, -0.2257080078125, 0.08837890625, 0.4024658203125, 0.716552734375, 1.0306396484375, 1.3447265625, 1.6588134765625, 1.972900390625, 2.2869873046875, 2.60107421875, 2.9151611328125, 3.229248046875, 3.5433349609375, 3.857421875, 4.1715087890625, 4.485595703125, 4.7996826171875, 5.11376953125, 5.4278564453125, 5.741943359375, 6.0560302734375, 6.3701171875, 6.6842041015625, 6.998291015625, 7.3123779296875, 7.62646484375, 7.9405517578125, 8.254638671875, 8.5687255859375, 8.8828125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 7.0, 13.0, 18.0, 31.0, 33.0, 52.0, 55.0, 98.0, 165.0, 182.0, 79.0, 75.0, 49.0, 23.0, 32.0, 15.0, 16.0, 17.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002140045166015625, -0.0020686984062194824, -0.00199735164642334, -0.0019260048866271973, -0.0018546581268310547, -0.0017833113670349121, -0.0017119646072387695, -0.001640617847442627, -0.0015692710876464844, -0.0014979243278503418, -0.0014265775680541992, -0.0013552308082580566, -0.001283884048461914, -0.0012125372886657715, -0.001141190528869629, -0.0010698437690734863, -0.0009984970092773438, -0.0009271502494812012, -0.0008558034896850586, -0.000784456729888916, -0.0007131099700927734, -0.0006417632102966309, -0.0005704164505004883, -0.0004990696907043457, -0.0004277229309082031, -0.00035637617111206055, -0.00028502941131591797, -0.0002136826515197754, -0.0001423358917236328, -7.098913192749023e-05, 3.5762786865234375e-07, 7.170438766479492e-05, 0.0001430511474609375, 0.00021439790725708008, 0.00028574466705322266, 0.00035709142684936523, 0.0004284381866455078, 0.0004997849464416504, 0.000571131706237793, 0.0006424784660339355, 0.0007138252258300781, 0.0007851719856262207, 0.0008565187454223633, 0.0009278655052185059, 0.0009992122650146484, 0.001070559024810791, 0.0011419057846069336, 0.0012132525444030762, 0.0012845993041992188, 0.0013559460639953613, 0.001427292823791504, 0.0014986395835876465, 0.001569986343383789, 0.0016413331031799316, 0.0017126798629760742, 0.0017840266227722168, 0.0018553733825683594, 0.001926720142364502, 0.0019980669021606445, 0.002069413661956787, 0.0021407604217529297, 0.0022121071815490723, 0.002283453941345215, 0.0023548007011413574, 0.0024261474609375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 7.0, 10.0, 22.0, 25.0, 32.0, 33.0, 73.0, 113.0, 188.0, 363.0, 685.0, 1412.0, 3950.0, 15950.0, 136435.0, 797670.0, 74790.0, 11315.0, 3037.0, 1130.0, 563.0, 283.0, 147.0, 99.0, 57.0, 52.0, 26.0, 19.0, 17.0, 19.0, 6.0, 3.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.5234375, -8.242919921875, -7.96240234375, -7.681884765625, -7.4013671875, -7.120849609375, -6.84033203125, -6.559814453125, -6.279296875, -5.998779296875, -5.71826171875, -5.437744140625, -5.1572265625, -4.876708984375, -4.59619140625, -4.315673828125, -4.03515625, -3.754638671875, -3.47412109375, -3.193603515625, -2.9130859375, -2.632568359375, -2.35205078125, -2.071533203125, -1.791015625, -1.510498046875, -1.22998046875, -0.949462890625, -0.6689453125, -0.388427734375, -0.10791015625, 0.172607421875, 0.453125, 0.733642578125, 1.01416015625, 1.294677734375, 1.5751953125, 1.855712890625, 2.13623046875, 2.416748046875, 2.697265625, 2.977783203125, 3.25830078125, 3.538818359375, 3.8193359375, 4.099853515625, 4.38037109375, 4.660888671875, 4.94140625, 5.221923828125, 5.50244140625, 5.782958984375, 6.0634765625, 6.343994140625, 6.62451171875, 6.905029296875, 7.185546875, 7.466064453125, 7.74658203125, 8.027099609375, 8.3076171875, 8.588134765625, 8.86865234375, 9.149169921875, 9.4296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 6.0, 2.0, 4.0, 6.0, 8.0, 12.0, 10.0, 16.0, 26.0, 22.0, 21.0, 27.0, 37.0, 36.0, 48.0, 54.0, 52.0, 71.0, 77.0, 72.0, 46.0, 54.0, 47.0, 37.0, 42.0, 29.0, 23.0, 15.0, 24.0, 12.0, 8.0, 5.0, 12.0, 7.0, 13.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.5234375, -4.37896728515625, -4.2344970703125, -4.09002685546875, -3.945556640625, -3.80108642578125, -3.6566162109375, -3.51214599609375, -3.36767578125, -3.22320556640625, -3.0787353515625, -2.93426513671875, -2.789794921875, -2.64532470703125, -2.5008544921875, -2.35638427734375, -2.2119140625, -2.06744384765625, -1.9229736328125, -1.77850341796875, -1.634033203125, -1.48956298828125, -1.3450927734375, -1.20062255859375, -1.05615234375, -0.91168212890625, -0.7672119140625, -0.62274169921875, -0.478271484375, -0.33380126953125, -0.1893310546875, -0.04486083984375, 0.099609375, 0.24407958984375, 0.3885498046875, 0.53302001953125, 0.677490234375, 0.82196044921875, 0.9664306640625, 1.11090087890625, 1.25537109375, 1.39984130859375, 1.5443115234375, 1.68878173828125, 1.833251953125, 1.97772216796875, 2.1221923828125, 2.26666259765625, 2.4111328125, 2.55560302734375, 2.7000732421875, 2.84454345703125, 2.989013671875, 3.13348388671875, 3.2779541015625, 3.42242431640625, 3.56689453125, 3.71136474609375, 3.8558349609375, 4.00030517578125, 4.144775390625, 4.28924560546875, 4.4337158203125, 4.57818603515625, 4.72265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 7.0, 13.0, 15.0, 35.0, 79.0, 123.0, 205.0, 244.0, 124.0, 81.0, 37.0, 14.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.18331909179688, -122.13169860839844, -117.08008575439453, -112.0284652709961, -106.97685241699219, -101.92523193359375, -96.87361145019531, -91.8219985961914, -86.7703857421875, -81.71876525878906, -76.66715240478516, -71.61553192138672, -66.56391906738281, -61.512298583984375, -56.4606819152832, -51.40906524658203, -46.357444763183594, -41.30582809448242, -36.25421142578125, -31.202592849731445, -26.150976181030273, -21.0993595123291, -16.047740936279297, -10.996124267578125, -5.944507598876953, -0.892890453338623, 4.158726692199707, 9.210344314575195, 14.261960983276367, 19.31357765197754, 24.365196228027344, 29.416812896728516, 34.46842956542969, 39.52004623413086, 44.57166290283203, 49.62328338623047, 54.674896240234375, 59.72651672363281, 64.77813720703125, 69.82975006103516, 74.88136291503906, 79.9329833984375, 84.9845962524414, 90.03621673583984, 95.08782958984375, 100.13945007324219, 105.19107055664062, 110.24268341064453, 115.29430389404297, 120.3459243774414, 125.39753723144531, 130.44915771484375, 135.5007781982422, 140.55238342285156, 145.60400390625, 150.65562438964844, 155.70724487304688, 160.7588653564453, 165.81048583984375, 170.86209106445312, 175.91371154785156, 180.96533203125, 186.01695251464844, 191.06857299804688, 196.12017822265625]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 15.0, 9.0, 12.0, 8.0, 17.0, 21.0, 26.0, 20.0, 31.0, 54.0, 36.0, 50.0, 58.0, 83.0, 78.0, 91.0, 65.0, 39.0, 33.0, 33.0, 34.0, 27.0, 26.0, 23.0, 25.0, 22.0, 13.0, 12.0, 6.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-77.29074096679688, -74.36323547363281, -71.43572998046875, -68.50822448730469, -65.58071899414062, -62.65321350097656, -59.7257080078125, -56.79820251464844, -53.870697021484375, -50.94319152832031, -48.01568603515625, -45.08818054199219, -42.160675048828125, -39.23316955566406, -36.3056640625, -33.37815856933594, -30.45065689086914, -27.523151397705078, -24.595645904541016, -21.668140411376953, -18.74063491821289, -15.813130378723145, -12.885625839233398, -9.958120346069336, -7.030614852905273, -4.103109359741211, -1.1756043434143066, 1.7519006729125977, 4.67940616607666, 7.606911659240723, 10.534416198730469, 13.461921691894531, 16.389427185058594, 19.316932678222656, 22.24443817138672, 25.17194366455078, 28.099449157714844, 31.026954650878906, 33.95446014404297, 36.88196563720703, 39.809471130371094, 42.736976623535156, 45.66448211669922, 48.59198760986328, 51.519493103027344, 54.446998596191406, 57.37450408935547, 60.30200958251953, 63.22951126098633, 66.15701293945312, 69.08451843261719, 72.01202392578125, 74.93952941894531, 77.86703491210938, 80.79454040527344, 83.7220458984375, 86.64955139160156, 89.57705688476562, 92.50456237792969, 95.43206787109375, 98.35957336425781, 101.28707885742188, 104.21458435058594, 107.14208984375, 110.06959533691406]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 15.0, 19.0, 33.0, 58.0, 80.0, 174.0, 324.0, 647.0, 1454.0, 3814.0, 12065.0, 51723.0, 484646.0, 3132719.0, 439709.0, 49175.0, 11404.0, 3646.0, 1339.0, 574.0, 295.0, 156.0, 82.0, 44.0, 29.0, 19.0, 13.0, 10.0, 5.0, 2.0, 6.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.90087890625, -7.5908203125, -7.28076171875, -6.970703125, -6.66064453125, -6.3505859375, -6.04052734375, -5.73046875, -5.42041015625, -5.1103515625, -4.80029296875, -4.490234375, -4.18017578125, -3.8701171875, -3.56005859375, -3.25, -2.93994140625, -2.6298828125, -2.31982421875, -2.009765625, -1.69970703125, -1.3896484375, -1.07958984375, -0.76953125, -0.45947265625, -0.1494140625, 0.16064453125, 0.470703125, 0.78076171875, 1.0908203125, 1.40087890625, 1.7109375, 2.02099609375, 2.3310546875, 2.64111328125, 2.951171875, 3.26123046875, 3.5712890625, 3.88134765625, 4.19140625, 4.50146484375, 4.8115234375, 5.12158203125, 5.431640625, 5.74169921875, 6.0517578125, 6.36181640625, 6.671875, 6.98193359375, 7.2919921875, 7.60205078125, 7.912109375, 8.22216796875, 8.5322265625, 8.84228515625, 9.15234375, 9.46240234375, 9.7724609375, 10.08251953125, 10.392578125, 10.70263671875, 11.0126953125, 11.32275390625, 11.6328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 9.0, 10.0, 18.0, 24.0, 24.0, 21.0, 34.0, 37.0, 42.0, 61.0, 76.0, 51.0, 57.0, 61.0, 54.0, 60.0, 64.0, 61.0, 46.0, 32.0, 35.0, 20.0, 28.0, 16.0, 14.0, 4.0, 13.0, 11.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -3.97509765625, -3.7900390625, -3.60498046875, -3.419921875, -3.23486328125, -3.0498046875, -2.86474609375, -2.6796875, -2.49462890625, -2.3095703125, -2.12451171875, -1.939453125, -1.75439453125, -1.5693359375, -1.38427734375, -1.19921875, -1.01416015625, -0.8291015625, -0.64404296875, -0.458984375, -0.27392578125, -0.0888671875, 0.09619140625, 0.28125, 0.46630859375, 0.6513671875, 0.83642578125, 1.021484375, 1.20654296875, 1.3916015625, 1.57666015625, 1.76171875, 1.94677734375, 2.1318359375, 2.31689453125, 2.501953125, 2.68701171875, 2.8720703125, 3.05712890625, 3.2421875, 3.42724609375, 3.6123046875, 3.79736328125, 3.982421875, 4.16748046875, 4.3525390625, 4.53759765625, 4.72265625, 4.90771484375, 5.0927734375, 5.27783203125, 5.462890625, 5.64794921875, 5.8330078125, 6.01806640625, 6.203125, 6.38818359375, 6.5732421875, 6.75830078125, 6.943359375, 7.12841796875, 7.3134765625, 7.49853515625, 7.68359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 7.0, 16.0, 38.0, 65.0, 107.0, 231.0, 671.0, 2224.0, 11850.0, 132969.0, 3788168.0, 235660.0, 17740.0, 3082.0, 907.0, 296.0, 132.0, 63.0, 24.0, 8.0, 11.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.421875, -16.766357421875, -16.11083984375, -15.455322265625, -14.7998046875, -14.144287109375, -13.48876953125, -12.833251953125, -12.177734375, -11.522216796875, -10.86669921875, -10.211181640625, -9.5556640625, -8.900146484375, -8.24462890625, -7.589111328125, -6.93359375, -6.278076171875, -5.62255859375, -4.967041015625, -4.3115234375, -3.656005859375, -3.00048828125, -2.344970703125, -1.689453125, -1.033935546875, -0.37841796875, 0.277099609375, 0.9326171875, 1.588134765625, 2.24365234375, 2.899169921875, 3.5546875, 4.210205078125, 4.86572265625, 5.521240234375, 6.1767578125, 6.832275390625, 7.48779296875, 8.143310546875, 8.798828125, 9.454345703125, 10.10986328125, 10.765380859375, 11.4208984375, 12.076416015625, 12.73193359375, 13.387451171875, 14.04296875, 14.698486328125, 15.35400390625, 16.009521484375, 16.6650390625, 17.320556640625, 17.97607421875, 18.631591796875, 19.287109375, 19.942626953125, 20.59814453125, 21.253662109375, 21.9091796875, 22.564697265625, 23.22021484375, 23.875732421875, 24.53125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 13.0, 17.0, 20.0, 36.0, 62.0, 81.0, 123.0, 279.0, 527.0, 962.0, 866.0, 461.0, 224.0, 127.0, 82.0, 59.0, 30.0, 26.0, 23.0, 14.0, 12.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.734375, -17.23974609375, -16.7451171875, -16.25048828125, -15.755859375, -15.26123046875, -14.7666015625, -14.27197265625, -13.77734375, -13.28271484375, -12.7880859375, -12.29345703125, -11.798828125, -11.30419921875, -10.8095703125, -10.31494140625, -9.8203125, -9.32568359375, -8.8310546875, -8.33642578125, -7.841796875, -7.34716796875, -6.8525390625, -6.35791015625, -5.86328125, -5.36865234375, -4.8740234375, -4.37939453125, -3.884765625, -3.39013671875, -2.8955078125, -2.40087890625, -1.90625, -1.41162109375, -0.9169921875, -0.42236328125, 0.072265625, 0.56689453125, 1.0615234375, 1.55615234375, 2.05078125, 2.54541015625, 3.0400390625, 3.53466796875, 4.029296875, 4.52392578125, 5.0185546875, 5.51318359375, 6.0078125, 6.50244140625, 6.9970703125, 7.49169921875, 7.986328125, 8.48095703125, 8.9755859375, 9.47021484375, 9.96484375, 10.45947265625, 10.9541015625, 11.44873046875, 11.943359375, 12.43798828125, 12.9326171875, 13.42724609375, 13.921875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 8.0, 26.0, 82.0, 198.0, 315.0, 224.0, 87.0, 29.0, 14.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.4720458984375, -174.14645385742188, -167.82086181640625, -161.49526977539062, -155.169677734375, -148.84408569335938, -142.51849365234375, -136.19290161132812, -129.8673095703125, -123.54171752929688, -117.21612548828125, -110.89053344726562, -104.56494140625, -98.23934936523438, -91.91375732421875, -85.58816528320312, -79.2625732421875, -72.93698120117188, -66.61138916015625, -60.285797119140625, -53.960205078125, -47.634613037109375, -41.30902099609375, -34.983428955078125, -28.6578369140625, -22.332244873046875, -16.00665283203125, -9.681060791015625, -3.35546875, 2.970123291015625, 9.29571533203125, 15.621307373046875, 21.946914672851562, 28.272506713867188, 34.59809875488281, 40.92369079589844, 47.24928283691406, 53.57487487792969, 59.90046691894531, 66.22605895996094, 72.55165100097656, 78.87724304199219, 85.20283508300781, 91.52842712402344, 97.85401916503906, 104.17961120605469, 110.50520324707031, 116.83079528808594, 123.15638732910156, 129.4819793701172, 135.8075714111328, 142.13316345214844, 148.45875549316406, 154.7843475341797, 161.1099395751953, 167.43553161621094, 173.76112365722656, 180.0867156982422, 186.4123077392578, 192.73789978027344, 199.06349182128906, 205.3890838623047, 211.7146759033203, 218.04026794433594, 224.36585998535156]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 2.0, 6.0, 8.0, 10.0, 16.0, 23.0, 19.0, 25.0, 26.0, 39.0, 26.0, 34.0, 38.0, 52.0, 50.0, 49.0, 67.0, 39.0, 42.0, 54.0, 49.0, 48.0, 50.0, 34.0, 29.0, 24.0, 24.0, 27.0, 15.0, 21.0, 11.0, 6.0, 6.0, 7.0, 4.0, 3.0, 2.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.355377197265625, -60.53413009643555, -58.712886810302734, -56.891639709472656, -55.07039260864258, -53.2491455078125, -51.42790222167969, -49.60665512084961, -47.78540802001953, -45.96416091918945, -44.14291763305664, -42.32167053222656, -40.500423431396484, -38.679176330566406, -36.857933044433594, -35.036685943603516, -33.2154426574707, -31.394197463989258, -29.57295036315918, -27.751705169677734, -25.930458068847656, -24.10921287536621, -22.287967681884766, -20.466720581054688, -18.645475387573242, -16.824230194091797, -15.002983093261719, -13.181737899780273, -11.360491752624512, -9.53924560546875, -7.718000411987305, -5.896754264831543, -4.075504302978516, -2.254258394241333, -0.4330124855041504, 1.3882331848144531, 3.209479331970215, 5.030725479125977, 6.851970672607422, 8.673216819763184, 10.494462966918945, 12.315709114074707, 14.136955261230469, 15.958200454711914, 17.77944564819336, 19.600692749023438, 21.421937942504883, 23.243183135986328, 25.064430236816406, 26.88567543029785, 28.70692253112793, 30.528167724609375, 32.34941482543945, 34.17066192626953, 35.991905212402344, 37.81315231323242, 39.6343994140625, 41.45564651489258, 43.27688980102539, 45.09813690185547, 46.91938400268555, 48.740631103515625, 50.56187438964844, 52.383121490478516, 54.20436477661133]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 4.0, 7.0, 8.0, 17.0, 24.0, 36.0, 57.0, 77.0, 92.0, 190.0, 268.0, 403.0, 724.0, 1280.0, 2298.0, 4203.0, 8083.0, 16293.0, 35068.0, 82466.0, 218229.0, 365207.0, 182493.0, 70507.0, 30319.0, 14310.0, 7268.0, 3697.0, 2020.0, 1124.0, 661.0, 387.0, 248.0, 151.0, 101.0, 70.0, 45.0, 24.0, 13.0, 20.0, 26.0, 8.0, 0.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.948486328125, -7.67822265625, -7.407958984375, -7.1376953125, -6.867431640625, -6.59716796875, -6.326904296875, -6.056640625, -5.786376953125, -5.51611328125, -5.245849609375, -4.9755859375, -4.705322265625, -4.43505859375, -4.164794921875, -3.89453125, -3.624267578125, -3.35400390625, -3.083740234375, -2.8134765625, -2.543212890625, -2.27294921875, -2.002685546875, -1.732421875, -1.462158203125, -1.19189453125, -0.921630859375, -0.6513671875, -0.381103515625, -0.11083984375, 0.159423828125, 0.4296875, 0.699951171875, 0.97021484375, 1.240478515625, 1.5107421875, 1.781005859375, 2.05126953125, 2.321533203125, 2.591796875, 2.862060546875, 3.13232421875, 3.402587890625, 3.6728515625, 3.943115234375, 4.21337890625, 4.483642578125, 4.75390625, 5.024169921875, 5.29443359375, 5.564697265625, 5.8349609375, 6.105224609375, 6.37548828125, 6.645751953125, 6.916015625, 7.186279296875, 7.45654296875, 7.726806640625, 7.9970703125, 8.267333984375, 8.53759765625, 8.807861328125, 9.078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 4.0, 6.0, 5.0, 10.0, 5.0, 10.0, 7.0, 15.0, 14.0, 14.0, 29.0, 17.0, 29.0, 20.0, 30.0, 31.0, 45.0, 38.0, 40.0, 46.0, 45.0, 46.0, 53.0, 40.0, 41.0, 45.0, 50.0, 31.0, 37.0, 31.0, 26.0, 17.0, 26.0, 18.0, 21.0, 14.0, 4.0, 7.0, 9.0, 6.0, 8.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.953125, -3.8155517578125, -3.677978515625, -3.5404052734375, -3.40283203125, -3.2652587890625, -3.127685546875, -2.9901123046875, -2.8525390625, -2.7149658203125, -2.577392578125, -2.4398193359375, -2.30224609375, -2.1646728515625, -2.027099609375, -1.8895263671875, -1.751953125, -1.6143798828125, -1.476806640625, -1.3392333984375, -1.20166015625, -1.0640869140625, -0.926513671875, -0.7889404296875, -0.6513671875, -0.5137939453125, -0.376220703125, -0.2386474609375, -0.10107421875, 0.0364990234375, 0.174072265625, 0.3116455078125, 0.44921875, 0.5867919921875, 0.724365234375, 0.8619384765625, 0.99951171875, 1.1370849609375, 1.274658203125, 1.4122314453125, 1.5498046875, 1.6873779296875, 1.824951171875, 1.9625244140625, 2.10009765625, 2.2376708984375, 2.375244140625, 2.5128173828125, 2.650390625, 2.7879638671875, 2.925537109375, 3.0631103515625, 3.20068359375, 3.3382568359375, 3.475830078125, 3.6134033203125, 3.7509765625, 3.8885498046875, 4.026123046875, 4.1636962890625, 4.30126953125, 4.4388427734375, 4.576416015625, 4.7139892578125, 4.8515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 6.0, 15.0, 15.0, 21.0, 29.0, 58.0, 82.0, 106.0, 178.0, 271.0, 516.0, 971.0, 2150.0, 6679.0, 44688.0, 776216.0, 193468.0, 16181.0, 3687.0, 1408.0, 725.0, 428.0, 204.0, 159.0, 100.0, 58.0, 44.0, 25.0, 16.0, 16.0, 9.0, 9.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.84375, -31.950439453125, -31.05712890625, -30.163818359375, -29.2705078125, -28.377197265625, -27.48388671875, -26.590576171875, -25.697265625, -24.803955078125, -23.91064453125, -23.017333984375, -22.1240234375, -21.230712890625, -20.33740234375, -19.444091796875, -18.55078125, -17.657470703125, -16.76416015625, -15.870849609375, -14.9775390625, -14.084228515625, -13.19091796875, -12.297607421875, -11.404296875, -10.510986328125, -9.61767578125, -8.724365234375, -7.8310546875, -6.937744140625, -6.04443359375, -5.151123046875, -4.2578125, -3.364501953125, -2.47119140625, -1.577880859375, -0.6845703125, 0.208740234375, 1.10205078125, 1.995361328125, 2.888671875, 3.781982421875, 4.67529296875, 5.568603515625, 6.4619140625, 7.355224609375, 8.24853515625, 9.141845703125, 10.03515625, 10.928466796875, 11.82177734375, 12.715087890625, 13.6083984375, 14.501708984375, 15.39501953125, 16.288330078125, 17.181640625, 18.074951171875, 18.96826171875, 19.861572265625, 20.7548828125, 21.648193359375, 22.54150390625, 23.434814453125, 24.328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 12.0, 10.0, 15.0, 29.0, 28.0, 38.0, 35.0, 38.0, 46.0, 57.0, 68.0, 54.0, 69.0, 71.0, 59.0, 50.0, 43.0, 42.0, 52.0, 42.0, 20.0, 27.0, 17.0, 21.0, 13.0, 13.0, 11.0, 4.0, 7.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.673828125, -17.92578125, -17.177734375, -16.4296875, -15.681640625, -14.93359375, -14.185546875, -13.4375, -12.689453125, -11.94140625, -11.193359375, -10.4453125, -9.697265625, -8.94921875, -8.201171875, -7.453125, -6.705078125, -5.95703125, -5.208984375, -4.4609375, -3.712890625, -2.96484375, -2.216796875, -1.46875, -0.720703125, 0.02734375, 0.775390625, 1.5234375, 2.271484375, 3.01953125, 3.767578125, 4.515625, 5.263671875, 6.01171875, 6.759765625, 7.5078125, 8.255859375, 9.00390625, 9.751953125, 10.5, 11.248046875, 11.99609375, 12.744140625, 13.4921875, 14.240234375, 14.98828125, 15.736328125, 16.484375, 17.232421875, 17.98046875, 18.728515625, 19.4765625, 20.224609375, 20.97265625, 21.720703125, 22.46875, 23.216796875, 23.96484375, 24.712890625, 25.4609375, 26.208984375, 26.95703125, 27.705078125, 28.453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 7.0, 11.0, 8.0, 14.0, 17.0, 11.0, 18.0, 37.0, 54.0, 92.0, 155.0, 374.0, 1013.0, 3885.0, 28594.0, 742841.0, 252117.0, 15242.0, 2585.0, 797.0, 269.0, 167.0, 78.0, 46.0, 28.0, 25.0, 16.0, 7.0, 8.0, 9.0, 3.0, 4.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8203125, -10.4580078125, -10.095703125, -9.7333984375, -9.37109375, -9.0087890625, -8.646484375, -8.2841796875, -7.921875, -7.5595703125, -7.197265625, -6.8349609375, -6.47265625, -6.1103515625, -5.748046875, -5.3857421875, -5.0234375, -4.6611328125, -4.298828125, -3.9365234375, -3.57421875, -3.2119140625, -2.849609375, -2.4873046875, -2.125, -1.7626953125, -1.400390625, -1.0380859375, -0.67578125, -0.3134765625, 0.048828125, 0.4111328125, 0.7734375, 1.1357421875, 1.498046875, 1.8603515625, 2.22265625, 2.5849609375, 2.947265625, 3.3095703125, 3.671875, 4.0341796875, 4.396484375, 4.7587890625, 5.12109375, 5.4833984375, 5.845703125, 6.2080078125, 6.5703125, 6.9326171875, 7.294921875, 7.6572265625, 8.01953125, 8.3818359375, 8.744140625, 9.1064453125, 9.46875, 9.8310546875, 10.193359375, 10.5556640625, 10.91796875, 11.2802734375, 11.642578125, 12.0048828125, 12.3671875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 6.0, 9.0, 7.0, 11.0, 18.0, 14.0, 12.0, 17.0, 26.0, 27.0, 38.0, 61.0, 87.0, 134.0, 117.0, 104.0, 66.0, 50.0, 36.0, 34.0, 22.0, 14.0, 23.0, 11.0, 14.0, 6.0, 10.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00121307373046875, -0.001171410083770752, -0.001129746437072754, -0.0010880827903747559, -0.0010464191436767578, -0.0010047554969787598, -0.0009630918502807617, -0.0009214282035827637, -0.0008797645568847656, -0.0008381009101867676, -0.0007964372634887695, -0.0007547736167907715, -0.0007131099700927734, -0.0006714463233947754, -0.0006297826766967773, -0.0005881190299987793, -0.0005464553833007812, -0.0005047917366027832, -0.00046312808990478516, -0.0004214644432067871, -0.00037980079650878906, -0.000338137149810791, -0.00029647350311279297, -0.0002548098564147949, -0.00021314620971679688, -0.00017148256301879883, -0.00012981891632080078, -8.815526962280273e-05, -4.649162292480469e-05, -4.827976226806641e-06, 3.6835670471191406e-05, 7.849931716918945e-05, 0.0001201629638671875, 0.00016182661056518555, 0.0002034902572631836, 0.00024515390396118164, 0.0002868175506591797, 0.00032848119735717773, 0.0003701448440551758, 0.00041180849075317383, 0.0004534721374511719, 0.0004951357841491699, 0.000536799430847168, 0.000578463077545166, 0.0006201267242431641, 0.0006617903709411621, 0.0007034540176391602, 0.0007451176643371582, 0.0007867813110351562, 0.0008284449577331543, 0.0008701086044311523, 0.0009117722511291504, 0.0009534358978271484, 0.0009950995445251465, 0.0010367631912231445, 0.0010784268379211426, 0.0011200904846191406, 0.0011617541313171387, 0.0012034177780151367, 0.0012450814247131348, 0.0012867450714111328, 0.0013284087181091309, 0.001370072364807129, 0.001411736011505127, 0.001453399658203125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 17.0, 16.0, 21.0, 46.0, 56.0, 98.0, 161.0, 306.0, 522.0, 1017.0, 2680.0, 9627.0, 65954.0, 790962.0, 153977.0, 16450.0, 3839.0, 1331.0, 634.0, 331.0, 178.0, 135.0, 62.0, 43.0, 34.0, 15.0, 16.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2890625, -8.0352783203125, -7.781494140625, -7.5277099609375, -7.27392578125, -7.0201416015625, -6.766357421875, -6.5125732421875, -6.2587890625, -6.0050048828125, -5.751220703125, -5.4974365234375, -5.24365234375, -4.9898681640625, -4.736083984375, -4.4822998046875, -4.228515625, -3.9747314453125, -3.720947265625, -3.4671630859375, -3.21337890625, -2.9595947265625, -2.705810546875, -2.4520263671875, -2.1982421875, -1.9444580078125, -1.690673828125, -1.4368896484375, -1.18310546875, -0.9293212890625, -0.675537109375, -0.4217529296875, -0.16796875, 0.0858154296875, 0.339599609375, 0.5933837890625, 0.84716796875, 1.1009521484375, 1.354736328125, 1.6085205078125, 1.8623046875, 2.1160888671875, 2.369873046875, 2.6236572265625, 2.87744140625, 3.1312255859375, 3.385009765625, 3.6387939453125, 3.892578125, 4.1463623046875, 4.400146484375, 4.6539306640625, 4.90771484375, 5.1614990234375, 5.415283203125, 5.6690673828125, 5.9228515625, 6.1766357421875, 6.430419921875, 6.6842041015625, 6.93798828125, 7.1917724609375, 7.445556640625, 7.6993408203125, 7.953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 7.0, 11.0, 14.0, 14.0, 24.0, 24.0, 30.0, 38.0, 49.0, 57.0, 82.0, 102.0, 93.0, 94.0, 73.0, 55.0, 54.0, 35.0, 25.0, 32.0, 17.0, 13.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.57421875, -5.402587890625, -5.23095703125, -5.059326171875, -4.8876953125, -4.716064453125, -4.54443359375, -4.372802734375, -4.201171875, -4.029541015625, -3.85791015625, -3.686279296875, -3.5146484375, -3.343017578125, -3.17138671875, -2.999755859375, -2.828125, -2.656494140625, -2.48486328125, -2.313232421875, -2.1416015625, -1.969970703125, -1.79833984375, -1.626708984375, -1.455078125, -1.283447265625, -1.11181640625, -0.940185546875, -0.7685546875, -0.596923828125, -0.42529296875, -0.253662109375, -0.08203125, 0.089599609375, 0.26123046875, 0.432861328125, 0.6044921875, 0.776123046875, 0.94775390625, 1.119384765625, 1.291015625, 1.462646484375, 1.63427734375, 1.805908203125, 1.9775390625, 2.149169921875, 2.32080078125, 2.492431640625, 2.6640625, 2.835693359375, 3.00732421875, 3.178955078125, 3.3505859375, 3.522216796875, 3.69384765625, 3.865478515625, 4.037109375, 4.208740234375, 4.38037109375, 4.552001953125, 4.7236328125, 4.895263671875, 5.06689453125, 5.238525390625, 5.41015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 7.0, 14.0, 27.0, 78.0, 142.0, 314.0, 203.0, 101.0, 49.0, 27.0, 8.0, 8.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.22621154785156, -149.6083526611328, -143.99050903320312, -138.37265014648438, -132.75479125976562, -127.1369400024414, -121.51908874511719, -115.90122985839844, -110.28337860107422, -104.66552734375, -99.04766845703125, -93.42981719970703, -87.81196594238281, -82.19410705566406, -76.57625579833984, -70.95840454101562, -65.34054565429688, -59.72269058227539, -54.104835510253906, -48.48698425292969, -42.8691291809082, -37.25127410888672, -31.6334228515625, -26.015567779541016, -20.39771270751953, -14.779858589172363, -9.162004470825195, -3.5441513061523438, 2.0737037658691406, 7.691558837890625, 13.309410095214844, 18.927265167236328, 24.54510498046875, 30.162960052490234, 35.78081512451172, 41.39866638183594, 47.01652145385742, 52.634376525878906, 58.252227783203125, 63.87008285522461, 69.4879379272461, 75.10578918457031, 80.72364807128906, 86.34149932861328, 91.9593505859375, 97.57720947265625, 103.19506072998047, 108.81291198730469, 114.43077087402344, 120.04862213134766, 125.6664810180664, 131.28433227539062, 136.90219116210938, 142.52005004882812, 148.1378936767578, 153.75575256347656, 159.37359619140625, 164.991455078125, 170.6092987060547, 176.22715759277344, 181.8450164794922, 187.46286010742188, 193.08071899414062, 198.69857788085938, 204.31643676757812]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 10.0, 11.0, 22.0, 12.0, 23.0, 30.0, 29.0, 32.0, 20.0, 29.0, 56.0, 59.0, 84.0, 82.0, 80.0, 50.0, 47.0, 42.0, 39.0, 37.0, 33.0, 41.0, 23.0, 17.0, 15.0, 9.0, 12.0, 7.0, 9.0, 11.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0], "bins": [-104.61738586425781, -102.0246810913086, -99.43196868896484, -96.83926391601562, -94.24655151367188, -91.65384674072266, -89.06114196777344, -86.46842956542969, -83.87572479248047, -81.28302001953125, -78.6903076171875, -76.09760284423828, -73.50489807128906, -70.91218566894531, -68.3194808959961, -65.72677612304688, -63.134063720703125, -60.54135513305664, -57.948646545410156, -55.35594177246094, -52.76323318481445, -50.17052459716797, -47.57781982421875, -44.985111236572266, -42.39240264892578, -39.7996940612793, -37.20698547363281, -34.614280700683594, -32.02157211303711, -29.428863525390625, -26.836156845092773, -24.243450164794922, -21.650741577148438, -19.058032989501953, -16.4653263092041, -13.872618675231934, -11.279911041259766, -8.687203407287598, -6.09449577331543, -3.501789093017578, -0.9090805053710938, 1.6836271286010742, 4.276334762573242, 6.86904239654541, 9.461750030517578, 12.054457664489746, 14.647165298461914, 17.239871978759766, 19.83258056640625, 22.425289154052734, 25.017995834350586, 27.610702514648438, 30.203411102294922, 32.796119689941406, 35.388824462890625, 37.98153305053711, 40.574241638183594, 43.16695022583008, 45.75965881347656, 48.35236358642578, 50.945072174072266, 53.53778076171875, 56.13048553466797, 58.72319412231445, 61.31590270996094]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 9.0, 3.0, 16.0, 16.0, 21.0, 30.0, 66.0, 91.0, 145.0, 271.0, 486.0, 1163.0, 2744.0, 8630.0, 42001.0, 742483.0, 3203506.0, 164209.0, 19792.0, 5186.0, 1825.0, 776.0, 368.0, 193.0, 105.0, 53.0, 35.0, 15.0, 14.0, 9.0, 11.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8984375, -11.5408935546875, -11.183349609375, -10.8258056640625, -10.46826171875, -10.1107177734375, -9.753173828125, -9.3956298828125, -9.0380859375, -8.6805419921875, -8.322998046875, -7.9654541015625, -7.60791015625, -7.2503662109375, -6.892822265625, -6.5352783203125, -6.177734375, -5.8201904296875, -5.462646484375, -5.1051025390625, -4.74755859375, -4.3900146484375, -4.032470703125, -3.6749267578125, -3.3173828125, -2.9598388671875, -2.602294921875, -2.2447509765625, -1.88720703125, -1.5296630859375, -1.172119140625, -0.8145751953125, -0.45703125, -0.0994873046875, 0.258056640625, 0.6156005859375, 0.97314453125, 1.3306884765625, 1.688232421875, 2.0457763671875, 2.4033203125, 2.7608642578125, 3.118408203125, 3.4759521484375, 3.83349609375, 4.1910400390625, 4.548583984375, 4.9061279296875, 5.263671875, 5.6212158203125, 5.978759765625, 6.3363037109375, 6.69384765625, 7.0513916015625, 7.408935546875, 7.7664794921875, 8.1240234375, 8.4815673828125, 8.839111328125, 9.1966552734375, 9.55419921875, 9.9117431640625, 10.269287109375, 10.6268310546875, 10.984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 9.0, 9.0, 12.0, 16.0, 8.0, 14.0, 27.0, 26.0, 31.0, 30.0, 37.0, 39.0, 42.0, 61.0, 46.0, 52.0, 59.0, 44.0, 48.0, 45.0, 45.0, 53.0, 37.0, 30.0, 31.0, 30.0, 20.0, 15.0, 14.0, 19.0, 10.0, 9.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -4.14654541015625, -4.0001220703125, -3.85369873046875, -3.707275390625, -3.56085205078125, -3.4144287109375, -3.26800537109375, -3.12158203125, -2.97515869140625, -2.8287353515625, -2.68231201171875, -2.535888671875, -2.38946533203125, -2.2430419921875, -2.09661865234375, -1.9501953125, -1.80377197265625, -1.6573486328125, -1.51092529296875, -1.364501953125, -1.21807861328125, -1.0716552734375, -0.92523193359375, -0.77880859375, -0.63238525390625, -0.4859619140625, -0.33953857421875, -0.193115234375, -0.04669189453125, 0.0997314453125, 0.24615478515625, 0.392578125, 0.53900146484375, 0.6854248046875, 0.83184814453125, 0.978271484375, 1.12469482421875, 1.2711181640625, 1.41754150390625, 1.56396484375, 1.71038818359375, 1.8568115234375, 2.00323486328125, 2.149658203125, 2.29608154296875, 2.4425048828125, 2.58892822265625, 2.7353515625, 2.88177490234375, 3.0281982421875, 3.17462158203125, 3.321044921875, 3.46746826171875, 3.6138916015625, 3.76031494140625, 3.90673828125, 4.05316162109375, 4.1995849609375, 4.34600830078125, 4.492431640625, 4.63885498046875, 4.7852783203125, 4.93170166015625, 5.078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 11.0, 6.0, 33.0, 57.0, 150.0, 342.0, 897.0, 4601.0, 124276.0, 4031977.0, 28044.0, 2685.0, 700.0, 279.0, 115.0, 53.0, 23.0, 16.0, 11.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.40625, -39.26220703125, -38.1181640625, -36.97412109375, -35.830078125, -34.68603515625, -33.5419921875, -32.39794921875, -31.25390625, -30.10986328125, -28.9658203125, -27.82177734375, -26.677734375, -25.53369140625, -24.3896484375, -23.24560546875, -22.1015625, -20.95751953125, -19.8134765625, -18.66943359375, -17.525390625, -16.38134765625, -15.2373046875, -14.09326171875, -12.94921875, -11.80517578125, -10.6611328125, -9.51708984375, -8.373046875, -7.22900390625, -6.0849609375, -4.94091796875, -3.796875, -2.65283203125, -1.5087890625, -0.36474609375, 0.779296875, 1.92333984375, 3.0673828125, 4.21142578125, 5.35546875, 6.49951171875, 7.6435546875, 8.78759765625, 9.931640625, 11.07568359375, 12.2197265625, 13.36376953125, 14.5078125, 15.65185546875, 16.7958984375, 17.93994140625, 19.083984375, 20.22802734375, 21.3720703125, 22.51611328125, 23.66015625, 24.80419921875, 25.9482421875, 27.09228515625, 28.236328125, 29.38037109375, 30.5244140625, 31.66845703125, 32.8125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 10.0, 6.0, 21.0, 51.0, 82.0, 190.0, 920.0, 1822.0, 635.0, 176.0, 83.0, 30.0, 20.0, 11.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.5, -28.615966796875, -27.73193359375, -26.847900390625, -25.9638671875, -25.079833984375, -24.19580078125, -23.311767578125, -22.427734375, -21.543701171875, -20.65966796875, -19.775634765625, -18.8916015625, -18.007568359375, -17.12353515625, -16.239501953125, -15.35546875, -14.471435546875, -13.58740234375, -12.703369140625, -11.8193359375, -10.935302734375, -10.05126953125, -9.167236328125, -8.283203125, -7.399169921875, -6.51513671875, -5.631103515625, -4.7470703125, -3.863037109375, -2.97900390625, -2.094970703125, -1.2109375, -0.326904296875, 0.55712890625, 1.441162109375, 2.3251953125, 3.209228515625, 4.09326171875, 4.977294921875, 5.861328125, 6.745361328125, 7.62939453125, 8.513427734375, 9.3974609375, 10.281494140625, 11.16552734375, 12.049560546875, 12.93359375, 13.817626953125, 14.70166015625, 15.585693359375, 16.4697265625, 17.353759765625, 18.23779296875, 19.121826171875, 20.005859375, 20.889892578125, 21.77392578125, 22.657958984375, 23.5419921875, 24.426025390625, 25.31005859375, 26.194091796875, 27.078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 10.0, 13.0, 25.0, 91.0, 285.0, 344.0, 165.0, 43.0, 12.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.77316284179688, -130.68785095214844, -122.60254669189453, -114.51724243164062, -106.43193054199219, -98.34661865234375, -90.26131439208984, -82.17601013183594, -74.0906982421875, -66.00538635253906, -57.920082092285156, -49.834774017333984, -41.74946594238281, -33.66415786743164, -25.57884979248047, -17.493541717529297, -9.408233642578125, -1.3229255676269531, 6.762382507324219, 14.84769058227539, 22.932998657226562, 31.018306732177734, 39.103614807128906, 47.18892288208008, 55.27423095703125, 63.35953903198242, 71.4448471069336, 79.5301513671875, 87.61546325683594, 95.70077514648438, 103.78607940673828, 111.87138366699219, 119.95672607421875, 128.0420379638672, 136.12734985351562, 144.212646484375, 152.29795837402344, 160.38327026367188, 168.46856689453125, 176.5538787841797, 184.63919067382812, 192.72450256347656, 200.809814453125, 208.89511108398438, 216.9804229736328, 225.06573486328125, 233.15103149414062, 241.23634338378906, 249.3216552734375, 257.4069519042969, 265.4922790527344, 273.57757568359375, 281.66290283203125, 289.7481994628906, 297.83349609375, 305.9188232421875, 314.0041198730469, 322.08941650390625, 330.17474365234375, 338.2600402832031, 346.3453369140625, 354.4306640625, 362.5159606933594, 370.6012878417969, 378.68658447265625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 8.0, 8.0, 17.0, 17.0, 24.0, 39.0, 41.0, 47.0, 46.0, 49.0, 55.0, 67.0, 66.0, 78.0, 56.0, 78.0, 63.0, 46.0, 42.0, 26.0, 32.0, 27.0, 18.0, 16.0, 10.0, 9.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-102.17898559570312, -99.54145812988281, -96.90392303466797, -94.26639556884766, -91.62886810302734, -88.9913330078125, -86.35380554199219, -83.71627807617188, -81.07874298095703, -78.44121551513672, -75.80368041992188, -73.16615295410156, -70.52862548828125, -67.8910903930664, -65.2535629272461, -62.616031646728516, -59.9785041809082, -57.340972900390625, -54.70344543457031, -52.065914154052734, -49.428382873535156, -46.790855407714844, -44.153324127197266, -41.51579284667969, -38.878265380859375, -36.2407341003418, -33.603206634521484, -30.965675354003906, -28.328144073486328, -25.690614700317383, -23.053085327148438, -20.41555404663086, -17.77802276611328, -15.14049243927002, -12.502962112426758, -9.865432739257812, -7.227902412414551, -4.590372085571289, -1.9528427124023438, 0.6846885681152344, 3.3222179412841797, 5.959748268127441, 8.597278594970703, 11.234807968139648, 13.87233829498291, 16.509868621826172, 19.147397994995117, 21.784929275512695, 24.42245864868164, 27.059988021850586, 29.697519302368164, 32.33504867553711, 34.97257995605469, 37.610107421875, 40.24763870239258, 42.885169982910156, 45.52269744873047, 48.16022872924805, 50.79775619506836, 53.43528747558594, 56.072818756103516, 58.710350036621094, 61.347877502441406, 63.985408782958984, 66.62294006347656]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 5.0, 5.0, 15.0, 18.0, 28.0, 44.0, 55.0, 101.0, 164.0, 297.0, 555.0, 984.0, 2089.0, 4274.0, 10290.0, 27474.0, 85241.0, 266090.0, 393718.0, 171970.0, 53431.0, 18260.0, 7083.0, 3051.0, 1533.0, 780.0, 391.0, 224.0, 145.0, 81.0, 58.0, 28.0, 21.0, 19.0, 16.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.640625, -7.37060546875, -7.1005859375, -6.83056640625, -6.560546875, -6.29052734375, -6.0205078125, -5.75048828125, -5.48046875, -5.21044921875, -4.9404296875, -4.67041015625, -4.400390625, -4.13037109375, -3.8603515625, -3.59033203125, -3.3203125, -3.05029296875, -2.7802734375, -2.51025390625, -2.240234375, -1.97021484375, -1.7001953125, -1.43017578125, -1.16015625, -0.89013671875, -0.6201171875, -0.35009765625, -0.080078125, 0.18994140625, 0.4599609375, 0.72998046875, 1.0, 1.27001953125, 1.5400390625, 1.81005859375, 2.080078125, 2.35009765625, 2.6201171875, 2.89013671875, 3.16015625, 3.43017578125, 3.7001953125, 3.97021484375, 4.240234375, 4.51025390625, 4.7802734375, 5.05029296875, 5.3203125, 5.59033203125, 5.8603515625, 6.13037109375, 6.400390625, 6.67041015625, 6.9404296875, 7.21044921875, 7.48046875, 7.75048828125, 8.0205078125, 8.29052734375, 8.560546875, 8.83056640625, 9.1005859375, 9.37060546875, 9.640625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 15.0, 15.0, 16.0, 19.0, 19.0, 36.0, 34.0, 43.0, 48.0, 39.0, 52.0, 57.0, 59.0, 54.0, 77.0, 40.0, 70.0, 47.0, 56.0, 37.0, 33.0, 25.0, 30.0, 16.0, 16.0, 11.0, 7.0, 5.0, 10.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.92578125, -7.7191162109375, -7.512451171875, -7.3057861328125, -7.09912109375, -6.8924560546875, -6.685791015625, -6.4791259765625, -6.2724609375, -6.0657958984375, -5.859130859375, -5.6524658203125, -5.44580078125, -5.2391357421875, -5.032470703125, -4.8258056640625, -4.619140625, -4.4124755859375, -4.205810546875, -3.9991455078125, -3.79248046875, -3.5858154296875, -3.379150390625, -3.1724853515625, -2.9658203125, -2.7591552734375, -2.552490234375, -2.3458251953125, -2.13916015625, -1.9324951171875, -1.725830078125, -1.5191650390625, -1.3125, -1.1058349609375, -0.899169921875, -0.6925048828125, -0.48583984375, -0.2791748046875, -0.072509765625, 0.1341552734375, 0.3408203125, 0.5474853515625, 0.754150390625, 0.9608154296875, 1.16748046875, 1.3741455078125, 1.580810546875, 1.7874755859375, 1.994140625, 2.2008056640625, 2.407470703125, 2.6141357421875, 2.82080078125, 3.0274658203125, 3.234130859375, 3.4407958984375, 3.6474609375, 3.8541259765625, 4.060791015625, 4.2674560546875, 4.47412109375, 4.6807861328125, 4.887451171875, 5.0941162109375, 5.30078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 10.0, 12.0, 17.0, 26.0, 20.0, 30.0, 60.0, 82.0, 137.0, 222.0, 420.0, 800.0, 1996.0, 5767.0, 21730.0, 127983.0, 691780.0, 160577.0, 26117.0, 6490.0, 2193.0, 944.0, 448.0, 259.0, 138.0, 93.0, 51.0, 40.0, 31.0, 23.0, 19.0, 4.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.2734375, -14.7894287109375, -14.305419921875, -13.8214111328125, -13.33740234375, -12.8533935546875, -12.369384765625, -11.8853759765625, -11.4013671875, -10.9173583984375, -10.433349609375, -9.9493408203125, -9.46533203125, -8.9813232421875, -8.497314453125, -8.0133056640625, -7.529296875, -7.0452880859375, -6.561279296875, -6.0772705078125, -5.59326171875, -5.1092529296875, -4.625244140625, -4.1412353515625, -3.6572265625, -3.1732177734375, -2.689208984375, -2.2052001953125, -1.72119140625, -1.2371826171875, -0.753173828125, -0.2691650390625, 0.21484375, 0.6988525390625, 1.182861328125, 1.6668701171875, 2.15087890625, 2.6348876953125, 3.118896484375, 3.6029052734375, 4.0869140625, 4.5709228515625, 5.054931640625, 5.5389404296875, 6.02294921875, 6.5069580078125, 6.990966796875, 7.4749755859375, 7.958984375, 8.4429931640625, 8.927001953125, 9.4110107421875, 9.89501953125, 10.3790283203125, 10.863037109375, 11.3470458984375, 11.8310546875, 12.3150634765625, 12.799072265625, 13.2830810546875, 13.76708984375, 14.2510986328125, 14.735107421875, 15.2191162109375, 15.703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 13.0, 15.0, 8.0, 10.0, 20.0, 25.0, 21.0, 36.0, 39.0, 45.0, 54.0, 54.0, 52.0, 52.0, 65.0, 55.0, 54.0, 49.0, 50.0, 51.0, 37.0, 21.0, 28.0, 26.0, 24.0, 16.0, 16.0, 14.0, 9.0, 6.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.390625, -25.673583984375, -24.95654296875, -24.239501953125, -23.5224609375, -22.805419921875, -22.08837890625, -21.371337890625, -20.654296875, -19.937255859375, -19.22021484375, -18.503173828125, -17.7861328125, -17.069091796875, -16.35205078125, -15.635009765625, -14.91796875, -14.200927734375, -13.48388671875, -12.766845703125, -12.0498046875, -11.332763671875, -10.61572265625, -9.898681640625, -9.181640625, -8.464599609375, -7.74755859375, -7.030517578125, -6.3134765625, -5.596435546875, -4.87939453125, -4.162353515625, -3.4453125, -2.728271484375, -2.01123046875, -1.294189453125, -0.5771484375, 0.139892578125, 0.85693359375, 1.573974609375, 2.291015625, 3.008056640625, 3.72509765625, 4.442138671875, 5.1591796875, 5.876220703125, 6.59326171875, 7.310302734375, 8.02734375, 8.744384765625, 9.46142578125, 10.178466796875, 10.8955078125, 11.612548828125, 12.32958984375, 13.046630859375, 13.763671875, 14.480712890625, 15.19775390625, 15.914794921875, 16.6318359375, 17.348876953125, 18.06591796875, 18.782958984375, 19.5]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 10.0, 9.0, 11.0, 35.0, 33.0, 53.0, 69.0, 101.0, 119.0, 216.0, 301.0, 458.0, 733.0, 1219.0, 2333.0, 5059.0, 12771.0, 43554.0, 239220.0, 632233.0, 75895.0, 19634.0, 7269.0, 3221.0, 1630.0, 875.0, 487.0, 327.0, 209.0, 141.0, 76.0, 66.0, 44.0, 44.0, 29.0, 19.0, 11.0, 11.0, 4.0, 4.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.82952880859375, -4.6746826171875, -4.51983642578125, -4.364990234375, -4.21014404296875, -4.0552978515625, -3.90045166015625, -3.74560546875, -3.59075927734375, -3.4359130859375, -3.28106689453125, -3.126220703125, -2.97137451171875, -2.8165283203125, -2.66168212890625, -2.5068359375, -2.35198974609375, -2.1971435546875, -2.04229736328125, -1.887451171875, -1.73260498046875, -1.5777587890625, -1.42291259765625, -1.26806640625, -1.11322021484375, -0.9583740234375, -0.80352783203125, -0.648681640625, -0.49383544921875, -0.3389892578125, -0.18414306640625, -0.029296875, 0.12554931640625, 0.2803955078125, 0.43524169921875, 0.590087890625, 0.74493408203125, 0.8997802734375, 1.05462646484375, 1.20947265625, 1.36431884765625, 1.5191650390625, 1.67401123046875, 1.828857421875, 1.98370361328125, 2.1385498046875, 2.29339599609375, 2.4482421875, 2.60308837890625, 2.7579345703125, 2.91278076171875, 3.067626953125, 3.22247314453125, 3.3773193359375, 3.53216552734375, 3.68701171875, 3.84185791015625, 3.9967041015625, 4.15155029296875, 4.306396484375, 4.46124267578125, 4.6160888671875, 4.77093505859375, 4.92578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 10.0, 24.0, 27.0, 74.0, 163.0, 330.0, 182.0, 90.0, 41.0, 17.0, 11.0, 5.0, 9.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00299072265625, -0.0029015839099884033, -0.0028124451637268066, -0.00272330641746521, -0.0026341676712036133, -0.0025450289249420166, -0.00245589017868042, -0.0023667514324188232, -0.0022776126861572266, -0.00218847393989563, -0.002099335193634033, -0.0020101964473724365, -0.0019210577011108398, -0.0018319189548492432, -0.0017427802085876465, -0.0016536414623260498, -0.0015645027160644531, -0.0014753639698028564, -0.0013862252235412598, -0.001297086477279663, -0.0012079477310180664, -0.0011188089847564697, -0.001029670238494873, -0.0009405314922332764, -0.0008513927459716797, -0.000762253999710083, -0.0006731152534484863, -0.0005839765071868896, -0.000494837760925293, -0.0004056990146636963, -0.0003165602684020996, -0.00022742152214050293, -0.00013828277587890625, -4.914402961730957e-05, 3.999471664428711e-05, 0.0001291334629058838, 0.00021827220916748047, 0.00030741095542907715, 0.00039654970169067383, 0.0004856884479522705, 0.0005748271942138672, 0.0006639659404754639, 0.0007531046867370605, 0.0008422434329986572, 0.0009313821792602539, 0.0010205209255218506, 0.0011096596717834473, 0.001198798418045044, 0.0012879371643066406, 0.0013770759105682373, 0.001466214656829834, 0.0015553534030914307, 0.0016444921493530273, 0.001733630895614624, 0.0018227696418762207, 0.0019119083881378174, 0.002001047134399414, 0.0020901858806610107, 0.0021793246269226074, 0.002268463373184204, 0.0023576021194458008, 0.0024467408657073975, 0.002535879611968994, 0.002625018358230591, 0.0027141571044921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 8.0, 7.0, 19.0, 24.0, 40.0, 73.0, 143.0, 405.0, 1040.0, 3237.0, 13338.0, 91813.0, 804966.0, 112503.0, 15328.0, 3649.0, 1134.0, 431.0, 170.0, 83.0, 55.0, 25.0, 21.0, 8.0, 7.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.17047119140625, -7.9268798828125, -7.68328857421875, -7.439697265625, -7.19610595703125, -6.9525146484375, -6.70892333984375, -6.46533203125, -6.22174072265625, -5.9781494140625, -5.73455810546875, -5.490966796875, -5.24737548828125, -5.0037841796875, -4.76019287109375, -4.5166015625, -4.27301025390625, -4.0294189453125, -3.78582763671875, -3.542236328125, -3.29864501953125, -3.0550537109375, -2.81146240234375, -2.56787109375, -2.32427978515625, -2.0806884765625, -1.83709716796875, -1.593505859375, -1.34991455078125, -1.1063232421875, -0.86273193359375, -0.619140625, -0.37554931640625, -0.1319580078125, 0.11163330078125, 0.355224609375, 0.59881591796875, 0.8424072265625, 1.08599853515625, 1.32958984375, 1.57318115234375, 1.8167724609375, 2.06036376953125, 2.303955078125, 2.54754638671875, 2.7911376953125, 3.03472900390625, 3.2783203125, 3.52191162109375, 3.7655029296875, 4.00909423828125, 4.252685546875, 4.49627685546875, 4.7398681640625, 4.98345947265625, 5.22705078125, 5.47064208984375, 5.7142333984375, 5.95782470703125, 6.201416015625, 6.44500732421875, 6.6885986328125, 6.93218994140625, 7.17578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 3.0, 9.0, 7.0, 15.0, 14.0, 17.0, 26.0, 38.0, 54.0, 72.0, 98.0, 120.0, 131.0, 100.0, 68.0, 71.0, 32.0, 19.0, 25.0, 21.0, 9.0, 6.0, 6.0, 7.0, 7.0, 10.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-8.3203125, -8.12255859375, -7.9248046875, -7.72705078125, -7.529296875, -7.33154296875, -7.1337890625, -6.93603515625, -6.73828125, -6.54052734375, -6.3427734375, -6.14501953125, -5.947265625, -5.74951171875, -5.5517578125, -5.35400390625, -5.15625, -4.95849609375, -4.7607421875, -4.56298828125, -4.365234375, -4.16748046875, -3.9697265625, -3.77197265625, -3.57421875, -3.37646484375, -3.1787109375, -2.98095703125, -2.783203125, -2.58544921875, -2.3876953125, -2.18994140625, -1.9921875, -1.79443359375, -1.5966796875, -1.39892578125, -1.201171875, -1.00341796875, -0.8056640625, -0.60791015625, -0.41015625, -0.21240234375, -0.0146484375, 0.18310546875, 0.380859375, 0.57861328125, 0.7763671875, 0.97412109375, 1.171875, 1.36962890625, 1.5673828125, 1.76513671875, 1.962890625, 2.16064453125, 2.3583984375, 2.55615234375, 2.75390625, 2.95166015625, 3.1494140625, 3.34716796875, 3.544921875, 3.74267578125, 3.9404296875, 4.13818359375, 4.3359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 15.0, 41.0, 210.0, 482.0, 177.0, 43.0, 20.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-359.50439453125, -351.2229309082031, -342.9414978027344, -334.6600341796875, -326.37860107421875, -318.0971374511719, -309.815673828125, -301.53424072265625, -293.2527770996094, -284.9713134765625, -276.68988037109375, -268.4084167480469, -260.1269836425781, -251.84552001953125, -243.56407165527344, -235.28262329101562, -227.0011749267578, -218.7197265625, -210.4382781982422, -202.15682983398438, -193.8753662109375, -185.5939178466797, -177.31246948242188, -169.03102111816406, -160.74957275390625, -152.46812438964844, -144.18667602539062, -135.90521240234375, -127.62376403808594, -119.34231567382812, -111.06086730957031, -102.7794189453125, -94.49795532226562, -86.21650695800781, -77.93505096435547, -69.65360260009766, -61.37215042114258, -53.0906982421875, -44.80924987792969, -36.52779769897461, -28.24634552001953, -19.964893341064453, -11.683443069458008, -3.4019927978515625, 4.879459381103516, 13.160911560058594, 21.442359924316406, 29.723812103271484, 38.00526428222656, 46.28671646118164, 54.56816864013672, 62.84961700439453, 71.13107299804688, 79.41252136230469, 87.6939697265625, 95.97541809082031, 104.25687408447266, 112.53832244873047, 120.81977844238281, 129.10122680664062, 137.38267517089844, 145.66412353515625, 153.94558715820312, 162.22703552246094, 170.50848388671875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 5.0, 16.0, 19.0, 16.0, 17.0, 26.0, 27.0, 30.0, 44.0, 48.0, 48.0, 80.0, 105.0, 95.0, 89.0, 52.0, 45.0, 44.0, 24.0, 34.0, 23.0, 28.0, 18.0, 14.0, 14.0, 10.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.67813110351562, -73.49794006347656, -70.3177490234375, -67.13755798339844, -63.95736312866211, -60.77717208862305, -57.596981048583984, -54.416786193847656, -51.236595153808594, -48.05640411376953, -44.87621307373047, -41.696022033691406, -38.51582717895508, -35.335636138916016, -32.15544509887695, -28.975252151489258, -25.795063018798828, -22.614871978759766, -19.43467903137207, -16.254487991333008, -13.074295997619629, -9.89410400390625, -6.7139129638671875, -3.533720016479492, -0.3535289764404297, 2.82666277885437, 6.00685453414917, 9.18704605102539, 12.36723804473877, 15.547430038452148, 18.72762107849121, 21.907814025878906, 25.08800506591797, 28.26819610595703, 31.448389053344727, 34.628578186035156, 37.808773040771484, 40.98896408081055, 44.16915512084961, 47.34934997558594, 50.529541015625, 53.70973205566406, 56.889923095703125, 60.07011413574219, 63.250308990478516, 66.43049621582031, 69.61068725585938, 72.79088592529297, 75.9710693359375, 79.15126037597656, 82.33145141601562, 85.51164245605469, 88.69183349609375, 91.87202453613281, 95.05221557617188, 98.23241424560547, 101.41260528564453, 104.5927963256836, 107.77298736572266, 110.95317840576172, 114.13336944580078, 117.31356811523438, 120.49375915527344, 123.6739501953125, 126.85414123535156]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 8.0, 10.0, 17.0, 15.0, 26.0, 36.0, 41.0, 57.0, 99.0, 130.0, 195.0, 256.0, 388.0, 521.0, 896.0, 1578.0, 2946.0, 6910.0, 20706.0, 96255.0, 663163.0, 2493862.0, 758812.0, 109318.0, 22972.0, 7460.0, 3163.0, 1684.0, 947.0, 596.0, 359.0, 252.0, 188.0, 117.0, 75.0, 62.0, 40.0, 31.0, 19.0, 17.0, 11.0, 10.0, 8.0, 3.0, 7.0, 3.0, 7.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.546875, -6.3572998046875, -6.167724609375, -5.9781494140625, -5.78857421875, -5.5989990234375, -5.409423828125, -5.2198486328125, -5.0302734375, -4.8406982421875, -4.651123046875, -4.4615478515625, -4.27197265625, -4.0823974609375, -3.892822265625, -3.7032470703125, -3.513671875, -3.3240966796875, -3.134521484375, -2.9449462890625, -2.75537109375, -2.5657958984375, -2.376220703125, -2.1866455078125, -1.9970703125, -1.8074951171875, -1.617919921875, -1.4283447265625, -1.23876953125, -1.0491943359375, -0.859619140625, -0.6700439453125, -0.48046875, -0.2908935546875, -0.101318359375, 0.0882568359375, 0.27783203125, 0.4674072265625, 0.656982421875, 0.8465576171875, 1.0361328125, 1.2257080078125, 1.415283203125, 1.6048583984375, 1.79443359375, 1.9840087890625, 2.173583984375, 2.3631591796875, 2.552734375, 2.7423095703125, 2.931884765625, 3.1214599609375, 3.31103515625, 3.5006103515625, 3.690185546875, 3.8797607421875, 4.0693359375, 4.2589111328125, 4.448486328125, 4.6380615234375, 4.82763671875, 5.0172119140625, 5.206787109375, 5.3963623046875, 5.5859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 9.0, 3.0, 11.0, 7.0, 10.0, 7.0, 14.0, 16.0, 19.0, 24.0, 34.0, 18.0, 24.0, 33.0, 46.0, 39.0, 40.0, 38.0, 51.0, 52.0, 43.0, 43.0, 40.0, 48.0, 34.0, 34.0, 29.0, 31.0, 32.0, 27.0, 36.0, 15.0, 14.0, 17.0, 10.0, 11.0, 15.0, 11.0, 4.0, 2.0, 6.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.95703125, -4.80810546875, -4.6591796875, -4.51025390625, -4.361328125, -4.21240234375, -4.0634765625, -3.91455078125, -3.765625, -3.61669921875, -3.4677734375, -3.31884765625, -3.169921875, -3.02099609375, -2.8720703125, -2.72314453125, -2.57421875, -2.42529296875, -2.2763671875, -2.12744140625, -1.978515625, -1.82958984375, -1.6806640625, -1.53173828125, -1.3828125, -1.23388671875, -1.0849609375, -0.93603515625, -0.787109375, -0.63818359375, -0.4892578125, -0.34033203125, -0.19140625, -0.04248046875, 0.1064453125, 0.25537109375, 0.404296875, 0.55322265625, 0.7021484375, 0.85107421875, 1.0, 1.14892578125, 1.2978515625, 1.44677734375, 1.595703125, 1.74462890625, 1.8935546875, 2.04248046875, 2.19140625, 2.34033203125, 2.4892578125, 2.63818359375, 2.787109375, 2.93603515625, 3.0849609375, 3.23388671875, 3.3828125, 3.53173828125, 3.6806640625, 3.82958984375, 3.978515625, 4.12744140625, 4.2763671875, 4.42529296875, 4.57421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 19.0, 27.0, 82.0, 254.0, 1078.0, 19614.0, 4142688.0, 28708.0, 1289.0, 326.0, 111.0, 46.0, 23.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.65625, -40.33544921875, -39.0146484375, -37.69384765625, -36.373046875, -35.05224609375, -33.7314453125, -32.41064453125, -31.08984375, -29.76904296875, -28.4482421875, -27.12744140625, -25.806640625, -24.48583984375, -23.1650390625, -21.84423828125, -20.5234375, -19.20263671875, -17.8818359375, -16.56103515625, -15.240234375, -13.91943359375, -12.5986328125, -11.27783203125, -9.95703125, -8.63623046875, -7.3154296875, -5.99462890625, -4.673828125, -3.35302734375, -2.0322265625, -0.71142578125, 0.609375, 1.93017578125, 3.2509765625, 4.57177734375, 5.892578125, 7.21337890625, 8.5341796875, 9.85498046875, 11.17578125, 12.49658203125, 13.8173828125, 15.13818359375, 16.458984375, 17.77978515625, 19.1005859375, 20.42138671875, 21.7421875, 23.06298828125, 24.3837890625, 25.70458984375, 27.025390625, 28.34619140625, 29.6669921875, 30.98779296875, 32.30859375, 33.62939453125, 34.9501953125, 36.27099609375, 37.591796875, 38.91259765625, 40.2333984375, 41.55419921875, 42.875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 3.0, 6.0, 6.0, 11.0, 12.0, 17.0, 34.0, 54.0, 109.0, 203.0, 440.0, 875.0, 1041.0, 590.0, 319.0, 145.0, 81.0, 43.0, 19.0, 26.0, 15.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8984375, -7.4649658203125, -7.031494140625, -6.5980224609375, -6.16455078125, -5.7310791015625, -5.297607421875, -4.8641357421875, -4.4306640625, -3.9971923828125, -3.563720703125, -3.1302490234375, -2.69677734375, -2.2633056640625, -1.829833984375, -1.3963623046875, -0.962890625, -0.5294189453125, -0.095947265625, 0.3375244140625, 0.77099609375, 1.2044677734375, 1.637939453125, 2.0714111328125, 2.5048828125, 2.9383544921875, 3.371826171875, 3.8052978515625, 4.23876953125, 4.6722412109375, 5.105712890625, 5.5391845703125, 5.97265625, 6.4061279296875, 6.839599609375, 7.2730712890625, 7.70654296875, 8.1400146484375, 8.573486328125, 9.0069580078125, 9.4404296875, 9.8739013671875, 10.307373046875, 10.7408447265625, 11.17431640625, 11.6077880859375, 12.041259765625, 12.4747314453125, 12.908203125, 13.3416748046875, 13.775146484375, 14.2086181640625, 14.64208984375, 15.0755615234375, 15.509033203125, 15.9425048828125, 16.3759765625, 16.8094482421875, 17.242919921875, 17.6763916015625, 18.10986328125, 18.5433349609375, 18.976806640625, 19.4102783203125, 19.84375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 12.0, 26.0, 110.0, 333.0, 313.0, 128.0, 48.0, 13.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.99601745605469, -77.53012084960938, -71.06421661376953, -64.59831237792969, -58.132415771484375, -51.6665153503418, -45.20061492919922, -38.73471450805664, -32.26881408691406, -25.802913665771484, -19.337013244628906, -12.871112823486328, -6.40521240234375, 0.060688018798828125, 6.526588439941406, 12.992488861083984, 19.458389282226562, 25.92428970336914, 32.39019012451172, 38.8560905456543, 45.321990966796875, 51.78789138793945, 58.25379180908203, 64.71969604492188, 71.18559265136719, 77.6514892578125, 84.11739349365234, 90.58329772949219, 97.0491943359375, 103.51509094238281, 109.98099517822266, 116.4468994140625, 122.91278076171875, 129.37867736816406, 135.84457397460938, 142.31048583984375, 148.77638244628906, 155.24227905273438, 161.70819091796875, 168.17408752441406, 174.63998413085938, 181.1058807373047, 187.57177734375, 194.03768920898438, 200.5035858154297, 206.969482421875, 213.43539428710938, 219.9012908935547, 226.3671875, 232.8330841064453, 239.29898071289062, 245.764892578125, 252.2307891845703, 258.6966857910156, 265.16259765625, 271.62847900390625, 278.0943908691406, 284.560302734375, 291.02618408203125, 297.4920959472656, 303.9580078125, 310.42388916015625, 316.8898010253906, 323.3556823730469, 329.82159423828125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 6.0, 11.0, 14.0, 15.0, 25.0, 22.0, 33.0, 37.0, 37.0, 45.0, 43.0, 64.0, 66.0, 60.0, 64.0, 46.0, 57.0, 51.0, 49.0, 45.0, 39.0, 48.0, 33.0, 30.0, 10.0, 11.0, 12.0, 12.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-68.43990325927734, -66.47781372070312, -64.5157241821289, -62.55363082885742, -60.5915412902832, -58.629451751708984, -56.6673583984375, -54.70526885986328, -52.74317932128906, -50.781089782714844, -48.819000244140625, -46.85690689086914, -44.89481735229492, -42.9327278137207, -40.97063446044922, -39.008544921875, -37.04645538330078, -35.08436584472656, -33.122276306152344, -31.16018295288086, -29.19809341430664, -27.236003875732422, -25.27391242980957, -23.31182098388672, -21.3497314453125, -19.38764190673828, -17.42555046081543, -15.463459968566895, -13.50136947631836, -11.539278984069824, -9.577188491821289, -7.615097999572754, -5.653011322021484, -3.690920829772949, -1.728830337524414, 0.2332601547241211, 2.1953506469726562, 4.157441139221191, 6.119531631469727, 8.081622123718262, 10.043712615966797, 12.005803108215332, 13.967893600463867, 15.929984092712402, 17.892074584960938, 19.854164123535156, 21.816255569458008, 23.77834701538086, 25.740436553955078, 27.702526092529297, 29.66461753845215, 31.626708984375, 33.58879852294922, 35.55088806152344, 37.512977600097656, 39.47507095336914, 41.43716049194336, 43.39925003051758, 45.36134338378906, 47.32343292236328, 49.2855224609375, 51.24761199951172, 53.20970153808594, 55.17179489135742, 57.13388442993164]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 12.0, 3.0, 8.0, 20.0, 31.0, 28.0, 30.0, 57.0, 103.0, 159.0, 262.0, 418.0, 712.0, 1280.0, 2398.0, 4608.0, 8989.0, 19458.0, 44098.0, 105905.0, 242760.0, 313887.0, 173316.0, 71582.0, 30382.0, 13844.0, 6628.0, 3377.0, 1775.0, 959.0, 600.0, 312.0, 212.0, 120.0, 65.0, 48.0, 37.0, 18.0, 16.0, 12.0, 11.0, 10.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.86328125, -4.68499755859375, -4.5067138671875, -4.32843017578125, -4.150146484375, -3.97186279296875, -3.7935791015625, -3.61529541015625, -3.43701171875, -3.25872802734375, -3.0804443359375, -2.90216064453125, -2.723876953125, -2.54559326171875, -2.3673095703125, -2.18902587890625, -2.0107421875, -1.83245849609375, -1.6541748046875, -1.47589111328125, -1.297607421875, -1.11932373046875, -0.9410400390625, -0.76275634765625, -0.58447265625, -0.40618896484375, -0.2279052734375, -0.04962158203125, 0.128662109375, 0.30694580078125, 0.4852294921875, 0.66351318359375, 0.841796875, 1.02008056640625, 1.1983642578125, 1.37664794921875, 1.554931640625, 1.73321533203125, 1.9114990234375, 2.08978271484375, 2.26806640625, 2.44635009765625, 2.6246337890625, 2.80291748046875, 2.981201171875, 3.15948486328125, 3.3377685546875, 3.51605224609375, 3.6943359375, 3.87261962890625, 4.0509033203125, 4.22918701171875, 4.407470703125, 4.58575439453125, 4.7640380859375, 4.94232177734375, 5.12060546875, 5.29888916015625, 5.4771728515625, 5.65545654296875, 5.833740234375, 6.01202392578125, 6.1903076171875, 6.36859130859375, 6.546875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 9.0, 9.0, 13.0, 11.0, 17.0, 17.0, 12.0, 19.0, 20.0, 18.0, 17.0, 26.0, 26.0, 40.0, 29.0, 34.0, 34.0, 30.0, 38.0, 43.0, 32.0, 41.0, 28.0, 43.0, 30.0, 37.0, 25.0, 27.0, 44.0, 27.0, 26.0, 25.0, 22.0, 10.0, 14.0, 13.0, 15.0, 10.0, 7.0, 14.0, 6.0, 4.0, 8.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.20703125, -4.07733154296875, -3.9476318359375, -3.81793212890625, -3.688232421875, -3.55853271484375, -3.4288330078125, -3.29913330078125, -3.16943359375, -3.03973388671875, -2.9100341796875, -2.78033447265625, -2.650634765625, -2.52093505859375, -2.3912353515625, -2.26153564453125, -2.1318359375, -2.00213623046875, -1.8724365234375, -1.74273681640625, -1.613037109375, -1.48333740234375, -1.3536376953125, -1.22393798828125, -1.09423828125, -0.96453857421875, -0.8348388671875, -0.70513916015625, -0.575439453125, -0.44573974609375, -0.3160400390625, -0.18634033203125, -0.056640625, 0.07305908203125, 0.2027587890625, 0.33245849609375, 0.462158203125, 0.59185791015625, 0.7215576171875, 0.85125732421875, 0.98095703125, 1.11065673828125, 1.2403564453125, 1.37005615234375, 1.499755859375, 1.62945556640625, 1.7591552734375, 1.88885498046875, 2.0185546875, 2.14825439453125, 2.2779541015625, 2.40765380859375, 2.537353515625, 2.66705322265625, 2.7967529296875, 2.92645263671875, 3.05615234375, 3.18585205078125, 3.3155517578125, 3.44525146484375, 3.574951171875, 3.70465087890625, 3.8343505859375, 3.96405029296875, 4.09375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 4.0, 5.0, 13.0, 16.0, 25.0, 38.0, 45.0, 79.0, 107.0, 148.0, 235.0, 386.0, 679.0, 1332.0, 3720.0, 14898.0, 102866.0, 767625.0, 131074.0, 17632.0, 4225.0, 1495.0, 696.0, 411.0, 265.0, 148.0, 96.0, 71.0, 53.0, 42.0, 27.0, 27.0, 21.0, 8.0, 14.0, 7.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.71875, -16.220458984375, -15.72216796875, -15.223876953125, -14.7255859375, -14.227294921875, -13.72900390625, -13.230712890625, -12.732421875, -12.234130859375, -11.73583984375, -11.237548828125, -10.7392578125, -10.240966796875, -9.74267578125, -9.244384765625, -8.74609375, -8.247802734375, -7.74951171875, -7.251220703125, -6.7529296875, -6.254638671875, -5.75634765625, -5.258056640625, -4.759765625, -4.261474609375, -3.76318359375, -3.264892578125, -2.7666015625, -2.268310546875, -1.77001953125, -1.271728515625, -0.7734375, -0.275146484375, 0.22314453125, 0.721435546875, 1.2197265625, 1.718017578125, 2.21630859375, 2.714599609375, 3.212890625, 3.711181640625, 4.20947265625, 4.707763671875, 5.2060546875, 5.704345703125, 6.20263671875, 6.700927734375, 7.19921875, 7.697509765625, 8.19580078125, 8.694091796875, 9.1923828125, 9.690673828125, 10.18896484375, 10.687255859375, 11.185546875, 11.683837890625, 12.18212890625, 12.680419921875, 13.1787109375, 13.677001953125, 14.17529296875, 14.673583984375, 15.171875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 12.0, 18.0, 18.0, 29.0, 25.0, 24.0, 31.0, 48.0, 59.0, 48.0, 59.0, 48.0, 69.0, 67.0, 51.0, 52.0, 54.0, 42.0, 32.0, 33.0, 39.0, 24.0, 22.0, 13.0, 11.0, 15.0, 8.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.296875, -21.594970703125, -20.89306640625, -20.191162109375, -19.4892578125, -18.787353515625, -18.08544921875, -17.383544921875, -16.681640625, -15.979736328125, -15.27783203125, -14.575927734375, -13.8740234375, -13.172119140625, -12.47021484375, -11.768310546875, -11.06640625, -10.364501953125, -9.66259765625, -8.960693359375, -8.2587890625, -7.556884765625, -6.85498046875, -6.153076171875, -5.451171875, -4.749267578125, -4.04736328125, -3.345458984375, -2.6435546875, -1.941650390625, -1.23974609375, -0.537841796875, 0.1640625, 0.865966796875, 1.56787109375, 2.269775390625, 2.9716796875, 3.673583984375, 4.37548828125, 5.077392578125, 5.779296875, 6.481201171875, 7.18310546875, 7.885009765625, 8.5869140625, 9.288818359375, 9.99072265625, 10.692626953125, 11.39453125, 12.096435546875, 12.79833984375, 13.500244140625, 14.2021484375, 14.904052734375, 15.60595703125, 16.307861328125, 17.009765625, 17.711669921875, 18.41357421875, 19.115478515625, 19.8173828125, 20.519287109375, 21.22119140625, 21.923095703125, 22.625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 13.0, 20.0, 25.0, 48.0, 95.0, 246.0, 826.0, 3844.0, 33458.0, 925655.0, 76146.0, 6418.0, 1185.0, 336.0, 114.0, 48.0, 24.0, 17.0, 5.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.1640625, -10.8321533203125, -10.500244140625, -10.1683349609375, -9.83642578125, -9.5045166015625, -9.172607421875, -8.8406982421875, -8.5087890625, -8.1768798828125, -7.844970703125, -7.5130615234375, -7.18115234375, -6.8492431640625, -6.517333984375, -6.1854248046875, -5.853515625, -5.5216064453125, -5.189697265625, -4.8577880859375, -4.52587890625, -4.1939697265625, -3.862060546875, -3.5301513671875, -3.1982421875, -2.8663330078125, -2.534423828125, -2.2025146484375, -1.87060546875, -1.5386962890625, -1.206787109375, -0.8748779296875, -0.54296875, -0.2110595703125, 0.120849609375, 0.4527587890625, 0.78466796875, 1.1165771484375, 1.448486328125, 1.7803955078125, 2.1123046875, 2.4442138671875, 2.776123046875, 3.1080322265625, 3.43994140625, 3.7718505859375, 4.103759765625, 4.4356689453125, 4.767578125, 5.0994873046875, 5.431396484375, 5.7633056640625, 6.09521484375, 6.4271240234375, 6.759033203125, 7.0909423828125, 7.4228515625, 7.7547607421875, 8.086669921875, 8.4185791015625, 8.75048828125, 9.0823974609375, 9.414306640625, 9.7462158203125, 10.078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 12.0, 13.0, 18.0, 23.0, 29.0, 39.0, 64.0, 129.0, 224.0, 182.0, 86.0, 55.0, 29.0, 18.0, 12.0, 15.0, 6.0, 6.0, 4.0, 10.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011968612670898438, -0.0011520981788635254, -0.001107335090637207, -0.0010625720024108887, -0.0010178089141845703, -0.000973045825958252, -0.0009282827377319336, -0.0008835196495056152, -0.0008387565612792969, -0.0007939934730529785, -0.0007492303848266602, -0.0007044672966003418, -0.0006597042083740234, -0.0006149411201477051, -0.0005701780319213867, -0.0005254149436950684, -0.00048065185546875, -0.00043588876724243164, -0.0003911256790161133, -0.0003463625907897949, -0.00030159950256347656, -0.0002568364143371582, -0.00021207332611083984, -0.00016731023788452148, -0.00012254714965820312, -7.778406143188477e-05, -3.3020973205566406e-05, 1.1742115020751953e-05, 5.650520324707031e-05, 0.00010126829147338867, 0.00014603137969970703, 0.0001907944679260254, 0.00023555755615234375, 0.0002803206443786621, 0.00032508373260498047, 0.00036984682083129883, 0.0004146099090576172, 0.00045937299728393555, 0.0005041360855102539, 0.0005488991737365723, 0.0005936622619628906, 0.000638425350189209, 0.0006831884384155273, 0.0007279515266418457, 0.0007727146148681641, 0.0008174777030944824, 0.0008622407913208008, 0.0009070038795471191, 0.0009517669677734375, 0.0009965300559997559, 0.0010412931442260742, 0.0010860562324523926, 0.001130819320678711, 0.0011755824089050293, 0.0012203454971313477, 0.001265108585357666, 0.0013098716735839844, 0.0013546347618103027, 0.001399397850036621, 0.0014441609382629395, 0.0014889240264892578, 0.0015336871147155762, 0.0015784502029418945, 0.0016232132911682129, 0.0016679763793945312]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 9.0, 16.0, 15.0, 48.0, 149.0, 442.0, 2295.0, 96934.0, 941833.0, 5782.0, 693.0, 193.0, 76.0, 29.0, 14.0, 8.0, 4.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.251220703125, -19.65869140625, -19.066162109375, -18.4736328125, -17.881103515625, -17.28857421875, -16.696044921875, -16.103515625, -15.510986328125, -14.91845703125, -14.325927734375, -13.7333984375, -13.140869140625, -12.54833984375, -11.955810546875, -11.36328125, -10.770751953125, -10.17822265625, -9.585693359375, -8.9931640625, -8.400634765625, -7.80810546875, -7.215576171875, -6.623046875, -6.030517578125, -5.43798828125, -4.845458984375, -4.2529296875, -3.660400390625, -3.06787109375, -2.475341796875, -1.8828125, -1.290283203125, -0.69775390625, -0.105224609375, 0.4873046875, 1.079833984375, 1.67236328125, 2.264892578125, 2.857421875, 3.449951171875, 4.04248046875, 4.635009765625, 5.2275390625, 5.820068359375, 6.41259765625, 7.005126953125, 7.59765625, 8.190185546875, 8.78271484375, 9.375244140625, 9.9677734375, 10.560302734375, 11.15283203125, 11.745361328125, 12.337890625, 12.930419921875, 13.52294921875, 14.115478515625, 14.7080078125, 15.300537109375, 15.89306640625, 16.485595703125, 17.078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 7.0, 23.0, 26.0, 80.0, 178.0, 334.0, 183.0, 71.0, 38.0, 15.0, 12.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8125, -12.418212890625, -12.02392578125, -11.629638671875, -11.2353515625, -10.841064453125, -10.44677734375, -10.052490234375, -9.658203125, -9.263916015625, -8.86962890625, -8.475341796875, -8.0810546875, -7.686767578125, -7.29248046875, -6.898193359375, -6.50390625, -6.109619140625, -5.71533203125, -5.321044921875, -4.9267578125, -4.532470703125, -4.13818359375, -3.743896484375, -3.349609375, -2.955322265625, -2.56103515625, -2.166748046875, -1.7724609375, -1.378173828125, -0.98388671875, -0.589599609375, -0.1953125, 0.198974609375, 0.59326171875, 0.987548828125, 1.3818359375, 1.776123046875, 2.17041015625, 2.564697265625, 2.958984375, 3.353271484375, 3.74755859375, 4.141845703125, 4.5361328125, 4.930419921875, 5.32470703125, 5.718994140625, 6.11328125, 6.507568359375, 6.90185546875, 7.296142578125, 7.6904296875, 8.084716796875, 8.47900390625, 8.873291015625, 9.267578125, 9.661865234375, 10.05615234375, 10.450439453125, 10.8447265625, 11.239013671875, 11.63330078125, 12.027587890625, 12.421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 12.0, 15.0, 17.0, 50.0, 87.0, 194.0, 379.0, 150.0, 50.0, 20.0, 10.0, 6.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-178.47137451171875, -174.04998779296875, -169.62860107421875, -165.2071990966797, -160.7858123779297, -156.3644256591797, -151.9430389404297, -147.52163696289062, -143.10025024414062, -138.67886352539062, -134.25747680664062, -129.83607482910156, -125.41468811035156, -120.99330139160156, -116.57191467285156, -112.15052032470703, -107.72913360595703, -103.30774688720703, -98.8863525390625, -94.4649658203125, -90.04357147216797, -85.62218475341797, -81.20079040527344, -76.77940368652344, -72.35801696777344, -67.93663024902344, -63.515235900878906, -59.093849182128906, -54.672454833984375, -50.251068115234375, -45.82967758178711, -41.408287048339844, -36.98689270019531, -32.56550216674805, -28.14411163330078, -23.72272300720215, -19.301332473754883, -14.879941940307617, -10.458553314208984, -6.037162780761719, -1.6157722473144531, 2.8056178092956543, 7.227007865905762, 11.648397445678711, 16.069787979125977, 20.491178512573242, 24.912567138671875, 29.33395767211914, 33.755348205566406, 38.17673873901367, 42.59812927246094, 47.01951599121094, 51.44091033935547, 55.86229705810547, 60.283687591552734, 64.705078125, 69.12646484375, 73.5478515625, 77.96924591064453, 82.39063262939453, 86.81202697753906, 91.23341369628906, 95.65480041503906, 100.0761947631836, 104.49758911132812]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 7.0, 4.0, 6.0, 9.0, 9.0, 9.0, 8.0, 23.0, 16.0, 17.0, 20.0, 22.0, 20.0, 37.0, 28.0, 32.0, 28.0, 53.0, 66.0, 99.0, 89.0, 69.0, 39.0, 31.0, 30.0, 35.0, 29.0, 20.0, 13.0, 16.0, 17.0, 9.0, 15.0, 16.0, 11.0, 7.0, 8.0, 3.0, 6.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-68.72903442382812, -66.56958770751953, -64.41014862060547, -62.250701904296875, -60.09125518798828, -57.93181228637695, -55.772369384765625, -53.61292266845703, -51.4534797668457, -49.294036865234375, -47.13459014892578, -44.97514724731445, -42.815704345703125, -40.65625762939453, -38.4968147277832, -36.337371826171875, -34.17792510986328, -32.01848220825195, -29.85903549194336, -27.69959259033203, -25.54014778137207, -23.38070297241211, -21.22126007080078, -19.06181526184082, -16.90237045288086, -14.742925643920898, -12.583481788635254, -10.42403793334961, -8.264593124389648, -6.1051483154296875, -3.945704460144043, -1.7862606048583984, 0.3731842041015625, 2.5326285362243652, 4.692072868347168, 6.851517200469971, 9.010961532592773, 11.170406341552734, 13.329850196838379, 15.489294052124023, 17.648738861083984, 19.808183670043945, 21.967628479003906, 24.127071380615234, 26.286516189575195, 28.445960998535156, 30.605403900146484, 32.76484680175781, 34.924293518066406, 37.083736419677734, 39.24318313598633, 41.402626037597656, 43.56207275390625, 45.72151565551758, 47.880958557128906, 50.0404052734375, 52.19984817504883, 54.359291076660156, 56.51873779296875, 58.67818069458008, 60.837623596191406, 62.9970703125, 65.1565170288086, 67.31595611572266, 69.47540283203125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 11.0, 13.0, 15.0, 29.0, 57.0, 95.0, 195.0, 387.0, 731.0, 1691.0, 4567.0, 16015.0, 97786.0, 1041812.0, 2605531.0, 371246.0, 40148.0, 8725.0, 2922.0, 1208.0, 513.0, 255.0, 143.0, 78.0, 45.0, 27.0, 16.0, 10.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.7071533203125, -8.445556640625, -8.1839599609375, -7.92236328125, -7.6607666015625, -7.399169921875, -7.1375732421875, -6.8759765625, -6.6143798828125, -6.352783203125, -6.0911865234375, -5.82958984375, -5.5679931640625, -5.306396484375, -5.0447998046875, -4.783203125, -4.5216064453125, -4.260009765625, -3.9984130859375, -3.73681640625, -3.4752197265625, -3.213623046875, -2.9520263671875, -2.6904296875, -2.4288330078125, -2.167236328125, -1.9056396484375, -1.64404296875, -1.3824462890625, -1.120849609375, -0.8592529296875, -0.59765625, -0.3360595703125, -0.074462890625, 0.1871337890625, 0.44873046875, 0.7103271484375, 0.971923828125, 1.2335205078125, 1.4951171875, 1.7567138671875, 2.018310546875, 2.2799072265625, 2.54150390625, 2.8031005859375, 3.064697265625, 3.3262939453125, 3.587890625, 3.8494873046875, 4.111083984375, 4.3726806640625, 4.63427734375, 4.8958740234375, 5.157470703125, 5.4190673828125, 5.6806640625, 5.9422607421875, 6.203857421875, 6.4654541015625, 6.72705078125, 6.9886474609375, 7.250244140625, 7.5118408203125, 7.7734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 7.0, 10.0, 12.0, 12.0, 17.0, 13.0, 21.0, 17.0, 32.0, 17.0, 24.0, 33.0, 42.0, 41.0, 32.0, 50.0, 38.0, 29.0, 43.0, 51.0, 47.0, 42.0, 46.0, 36.0, 40.0, 41.0, 33.0, 24.0, 23.0, 20.0, 15.0, 24.0, 19.0, 15.0, 4.0, 6.0, 6.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.45916748046875, -4.3050537109375, -4.15093994140625, -3.996826171875, -3.84271240234375, -3.6885986328125, -3.53448486328125, -3.38037109375, -3.22625732421875, -3.0721435546875, -2.91802978515625, -2.763916015625, -2.60980224609375, -2.4556884765625, -2.30157470703125, -2.1474609375, -1.99334716796875, -1.8392333984375, -1.68511962890625, -1.531005859375, -1.37689208984375, -1.2227783203125, -1.06866455078125, -0.91455078125, -0.76043701171875, -0.6063232421875, -0.45220947265625, -0.298095703125, -0.14398193359375, 0.0101318359375, 0.16424560546875, 0.318359375, 0.47247314453125, 0.6265869140625, 0.78070068359375, 0.934814453125, 1.08892822265625, 1.2430419921875, 1.39715576171875, 1.55126953125, 1.70538330078125, 1.8594970703125, 2.01361083984375, 2.167724609375, 2.32183837890625, 2.4759521484375, 2.63006591796875, 2.7841796875, 2.93829345703125, 3.0924072265625, 3.24652099609375, 3.400634765625, 3.55474853515625, 3.7088623046875, 3.86297607421875, 4.01708984375, 4.17120361328125, 4.3253173828125, 4.47943115234375, 4.633544921875, 4.78765869140625, 4.9417724609375, 5.09588623046875, 5.25]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 17.0, 62.0, 132.0, 371.0, 1944.0, 447515.0, 3739835.0, 3528.0, 541.0, 204.0, 72.0, 28.0, 18.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.9375, -38.4638671875, -36.990234375, -35.5166015625, -34.04296875, -32.5693359375, -31.095703125, -29.6220703125, -28.1484375, -26.6748046875, -25.201171875, -23.7275390625, -22.25390625, -20.7802734375, -19.306640625, -17.8330078125, -16.359375, -14.8857421875, -13.412109375, -11.9384765625, -10.46484375, -8.9912109375, -7.517578125, -6.0439453125, -4.5703125, -3.0966796875, -1.623046875, -0.1494140625, 1.32421875, 2.7978515625, 4.271484375, 5.7451171875, 7.21875, 8.6923828125, 10.166015625, 11.6396484375, 13.11328125, 14.5869140625, 16.060546875, 17.5341796875, 19.0078125, 20.4814453125, 21.955078125, 23.4287109375, 24.90234375, 26.3759765625, 27.849609375, 29.3232421875, 30.796875, 32.2705078125, 33.744140625, 35.2177734375, 36.69140625, 38.1650390625, 39.638671875, 41.1123046875, 42.5859375, 44.0595703125, 45.533203125, 47.0068359375, 48.48046875, 49.9541015625, 51.427734375, 52.9013671875, 54.375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 6.0, 12.0, 11.0, 17.0, 40.0, 80.0, 143.0, 364.0, 830.0, 1212.0, 753.0, 299.0, 149.0, 65.0, 44.0, 18.0, 17.0, 7.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.234375, -10.623779296875, -10.01318359375, -9.402587890625, -8.7919921875, -8.181396484375, -7.57080078125, -6.960205078125, -6.349609375, -5.739013671875, -5.12841796875, -4.517822265625, -3.9072265625, -3.296630859375, -2.68603515625, -2.075439453125, -1.46484375, -0.854248046875, -0.24365234375, 0.366943359375, 0.9775390625, 1.588134765625, 2.19873046875, 2.809326171875, 3.419921875, 4.030517578125, 4.64111328125, 5.251708984375, 5.8623046875, 6.472900390625, 7.08349609375, 7.694091796875, 8.3046875, 8.915283203125, 9.52587890625, 10.136474609375, 10.7470703125, 11.357666015625, 11.96826171875, 12.578857421875, 13.189453125, 13.800048828125, 14.41064453125, 15.021240234375, 15.6318359375, 16.242431640625, 16.85302734375, 17.463623046875, 18.07421875, 18.684814453125, 19.29541015625, 19.906005859375, 20.5166015625, 21.127197265625, 21.73779296875, 22.348388671875, 22.958984375, 23.569580078125, 24.18017578125, 24.790771484375, 25.4013671875, 26.011962890625, 26.62255859375, 27.233154296875, 27.84375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 11.0, 37.0, 125.0, 299.0, 326.0, 134.0, 33.0, 13.0, 8.0, 6.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-262.331298828125, -255.21958923339844, -248.1078643798828, -240.99615478515625, -233.8844451904297, -226.77273559570312, -219.6610107421875, -212.54930114746094, -205.43759155273438, -198.3258819580078, -191.2141571044922, -184.10244750976562, -176.99073791503906, -169.8790283203125, -162.76730346679688, -155.6555938720703, -148.5438690185547, -141.43215942382812, -134.3204345703125, -127.20872497558594, -120.09701538085938, -112.98529815673828, -105.87358093261719, -98.76187133789062, -91.65015411376953, -84.53843688964844, -77.42672729492188, -70.31501007080078, -63.20329666137695, -56.091583251953125, -48.97986602783203, -41.8681526184082, -34.75642395019531, -27.644710540771484, -20.532995223999023, -13.421279907226562, -6.309566497802734, 0.8021469116210938, 7.9138641357421875, 15.025577545166016, 22.137290954589844, 29.249004364013672, 36.3607177734375, 43.472434997558594, 50.58414840698242, 57.69586181640625, 64.80757904052734, 71.91929626464844, 79.031005859375, 86.1427230834961, 93.25443267822266, 100.36614990234375, 107.47785949707031, 114.5895767211914, 121.7012939453125, 128.81300354003906, 135.92471313476562, 143.0364227294922, 150.1481475830078, 157.25985717773438, 164.37156677246094, 171.4832763671875, 178.59500122070312, 185.7067108154297, 192.8184356689453]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 9.0, 12.0, 5.0, 7.0, 8.0, 6.0, 15.0, 20.0, 32.0, 21.0, 30.0, 32.0, 33.0, 38.0, 40.0, 43.0, 48.0, 46.0, 56.0, 53.0, 41.0, 48.0, 53.0, 28.0, 45.0, 30.0, 31.0, 27.0, 33.0, 27.0, 15.0, 12.0, 13.0, 11.0, 13.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-68.60537719726562, -66.64068603515625, -64.67599487304688, -62.711299896240234, -60.746604919433594, -58.78191375732422, -56.817222595214844, -54.8525276184082, -52.88783264160156, -50.92314147949219, -48.95844650268555, -46.99375534057617, -45.02906036376953, -43.064369201660156, -41.09967803955078, -39.13498306274414, -37.170291900634766, -35.20560073852539, -33.24090576171875, -31.276214599609375, -29.311519622802734, -27.34682846069336, -25.38213539123535, -23.417442321777344, -21.452749252319336, -19.488056182861328, -17.52336311340332, -15.558670997619629, -13.593977928161621, -11.629284858703613, -9.664592742919922, -7.699899673461914, -5.735206604003906, -3.7705137729644775, -1.8058209419250488, 0.15887165069580078, 2.1235647201538086, 4.088257789611816, 6.052949905395508, 8.017642974853516, 9.982336044311523, 11.947029113769531, 13.911722183227539, 15.87641429901123, 17.841106414794922, 19.805801391601562, 21.770492553710938, 23.735185623168945, 25.699878692626953, 27.66457176208496, 29.62926483154297, 31.593955993652344, 33.558650970458984, 35.52334213256836, 37.488037109375, 39.452728271484375, 41.41741943359375, 43.382110595703125, 45.346805572509766, 47.31149673461914, 49.27619171142578, 51.240882873535156, 53.20557403564453, 55.17026901245117, 57.13496398925781]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 9.0, 15.0, 12.0, 31.0, 50.0, 69.0, 100.0, 190.0, 276.0, 466.0, 914.0, 1909.0, 4264.0, 10600.0, 28629.0, 84386.0, 273120.0, 414397.0, 150997.0, 48725.0, 16838.0, 6728.0, 2861.0, 1361.0, 647.0, 355.0, 216.0, 122.0, 84.0, 50.0, 42.0, 19.0, 15.0, 12.0, 10.0, 8.0, 6.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.03125, -9.7545166015625, -9.477783203125, -9.2010498046875, -8.92431640625, -8.6475830078125, -8.370849609375, -8.0941162109375, -7.8173828125, -7.5406494140625, -7.263916015625, -6.9871826171875, -6.71044921875, -6.4337158203125, -6.156982421875, -5.8802490234375, -5.603515625, -5.3267822265625, -5.050048828125, -4.7733154296875, -4.49658203125, -4.2198486328125, -3.943115234375, -3.6663818359375, -3.3896484375, -3.1129150390625, -2.836181640625, -2.5594482421875, -2.28271484375, -2.0059814453125, -1.729248046875, -1.4525146484375, -1.17578125, -0.8990478515625, -0.622314453125, -0.3455810546875, -0.06884765625, 0.2078857421875, 0.484619140625, 0.7613525390625, 1.0380859375, 1.3148193359375, 1.591552734375, 1.8682861328125, 2.14501953125, 2.4217529296875, 2.698486328125, 2.9752197265625, 3.251953125, 3.5286865234375, 3.805419921875, 4.0821533203125, 4.35888671875, 4.6356201171875, 4.912353515625, 5.1890869140625, 5.4658203125, 5.7425537109375, 6.019287109375, 6.2960205078125, 6.57275390625, 6.8494873046875, 7.126220703125, 7.4029541015625, 7.6796875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 10.0, 8.0, 6.0, 6.0, 12.0, 15.0, 18.0, 22.0, 23.0, 40.0, 33.0, 38.0, 39.0, 36.0, 41.0, 47.0, 57.0, 48.0, 41.0, 53.0, 48.0, 41.0, 44.0, 38.0, 29.0, 29.0, 22.0, 32.0, 24.0, 19.0, 17.0, 15.0, 12.0, 12.0, 7.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.44384765625, -4.2744140625, -4.10498046875, -3.935546875, -3.76611328125, -3.5966796875, -3.42724609375, -3.2578125, -3.08837890625, -2.9189453125, -2.74951171875, -2.580078125, -2.41064453125, -2.2412109375, -2.07177734375, -1.90234375, -1.73291015625, -1.5634765625, -1.39404296875, -1.224609375, -1.05517578125, -0.8857421875, -0.71630859375, -0.546875, -0.37744140625, -0.2080078125, -0.03857421875, 0.130859375, 0.30029296875, 0.4697265625, 0.63916015625, 0.80859375, 0.97802734375, 1.1474609375, 1.31689453125, 1.486328125, 1.65576171875, 1.8251953125, 1.99462890625, 2.1640625, 2.33349609375, 2.5029296875, 2.67236328125, 2.841796875, 3.01123046875, 3.1806640625, 3.35009765625, 3.51953125, 3.68896484375, 3.8583984375, 4.02783203125, 4.197265625, 4.36669921875, 4.5361328125, 4.70556640625, 4.875, 5.04443359375, 5.2138671875, 5.38330078125, 5.552734375, 5.72216796875, 5.8916015625, 6.06103515625, 6.23046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 10.0, 9.0, 19.0, 16.0, 29.0, 30.0, 48.0, 76.0, 112.0, 163.0, 240.0, 379.0, 587.0, 1315.0, 2949.0, 10774.0, 89488.0, 853206.0, 73806.0, 9649.0, 2754.0, 1206.0, 659.0, 340.0, 213.0, 156.0, 98.0, 61.0, 44.0, 39.0, 16.0, 14.0, 19.0, 7.0, 6.0, 8.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.875, -23.22021484375, -22.5654296875, -21.91064453125, -21.255859375, -20.60107421875, -19.9462890625, -19.29150390625, -18.63671875, -17.98193359375, -17.3271484375, -16.67236328125, -16.017578125, -15.36279296875, -14.7080078125, -14.05322265625, -13.3984375, -12.74365234375, -12.0888671875, -11.43408203125, -10.779296875, -10.12451171875, -9.4697265625, -8.81494140625, -8.16015625, -7.50537109375, -6.8505859375, -6.19580078125, -5.541015625, -4.88623046875, -4.2314453125, -3.57666015625, -2.921875, -2.26708984375, -1.6123046875, -0.95751953125, -0.302734375, 0.35205078125, 1.0068359375, 1.66162109375, 2.31640625, 2.97119140625, 3.6259765625, 4.28076171875, 4.935546875, 5.59033203125, 6.2451171875, 6.89990234375, 7.5546875, 8.20947265625, 8.8642578125, 9.51904296875, 10.173828125, 10.82861328125, 11.4833984375, 12.13818359375, 12.79296875, 13.44775390625, 14.1025390625, 14.75732421875, 15.412109375, 16.06689453125, 16.7216796875, 17.37646484375, 18.03125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 10.0, 4.0, 4.0, 16.0, 9.0, 12.0, 15.0, 18.0, 28.0, 24.0, 42.0, 23.0, 43.0, 44.0, 48.0, 64.0, 61.0, 65.0, 65.0, 45.0, 51.0, 49.0, 33.0, 37.0, 29.0, 25.0, 31.0, 26.0, 11.0, 13.0, 11.0, 9.0, 3.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.921875, -21.26123046875, -20.6005859375, -19.93994140625, -19.279296875, -18.61865234375, -17.9580078125, -17.29736328125, -16.63671875, -15.97607421875, -15.3154296875, -14.65478515625, -13.994140625, -13.33349609375, -12.6728515625, -12.01220703125, -11.3515625, -10.69091796875, -10.0302734375, -9.36962890625, -8.708984375, -8.04833984375, -7.3876953125, -6.72705078125, -6.06640625, -5.40576171875, -4.7451171875, -4.08447265625, -3.423828125, -2.76318359375, -2.1025390625, -1.44189453125, -0.78125, -0.12060546875, 0.5400390625, 1.20068359375, 1.861328125, 2.52197265625, 3.1826171875, 3.84326171875, 4.50390625, 5.16455078125, 5.8251953125, 6.48583984375, 7.146484375, 7.80712890625, 8.4677734375, 9.12841796875, 9.7890625, 10.44970703125, 11.1103515625, 11.77099609375, 12.431640625, 13.09228515625, 13.7529296875, 14.41357421875, 15.07421875, 15.73486328125, 16.3955078125, 17.05615234375, 17.716796875, 18.37744140625, 19.0380859375, 19.69873046875, 20.359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 1.0, 7.0, 9.0, 10.0, 10.0, 38.0, 46.0, 67.0, 94.0, 200.0, 432.0, 1227.0, 5104.0, 55846.0, 950498.0, 29454.0, 3769.0, 925.0, 338.0, 188.0, 108.0, 57.0, 34.0, 24.0, 17.0, 20.0, 11.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.71875, -10.4071044921875, -10.095458984375, -9.7838134765625, -9.47216796875, -9.1605224609375, -8.848876953125, -8.5372314453125, -8.2255859375, -7.9139404296875, -7.602294921875, -7.2906494140625, -6.97900390625, -6.6673583984375, -6.355712890625, -6.0440673828125, -5.732421875, -5.4207763671875, -5.109130859375, -4.7974853515625, -4.48583984375, -4.1741943359375, -3.862548828125, -3.5509033203125, -3.2392578125, -2.9276123046875, -2.615966796875, -2.3043212890625, -1.99267578125, -1.6810302734375, -1.369384765625, -1.0577392578125, -0.74609375, -0.4344482421875, -0.122802734375, 0.1888427734375, 0.50048828125, 0.8121337890625, 1.123779296875, 1.4354248046875, 1.7470703125, 2.0587158203125, 2.370361328125, 2.6820068359375, 2.99365234375, 3.3052978515625, 3.616943359375, 3.9285888671875, 4.240234375, 4.5518798828125, 4.863525390625, 5.1751708984375, 5.48681640625, 5.7984619140625, 6.110107421875, 6.4217529296875, 6.7333984375, 7.0450439453125, 7.356689453125, 7.6683349609375, 7.97998046875, 8.2916259765625, 8.603271484375, 8.9149169921875, 9.2265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 6.0, 8.0, 9.0, 13.0, 14.0, 34.0, 49.0, 77.0, 154.0, 223.0, 138.0, 68.0, 51.0, 37.0, 22.0, 15.0, 7.0, 9.0, 7.0, 4.0, 9.0, 6.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0016536712646484375, -0.0016117841005325317, -0.001569896936416626, -0.0015280097723007202, -0.0014861226081848145, -0.0014442354440689087, -0.001402348279953003, -0.0013604611158370972, -0.0013185739517211914, -0.0012766867876052856, -0.0012347996234893799, -0.0011929124593734741, -0.0011510252952575684, -0.0011091381311416626, -0.0010672509670257568, -0.001025363802909851, -0.0009834766387939453, -0.0009415894746780396, -0.0008997023105621338, -0.000857815146446228, -0.0008159279823303223, -0.0007740408182144165, -0.0007321536540985107, -0.000690266489982605, -0.0006483793258666992, -0.0006064921617507935, -0.0005646049976348877, -0.0005227178335189819, -0.00048083066940307617, -0.0004389435052871704, -0.00039705634117126465, -0.0003551691770553589, -0.0003132820129394531, -0.00027139484882354736, -0.0002295076847076416, -0.00018762052059173584, -0.00014573335647583008, -0.00010384619235992432, -6.195902824401855e-05, -2.0071864128112793e-05, 2.181529998779297e-05, 6.370246410369873e-05, 0.00010558962821960449, 0.00014747679233551025, 0.00018936395645141602, 0.00023125112056732178, 0.00027313828468322754, 0.0003150254487991333, 0.00035691261291503906, 0.0003987997770309448, 0.0004406869411468506, 0.00048257410526275635, 0.0005244612693786621, 0.0005663484334945679, 0.0006082355976104736, 0.0006501227617263794, 0.0006920099258422852, 0.0007338970899581909, 0.0007757842540740967, 0.0008176714181900024, 0.0008595585823059082, 0.000901445746421814, 0.0009433329105377197, 0.0009852200746536255, 0.0010271072387695312]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 12.0, 9.0, 26.0, 28.0, 47.0, 95.0, 267.0, 609.0, 2214.0, 18985.0, 933759.0, 85650.0, 5180.0, 992.0, 360.0, 140.0, 77.0, 42.0, 28.0, 12.0, 10.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.9140625, -12.58056640625, -12.2470703125, -11.91357421875, -11.580078125, -11.24658203125, -10.9130859375, -10.57958984375, -10.24609375, -9.91259765625, -9.5791015625, -9.24560546875, -8.912109375, -8.57861328125, -8.2451171875, -7.91162109375, -7.578125, -7.24462890625, -6.9111328125, -6.57763671875, -6.244140625, -5.91064453125, -5.5771484375, -5.24365234375, -4.91015625, -4.57666015625, -4.2431640625, -3.90966796875, -3.576171875, -3.24267578125, -2.9091796875, -2.57568359375, -2.2421875, -1.90869140625, -1.5751953125, -1.24169921875, -0.908203125, -0.57470703125, -0.2412109375, 0.09228515625, 0.42578125, 0.75927734375, 1.0927734375, 1.42626953125, 1.759765625, 2.09326171875, 2.4267578125, 2.76025390625, 3.09375, 3.42724609375, 3.7607421875, 4.09423828125, 4.427734375, 4.76123046875, 5.0947265625, 5.42822265625, 5.76171875, 6.09521484375, 6.4287109375, 6.76220703125, 7.095703125, 7.42919921875, 7.7626953125, 8.09619140625, 8.4296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 8.0, 3.0, 3.0, 5.0, 4.0, 5.0, 14.0, 12.0, 17.0, 26.0, 34.0, 49.0, 60.0, 90.0, 118.0, 151.0, 94.0, 78.0, 53.0, 33.0, 38.0, 29.0, 17.0, 14.0, 11.0, 13.0, 4.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.6251220703125, -5.461181640625, -5.2972412109375, -5.13330078125, -4.9693603515625, -4.805419921875, -4.6414794921875, -4.4775390625, -4.3135986328125, -4.149658203125, -3.9857177734375, -3.82177734375, -3.6578369140625, -3.493896484375, -3.3299560546875, -3.166015625, -3.0020751953125, -2.838134765625, -2.6741943359375, -2.51025390625, -2.3463134765625, -2.182373046875, -2.0184326171875, -1.8544921875, -1.6905517578125, -1.526611328125, -1.3626708984375, -1.19873046875, -1.0347900390625, -0.870849609375, -0.7069091796875, -0.54296875, -0.3790283203125, -0.215087890625, -0.0511474609375, 0.11279296875, 0.2767333984375, 0.440673828125, 0.6046142578125, 0.7685546875, 0.9324951171875, 1.096435546875, 1.2603759765625, 1.42431640625, 1.5882568359375, 1.752197265625, 1.9161376953125, 2.080078125, 2.2440185546875, 2.407958984375, 2.5718994140625, 2.73583984375, 2.8997802734375, 3.063720703125, 3.2276611328125, 3.3916015625, 3.5555419921875, 3.719482421875, 3.8834228515625, 4.04736328125, 4.2113037109375, 4.375244140625, 4.5391845703125, 4.703125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 60.0, 656.0, 238.0, 32.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-693.8194580078125, -679.603271484375, -665.3870849609375, -651.1708984375, -636.9547119140625, -622.738525390625, -608.5223388671875, -594.30615234375, -580.0899658203125, -565.873779296875, -551.6575927734375, -537.44140625, -523.2252197265625, -509.009033203125, -494.7928466796875, -480.57666015625, -466.3605041503906, -452.1443176269531, -437.9281311035156, -423.7119445800781, -409.4957580566406, -395.2795715332031, -381.06341552734375, -366.84722900390625, -352.63104248046875, -338.41485595703125, -324.19866943359375, -309.98248291015625, -295.76629638671875, -281.55010986328125, -267.33392333984375, -253.1177520751953, -238.90151977539062, -224.68533325195312, -210.46914672851562, -196.25296020507812, -182.03677368164062, -167.82058715820312, -153.6044158935547, -139.3882293701172, -125.17204284667969, -110.95585632324219, -96.73966979980469, -82.52349090576172, -68.30730438232422, -54.09111785888672, -39.87493896484375, -25.65875244140625, -11.44256591796875, 2.773618698120117, 16.989803314208984, 31.20598602294922, 45.42217254638672, 59.63835906982422, 73.85453796386719, 88.07072448730469, 102.28691101074219, 116.50309753417969, 130.7192840576172, 144.93545532226562, 159.15164184570312, 173.36782836914062, 187.58401489257812, 201.80020141601562, 216.01638793945312]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 4.0, 6.0, 18.0, 14.0, 19.0, 25.0, 30.0, 31.0, 34.0, 28.0, 34.0, 50.0, 124.0, 170.0, 70.0, 39.0, 49.0, 37.0, 26.0, 24.0, 26.0, 28.0, 13.0, 15.0, 17.0, 7.0, 10.0, 8.0, 5.0, 1.0, 7.0, 3.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-101.43122863769531, -98.28334045410156, -95.13545989990234, -91.9875717163086, -88.83969116210938, -85.69180297851562, -82.54391479492188, -79.39603424072266, -76.24815368652344, -73.10026550292969, -69.95238494873047, -66.80449676513672, -63.6566162109375, -60.50872802734375, -57.360843658447266, -54.21295928955078, -51.06507110595703, -47.91718673706055, -44.76930236816406, -41.62141418457031, -38.473533630371094, -35.325645446777344, -32.17776107788086, -29.029876708984375, -25.88199234008789, -22.734107971191406, -19.586223602294922, -16.438337326049805, -13.29045295715332, -10.142568588256836, -6.994682312011719, -3.8467979431152344, -0.69891357421875, 2.4489712715148926, 5.596856117248535, 8.744741439819336, 11.89262580871582, 15.040510177612305, 18.188396453857422, 21.336280822753906, 24.48416519165039, 27.632049560546875, 30.77993392944336, 33.927818298339844, 37.075706481933594, 40.22358703613281, 43.37147521972656, 46.51935958862305, 49.66724395751953, 52.815128326416016, 55.9630126953125, 59.11090087890625, 62.25878143310547, 65.40666961669922, 68.55455017089844, 71.70243835449219, 74.85032653808594, 77.99821472167969, 81.1460952758789, 84.29398345947266, 87.44186401367188, 90.58975219726562, 93.73764038085938, 96.8855209350586, 100.03340148925781]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 8.0, 12.0, 12.0, 15.0, 28.0, 52.0, 85.0, 123.0, 203.0, 333.0, 569.0, 1087.0, 2200.0, 5725.0, 21654.0, 209384.0, 2352085.0, 1475914.0, 102566.0, 14152.0, 4260.0, 1719.0, 863.0, 480.0, 301.0, 165.0, 94.0, 74.0, 41.0, 34.0, 15.0, 8.0, 9.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.6641845703125, -11.273681640625, -10.8831787109375, -10.49267578125, -10.1021728515625, -9.711669921875, -9.3211669921875, -8.9306640625, -8.5401611328125, -8.149658203125, -7.7591552734375, -7.36865234375, -6.9781494140625, -6.587646484375, -6.1971435546875, -5.806640625, -5.4161376953125, -5.025634765625, -4.6351318359375, -4.24462890625, -3.8541259765625, -3.463623046875, -3.0731201171875, -2.6826171875, -2.2921142578125, -1.901611328125, -1.5111083984375, -1.12060546875, -0.7301025390625, -0.339599609375, 0.0509033203125, 0.44140625, 0.8319091796875, 1.222412109375, 1.6129150390625, 2.00341796875, 2.3939208984375, 2.784423828125, 3.1749267578125, 3.5654296875, 3.9559326171875, 4.346435546875, 4.7369384765625, 5.12744140625, 5.5179443359375, 5.908447265625, 6.2989501953125, 6.689453125, 7.0799560546875, 7.470458984375, 7.8609619140625, 8.25146484375, 8.6419677734375, 9.032470703125, 9.4229736328125, 9.8134765625, 10.2039794921875, 10.594482421875, 10.9849853515625, 11.37548828125, 11.7659912109375, 12.156494140625, 12.5469970703125, 12.9375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 10.0, 9.0, 5.0, 9.0, 13.0, 13.0, 12.0, 24.0, 22.0, 29.0, 27.0, 26.0, 26.0, 33.0, 37.0, 34.0, 42.0, 47.0, 47.0, 41.0, 50.0, 50.0, 37.0, 40.0, 34.0, 33.0, 35.0, 26.0, 32.0, 26.0, 19.0, 22.0, 23.0, 11.0, 16.0, 6.0, 9.0, 3.0, 3.0, 4.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30859375, -4.15789794921875, -4.0072021484375, -3.85650634765625, -3.705810546875, -3.55511474609375, -3.4044189453125, -3.25372314453125, -3.10302734375, -2.95233154296875, -2.8016357421875, -2.65093994140625, -2.500244140625, -2.34954833984375, -2.1988525390625, -2.04815673828125, -1.8974609375, -1.74676513671875, -1.5960693359375, -1.44537353515625, -1.294677734375, -1.14398193359375, -0.9932861328125, -0.84259033203125, -0.69189453125, -0.54119873046875, -0.3905029296875, -0.23980712890625, -0.089111328125, 0.06158447265625, 0.2122802734375, 0.36297607421875, 0.513671875, 0.66436767578125, 0.8150634765625, 0.96575927734375, 1.116455078125, 1.26715087890625, 1.4178466796875, 1.56854248046875, 1.71923828125, 1.86993408203125, 2.0206298828125, 2.17132568359375, 2.322021484375, 2.47271728515625, 2.6234130859375, 2.77410888671875, 2.9248046875, 3.07550048828125, 3.2261962890625, 3.37689208984375, 3.527587890625, 3.67828369140625, 3.8289794921875, 3.97967529296875, 4.13037109375, 4.28106689453125, 4.4317626953125, 4.58245849609375, 4.733154296875, 4.88385009765625, 5.0345458984375, 5.18524169921875, 5.3359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 11.0, 9.0, 14.0, 30.0, 65.0, 103.0, 207.0, 412.0, 1010.0, 3957.0, 362168.0, 3817162.0, 6768.0, 1358.0, 473.0, 255.0, 125.0, 62.0, 35.0, 24.0, 12.0, 11.0, 10.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.53125, -49.76123046875, -47.9912109375, -46.22119140625, -44.451171875, -42.68115234375, -40.9111328125, -39.14111328125, -37.37109375, -35.60107421875, -33.8310546875, -32.06103515625, -30.291015625, -28.52099609375, -26.7509765625, -24.98095703125, -23.2109375, -21.44091796875, -19.6708984375, -17.90087890625, -16.130859375, -14.36083984375, -12.5908203125, -10.82080078125, -9.05078125, -7.28076171875, -5.5107421875, -3.74072265625, -1.970703125, -0.20068359375, 1.5693359375, 3.33935546875, 5.109375, 6.87939453125, 8.6494140625, 10.41943359375, 12.189453125, 13.95947265625, 15.7294921875, 17.49951171875, 19.26953125, 21.03955078125, 22.8095703125, 24.57958984375, 26.349609375, 28.11962890625, 29.8896484375, 31.65966796875, 33.4296875, 35.19970703125, 36.9697265625, 38.73974609375, 40.509765625, 42.27978515625, 44.0498046875, 45.81982421875, 47.58984375, 49.35986328125, 51.1298828125, 52.89990234375, 54.669921875, 56.43994140625, 58.2099609375, 59.97998046875, 61.75]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 10.0, 14.0, 13.0, 24.0, 28.0, 63.0, 92.0, 102.0, 204.0, 347.0, 575.0, 703.0, 676.0, 427.0, 248.0, 162.0, 100.0, 78.0, 47.0, 43.0, 28.0, 20.0, 19.0, 10.0, 11.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.46875, -12.901611328125, -12.33447265625, -11.767333984375, -11.2001953125, -10.633056640625, -10.06591796875, -9.498779296875, -8.931640625, -8.364501953125, -7.79736328125, -7.230224609375, -6.6630859375, -6.095947265625, -5.52880859375, -4.961669921875, -4.39453125, -3.827392578125, -3.26025390625, -2.693115234375, -2.1259765625, -1.558837890625, -0.99169921875, -0.424560546875, 0.142578125, 0.709716796875, 1.27685546875, 1.843994140625, 2.4111328125, 2.978271484375, 3.54541015625, 4.112548828125, 4.6796875, 5.246826171875, 5.81396484375, 6.381103515625, 6.9482421875, 7.515380859375, 8.08251953125, 8.649658203125, 9.216796875, 9.783935546875, 10.35107421875, 10.918212890625, 11.4853515625, 12.052490234375, 12.61962890625, 13.186767578125, 13.75390625, 14.321044921875, 14.88818359375, 15.455322265625, 16.0224609375, 16.589599609375, 17.15673828125, 17.723876953125, 18.291015625, 18.858154296875, 19.42529296875, 19.992431640625, 20.5595703125, 21.126708984375, 21.69384765625, 22.260986328125, 22.828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 10.0, 9.0, 11.0, 12.0, 22.0, 56.0, 128.0, 202.0, 231.0, 150.0, 67.0, 38.0, 16.0, 12.0, 9.0, 8.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.5052947998047, -159.9416961669922, -152.3780975341797, -144.81448364257812, -137.25088500976562, -129.68728637695312, -122.12368774414062, -114.56008911132812, -106.9964828491211, -99.4328842163086, -91.86927795410156, -84.30567932128906, -76.74208068847656, -69.17847442626953, -61.61487579345703, -54.051273345947266, -46.4876708984375, -38.924068450927734, -31.3604679107666, -23.79686737060547, -16.233264923095703, -8.669662475585938, -1.1060638427734375, 6.457538604736328, 14.021141052246094, 21.58474349975586, 29.148344039916992, 36.711944580078125, 44.27554702758789, 51.839149475097656, 59.402748107910156, 66.96635437011719, 74.52996826171875, 82.09356689453125, 89.65717315673828, 97.22077178955078, 104.78437805175781, 112.34797668457031, 119.91157531738281, 127.47517395019531, 135.03878784179688, 142.60238647460938, 150.16598510742188, 157.72958374023438, 165.29319763183594, 172.85679626464844, 180.42039489746094, 187.98399353027344, 195.54759216308594, 203.11119079589844, 210.67478942871094, 218.2384033203125, 225.802001953125, 233.3656005859375, 240.92919921875, 248.4927978515625, 256.056396484375, 263.6199951171875, 271.18359375, 278.7471923828125, 286.310791015625, 293.8743896484375, 301.43798828125, 309.0016174316406, 316.5652160644531]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 6.0, 9.0, 7.0, 16.0, 25.0, 17.0, 32.0, 31.0, 48.0, 60.0, 53.0, 67.0, 55.0, 77.0, 91.0, 74.0, 56.0, 53.0, 41.0, 40.0, 29.0, 28.0, 14.0, 18.0, 8.0, 10.0, 3.0, 7.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.36074829101562, -152.4566650390625, -148.55259704589844, -144.6485137939453, -140.74444580078125, -136.84036254882812, -132.93629455566406, -129.03221130371094, -125.12814331054688, -121.22406768798828, -117.31999206542969, -113.4159164428711, -109.5118408203125, -105.6077651977539, -101.70368957519531, -97.79960632324219, -93.8955307006836, -89.991455078125, -86.0873794555664, -82.18330383300781, -78.27922821044922, -74.37515258789062, -70.4710693359375, -66.56700134277344, -62.66292190551758, -58.758846282958984, -54.85477066040039, -50.95069122314453, -47.04661560058594, -43.142539978027344, -39.23846435546875, -35.334388732910156, -31.430320739746094, -27.5262451171875, -23.622169494628906, -19.71809196472168, -15.814016342163086, -11.909940719604492, -8.005863189697266, -4.101787567138672, -0.19771194458007812, 3.706364154815674, 7.610440254211426, 11.514516830444336, 15.41859245300293, 19.322668075561523, 23.22674560546875, 27.130821228027344, 31.034896850585938, 34.93897247314453, 38.843048095703125, 42.74712371826172, 46.65119934082031, 50.555274963378906, 54.459354400634766, 58.36343002319336, 62.26750564575195, 66.17158508300781, 70.0756607055664, 73.979736328125, 77.8838119506836, 81.78788757324219, 85.69196319580078, 89.59603881835938, 93.50011444091797]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 3.0, 11.0, 13.0, 13.0, 22.0, 23.0, 54.0, 73.0, 116.0, 196.0, 347.0, 597.0, 1044.0, 2052.0, 4157.0, 9037.0, 23016.0, 67207.0, 248956.0, 492519.0, 131845.0, 39780.0, 14690.0, 6219.0, 2954.0, 1525.0, 830.0, 501.0, 262.0, 175.0, 106.0, 79.0, 40.0, 33.0, 21.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.2578125, -9.0025634765625, -8.747314453125, -8.4920654296875, -8.23681640625, -7.9815673828125, -7.726318359375, -7.4710693359375, -7.2158203125, -6.9605712890625, -6.705322265625, -6.4500732421875, -6.19482421875, -5.9395751953125, -5.684326171875, -5.4290771484375, -5.173828125, -4.9185791015625, -4.663330078125, -4.4080810546875, -4.15283203125, -3.8975830078125, -3.642333984375, -3.3870849609375, -3.1318359375, -2.8765869140625, -2.621337890625, -2.3660888671875, -2.11083984375, -1.8555908203125, -1.600341796875, -1.3450927734375, -1.08984375, -0.8345947265625, -0.579345703125, -0.3240966796875, -0.06884765625, 0.1864013671875, 0.441650390625, 0.6968994140625, 0.9521484375, 1.2073974609375, 1.462646484375, 1.7178955078125, 1.97314453125, 2.2283935546875, 2.483642578125, 2.7388916015625, 2.994140625, 3.2493896484375, 3.504638671875, 3.7598876953125, 4.01513671875, 4.2703857421875, 4.525634765625, 4.7808837890625, 5.0361328125, 5.2913818359375, 5.546630859375, 5.8018798828125, 6.05712890625, 6.3123779296875, 6.567626953125, 6.8228759765625, 7.078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 8.0, 16.0, 24.0, 19.0, 27.0, 31.0, 48.0, 38.0, 37.0, 52.0, 56.0, 65.0, 69.0, 58.0, 51.0, 56.0, 50.0, 60.0, 42.0, 32.0, 36.0, 24.0, 20.0, 12.0, 17.0, 12.0, 11.0, 7.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-10.1015625, -9.86602783203125, -9.6304931640625, -9.39495849609375, -9.159423828125, -8.92388916015625, -8.6883544921875, -8.45281982421875, -8.21728515625, -7.98175048828125, -7.7462158203125, -7.51068115234375, -7.275146484375, -7.03961181640625, -6.8040771484375, -6.56854248046875, -6.3330078125, -6.09747314453125, -5.8619384765625, -5.62640380859375, -5.390869140625, -5.15533447265625, -4.9197998046875, -4.68426513671875, -4.44873046875, -4.21319580078125, -3.9776611328125, -3.74212646484375, -3.506591796875, -3.27105712890625, -3.0355224609375, -2.79998779296875, -2.564453125, -2.32891845703125, -2.0933837890625, -1.85784912109375, -1.622314453125, -1.38677978515625, -1.1512451171875, -0.91571044921875, -0.68017578125, -0.44464111328125, -0.2091064453125, 0.02642822265625, 0.261962890625, 0.49749755859375, 0.7330322265625, 0.96856689453125, 1.2041015625, 1.43963623046875, 1.6751708984375, 1.91070556640625, 2.146240234375, 2.38177490234375, 2.6173095703125, 2.85284423828125, 3.08837890625, 3.32391357421875, 3.5594482421875, 3.79498291015625, 4.030517578125, 4.26605224609375, 4.5015869140625, 4.73712158203125, 4.97265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 8.0, 6.0, 3.0, 6.0, 11.0, 17.0, 18.0, 22.0, 25.0, 50.0, 60.0, 87.0, 142.0, 209.0, 325.0, 596.0, 1232.0, 3456.0, 16900.0, 309702.0, 683680.0, 24310.0, 4491.0, 1480.0, 686.0, 325.0, 209.0, 162.0, 91.0, 63.0, 45.0, 39.0, 27.0, 20.0, 9.0, 8.0, 7.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-15.59375, -15.16162109375, -14.7294921875, -14.29736328125, -13.865234375, -13.43310546875, -13.0009765625, -12.56884765625, -12.13671875, -11.70458984375, -11.2724609375, -10.84033203125, -10.408203125, -9.97607421875, -9.5439453125, -9.11181640625, -8.6796875, -8.24755859375, -7.8154296875, -7.38330078125, -6.951171875, -6.51904296875, -6.0869140625, -5.65478515625, -5.22265625, -4.79052734375, -4.3583984375, -3.92626953125, -3.494140625, -3.06201171875, -2.6298828125, -2.19775390625, -1.765625, -1.33349609375, -0.9013671875, -0.46923828125, -0.037109375, 0.39501953125, 0.8271484375, 1.25927734375, 1.69140625, 2.12353515625, 2.5556640625, 2.98779296875, 3.419921875, 3.85205078125, 4.2841796875, 4.71630859375, 5.1484375, 5.58056640625, 6.0126953125, 6.44482421875, 6.876953125, 7.30908203125, 7.7412109375, 8.17333984375, 8.60546875, 9.03759765625, 9.4697265625, 9.90185546875, 10.333984375, 10.76611328125, 11.1982421875, 11.63037109375, 12.0625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 6.0, 6.0, 13.0, 8.0, 8.0, 9.0, 22.0, 18.0, 15.0, 26.0, 26.0, 33.0, 44.0, 49.0, 69.0, 74.0, 95.0, 91.0, 69.0, 50.0, 43.0, 48.0, 30.0, 27.0, 15.0, 19.0, 19.0, 12.0, 12.0, 8.0, 11.0, 6.0, 5.0, 0.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.375, -27.554931640625, -26.73486328125, -25.914794921875, -25.0947265625, -24.274658203125, -23.45458984375, -22.634521484375, -21.814453125, -20.994384765625, -20.17431640625, -19.354248046875, -18.5341796875, -17.714111328125, -16.89404296875, -16.073974609375, -15.25390625, -14.433837890625, -13.61376953125, -12.793701171875, -11.9736328125, -11.153564453125, -10.33349609375, -9.513427734375, -8.693359375, -7.873291015625, -7.05322265625, -6.233154296875, -5.4130859375, -4.593017578125, -3.77294921875, -2.952880859375, -2.1328125, -1.312744140625, -0.49267578125, 0.327392578125, 1.1474609375, 1.967529296875, 2.78759765625, 3.607666015625, 4.427734375, 5.247802734375, 6.06787109375, 6.887939453125, 7.7080078125, 8.528076171875, 9.34814453125, 10.168212890625, 10.98828125, 11.808349609375, 12.62841796875, 13.448486328125, 14.2685546875, 15.088623046875, 15.90869140625, 16.728759765625, 17.548828125, 18.368896484375, 19.18896484375, 20.009033203125, 20.8291015625, 21.649169921875, 22.46923828125, 23.289306640625, 24.109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 12.0, 7.0, 11.0, 10.0, 15.0, 16.0, 21.0, 31.0, 36.0, 40.0, 89.0, 110.0, 187.0, 286.0, 432.0, 842.0, 1576.0, 3432.0, 8656.0, 28058.0, 236348.0, 716511.0, 34043.0, 9933.0, 3765.0, 1798.0, 858.0, 498.0, 275.0, 174.0, 133.0, 95.0, 40.0, 40.0, 38.0, 23.0, 24.0, 19.0, 9.0, 12.0, 9.0, 10.0, 7.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0], "bins": [-1.65234375, -1.6023712158203125, -1.552398681640625, -1.5024261474609375, -1.45245361328125, -1.4024810791015625, -1.352508544921875, -1.3025360107421875, -1.2525634765625, -1.2025909423828125, -1.152618408203125, -1.1026458740234375, -1.05267333984375, -1.0027008056640625, -0.952728271484375, -0.9027557373046875, -0.852783203125, -0.8028106689453125, -0.752838134765625, -0.7028656005859375, -0.65289306640625, -0.6029205322265625, -0.552947998046875, -0.5029754638671875, -0.4530029296875, -0.4030303955078125, -0.353057861328125, -0.3030853271484375, -0.25311279296875, -0.2031402587890625, -0.153167724609375, -0.1031951904296875, -0.05322265625, -0.0032501220703125, 0.046722412109375, 0.0966949462890625, 0.14666748046875, 0.1966400146484375, 0.246612548828125, 0.2965850830078125, 0.3465576171875, 0.3965301513671875, 0.446502685546875, 0.4964752197265625, 0.54644775390625, 0.5964202880859375, 0.646392822265625, 0.6963653564453125, 0.746337890625, 0.7963104248046875, 0.846282958984375, 0.8962554931640625, 0.94622802734375, 0.9962005615234375, 1.046173095703125, 1.0961456298828125, 1.1461181640625, 1.1960906982421875, 1.246063232421875, 1.2960357666015625, 1.34600830078125, 1.3959808349609375, 1.445953369140625, 1.4959259033203125, 1.5458984375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 10.0, 12.0, 29.0, 28.0, 37.0, 62.0, 110.0, 192.0, 192.0, 119.0, 59.0, 34.0, 21.0, 18.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008893013000488281, -0.0008623376488685608, -0.0008353739976882935, -0.0008084103465080261, -0.0007814466953277588, -0.0007544830441474915, -0.0007275193929672241, -0.0007005557417869568, -0.0006735920906066895, -0.0006466284394264221, -0.0006196647882461548, -0.0005927011370658875, -0.0005657374858856201, -0.0005387738347053528, -0.0005118101835250854, -0.0004848465323448181, -0.0004578828811645508, -0.00043091922998428345, -0.0004039555788040161, -0.0003769919276237488, -0.00035002827644348145, -0.0003230646252632141, -0.0002961009740829468, -0.00026913732290267944, -0.0002421736717224121, -0.00021521002054214478, -0.00018824636936187744, -0.0001612827181816101, -0.00013431906700134277, -0.00010735541582107544, -8.03917646408081e-05, -5.342811346054077e-05, -2.6464462280273438e-05, 4.991888999938965e-07, 2.746284008026123e-05, 5.4426491260528564e-05, 8.13901424407959e-05, 0.00010835379362106323, 0.00013531744480133057, 0.0001622810959815979, 0.00018924474716186523, 0.00021620839834213257, 0.0002431720495223999, 0.00027013570070266724, 0.00029709935188293457, 0.0003240630030632019, 0.00035102665424346924, 0.00037799030542373657, 0.0004049539566040039, 0.00043191760778427124, 0.0004588812589645386, 0.0004858449101448059, 0.0005128085613250732, 0.0005397722125053406, 0.0005667358636856079, 0.0005936995148658752, 0.0006206631660461426, 0.0006476268172264099, 0.0006745904684066772, 0.0007015541195869446, 0.0007285177707672119, 0.0007554814219474792, 0.0007824450731277466, 0.0008094087243080139, 0.0008363723754882812]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 12.0, 12.0, 18.0, 34.0, 55.0, 84.0, 127.0, 214.0, 419.0, 809.0, 1682.0, 3844.0, 10577.0, 35167.0, 507871.0, 435746.0, 34371.0, 10183.0, 3868.0, 1687.0, 782.0, 401.0, 229.0, 132.0, 67.0, 53.0, 34.0, 16.0, 14.0, 8.0, 10.0, 7.0, 6.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.787109375, -1.7294464111328125, -1.671783447265625, -1.6141204833984375, -1.55645751953125, -1.4987945556640625, -1.441131591796875, -1.3834686279296875, -1.3258056640625, -1.2681427001953125, -1.210479736328125, -1.1528167724609375, -1.09515380859375, -1.0374908447265625, -0.979827880859375, -0.9221649169921875, -0.864501953125, -0.8068389892578125, -0.749176025390625, -0.6915130615234375, -0.63385009765625, -0.5761871337890625, -0.518524169921875, -0.4608612060546875, -0.4031982421875, -0.3455352783203125, -0.287872314453125, -0.2302093505859375, -0.17254638671875, -0.1148834228515625, -0.057220458984375, 0.0004425048828125, 0.05810546875, 0.1157684326171875, 0.173431396484375, 0.2310943603515625, 0.28875732421875, 0.3464202880859375, 0.404083251953125, 0.4617462158203125, 0.5194091796875, 0.5770721435546875, 0.634735107421875, 0.6923980712890625, 0.75006103515625, 0.8077239990234375, 0.865386962890625, 0.9230499267578125, 0.980712890625, 1.0383758544921875, 1.096038818359375, 1.1537017822265625, 1.21136474609375, 1.2690277099609375, 1.326690673828125, 1.3843536376953125, 1.4420166015625, 1.4996795654296875, 1.557342529296875, 1.6150054931640625, 1.67266845703125, 1.7303314208984375, 1.787994384765625, 1.8456573486328125, 1.9033203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 10.0, 5.0, 3.0, 12.0, 5.0, 6.0, 19.0, 22.0, 17.0, 37.0, 45.0, 64.0, 107.0, 106.0, 119.0, 113.0, 81.0, 58.0, 34.0, 28.0, 17.0, 18.0, 21.0, 12.0, 8.0, 6.0, 7.0, 2.0, 6.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.107421875, -2.0442047119140625, -1.980987548828125, -1.9177703857421875, -1.85455322265625, -1.7913360595703125, -1.728118896484375, -1.6649017333984375, -1.6016845703125, -1.5384674072265625, -1.475250244140625, -1.4120330810546875, -1.34881591796875, -1.2855987548828125, -1.222381591796875, -1.1591644287109375, -1.095947265625, -1.0327301025390625, -0.969512939453125, -0.9062957763671875, -0.84307861328125, -0.7798614501953125, -0.716644287109375, -0.6534271240234375, -0.5902099609375, -0.5269927978515625, -0.463775634765625, -0.4005584716796875, -0.33734130859375, -0.2741241455078125, -0.210906982421875, -0.1476898193359375, -0.08447265625, -0.0212554931640625, 0.041961669921875, 0.1051788330078125, 0.16839599609375, 0.2316131591796875, 0.294830322265625, 0.3580474853515625, 0.4212646484375, 0.4844818115234375, 0.547698974609375, 0.6109161376953125, 0.67413330078125, 0.7373504638671875, 0.800567626953125, 0.8637847900390625, 0.927001953125, 0.9902191162109375, 1.053436279296875, 1.1166534423828125, 1.17987060546875, 1.2430877685546875, 1.306304931640625, 1.3695220947265625, 1.4327392578125, 1.4959564208984375, 1.559173583984375, 1.6223907470703125, 1.68560791015625, 1.7488250732421875, 1.812042236328125, 1.8752593994140625, 1.9384765625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 11.0, 19.0, 37.0, 70.0, 160.0, 493.0, 98.0, 41.0, 32.0, 18.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-153.13253784179688, -149.51748657226562, -145.90245056152344, -142.2873992919922, -138.67236328125, -135.05731201171875, -131.4422607421875, -127.82722473144531, -124.21217346191406, -120.59712982177734, -116.98208618164062, -113.36703491210938, -109.75199127197266, -106.13694763183594, -102.52190399169922, -98.9068603515625, -95.29181671142578, -91.67677307128906, -88.06172943115234, -84.44668579101562, -80.83163452148438, -77.21659088134766, -73.60154724121094, -69.98650360107422, -66.3714599609375, -62.75641632080078, -59.1413688659668, -55.52632522583008, -51.911277770996094, -48.296234130859375, -44.681190490722656, -41.06614685058594, -37.45109558105469, -33.83605194091797, -30.221004486083984, -26.605960845947266, -22.990915298461914, -19.375869750976562, -15.760826110839844, -12.145780563354492, -8.53073501586914, -4.915689945220947, -1.300644874572754, 2.3143997192382812, 5.929445266723633, 9.544490814208984, 13.159534454345703, 16.774580001831055, 20.389625549316406, 24.004671096801758, 27.61971664428711, 31.234760284423828, 34.84980773925781, 38.46485137939453, 42.07989501953125, 45.69493865966797, 49.30998611450195, 52.92502975463867, 56.540077209472656, 60.155120849609375, 63.770164489746094, 67.38520812988281, 71.00025939941406, 74.61530303955078, 78.2303466796875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 7.0, 8.0, 5.0, 7.0, 9.0, 8.0, 10.0, 15.0, 20.0, 19.0, 15.0, 17.0, 24.0, 18.0, 39.0, 102.0, 137.0, 152.0, 124.0, 42.0, 26.0, 22.0, 24.0, 17.0, 24.0, 13.0, 14.0, 10.0, 8.0, 14.0, 8.0, 7.0, 6.0, 3.0, 7.0, 2.0, 7.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-70.59358215332031, -68.57595825195312, -66.55833435058594, -64.54070281982422, -62.52307891845703, -60.505455017089844, -58.48782730102539, -56.47019958496094, -54.45257568359375, -52.43495178222656, -50.41732406616211, -48.399696350097656, -46.38207244873047, -44.36444854736328, -42.34682083129883, -40.329193115234375, -38.31156921386719, -36.2939453125, -34.27631759643555, -32.258689880371094, -30.241065979003906, -28.223440170288086, -26.205814361572266, -24.188188552856445, -22.170562744140625, -20.152936935424805, -18.135311126708984, -16.117685317993164, -14.100059509277344, -12.082433700561523, -10.064807891845703, -8.047182083129883, -6.029563903808594, -4.011938095092773, -1.9943122863769531, 0.023313522338867188, 2.0409393310546875, 4.058565139770508, 6.076190948486328, 8.093816757202148, 10.111442565917969, 12.129068374633789, 14.14669418334961, 16.16431999206543, 18.18194580078125, 20.19957160949707, 22.21719741821289, 24.23482322692871, 26.25244903564453, 28.27007484436035, 30.287700653076172, 32.305328369140625, 34.32295227050781, 36.340576171875, 38.35820388793945, 40.375831604003906, 42.393455505371094, 44.41107940673828, 46.428707122802734, 48.44633483886719, 50.463958740234375, 52.48158264160156, 54.499210357666016, 56.51683807373047, 58.534461975097656]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 15.0, 16.0, 23.0, 30.0, 38.0, 53.0, 63.0, 180.0, 282.0, 62.0, 50.0, 49.0, 31.0, 35.0, 13.0, 17.0, 7.0, 3.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.890625, -14.5601806640625, -14.229736328125, -13.8992919921875, -13.56884765625, -13.2384033203125, -12.907958984375, -12.5775146484375, -12.2470703125, -11.9166259765625, -11.586181640625, -11.2557373046875, -10.92529296875, -10.5948486328125, -10.264404296875, -9.9339599609375, -9.603515625, -9.2730712890625, -8.942626953125, -8.6121826171875, -8.28173828125, -7.9512939453125, -7.620849609375, -7.2904052734375, -6.9599609375, -6.6295166015625, -6.299072265625, -5.9686279296875, -5.63818359375, -5.3077392578125, -4.977294921875, -4.6468505859375, -4.31640625, -3.9859619140625, -3.655517578125, -3.3250732421875, -2.99462890625, -2.6641845703125, -2.333740234375, -2.0032958984375, -1.6728515625, -1.3424072265625, -1.011962890625, -0.6815185546875, -0.35107421875, -0.0206298828125, 0.309814453125, 0.6402587890625, 0.970703125, 1.3011474609375, 1.631591796875, 1.9620361328125, 2.29248046875, 2.6229248046875, 2.953369140625, 3.2838134765625, 3.6142578125, 3.9447021484375, 4.275146484375, 4.6055908203125, 4.93603515625, 5.2664794921875, 5.596923828125, 5.9273681640625, 6.2578125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 10.0, 4.0, 10.0, 18.0, 27.0, 38.0, 63.0, 114.0, 211.0, 444.0, 1582.0, 9004.0, 8345523.0, 27309.0, 2810.0, 760.0, 259.0, 137.0, 78.0, 44.0, 53.0, 18.0, 20.0, 9.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0, 2.0, 6.0, 2.0, 1.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.94425201416016, -85.2537841796875, -82.56331634521484, -79.87284851074219, -77.18238067626953, -74.49191284179688, -71.80144500732422, -69.11097717285156, -66.4205093383789, -63.73004150390625, -61.039573669433594, -58.34910583496094, -55.65863800048828, -52.968170166015625, -50.27770233154297, -47.58723449707031, -44.896766662597656, -42.206298828125, -39.515830993652344, -36.82536315917969, -34.13489532470703, -31.444427490234375, -28.75395965576172, -26.063491821289062, -23.373023986816406, -20.68255615234375, -17.992088317871094, -15.301620483398438, -12.611152648925781, -9.920684814453125, -7.230216979980469, -4.5397491455078125, -1.849273681640625, 0.8411941528320312, 3.5316619873046875, 6.222129821777344, 8.91259765625, 11.603065490722656, 14.293533325195312, 16.98400115966797, 19.674468994140625, 22.36493682861328, 25.055404663085938, 27.745872497558594, 30.43634033203125, 33.126808166503906, 35.81727600097656, 38.50774383544922, 41.198211669921875, 43.88867950439453, 46.57914733886719, 49.269615173339844, 51.9600830078125, 54.650550842285156, 57.34101867675781, 60.03148651123047, 62.721954345703125, 65.41242218017578, 68.10289001464844, 70.7933578491211, 73.48382568359375, 76.1742935180664, 78.86476135253906, 81.55522918701172, 84.24569702148438]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 7.0, 5.0, 9.0, 5.0, 3.0, 5.0, 6.0, 4.0, 3.0, 5.0, 2.0, 5.0, 3.0, 7.0, 2.0, 0.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.10792541503906, -154.2130584716797, -149.31817626953125, -144.42330932617188, -139.5284423828125, -134.63357543945312, -129.7386932373047, -124.84382629394531, -119.9489517211914, -115.0540771484375, -110.15921020507812, -105.26433563232422, -100.36946105957031, -95.47459411621094, -90.57971954345703, -85.68484497070312, -80.78997802734375, -75.89510345458984, -71.00023651123047, -66.10536193847656, -61.21049118041992, -56.31562042236328, -51.420745849609375, -46.525875091552734, -41.631004333496094, -36.73613357543945, -31.84126091003418, -26.946388244628906, -22.051517486572266, -17.156646728515625, -12.261774063110352, -7.366901397705078, -2.4720458984375, 2.422825813293457, 7.317697525024414, 12.212569236755371, 17.107440948486328, 22.00231170654297, 26.897184371948242, 31.792057037353516, 36.686927795410156, 41.5817985534668, 46.47666931152344, 51.371543884277344, 56.266414642333984, 61.161285400390625, 66.05615997314453, 70.95103454589844, 75.84590148925781, 80.74077606201172, 85.6356430053711, 90.530517578125, 95.42538452148438, 100.32025909423828, 105.21513366699219, 110.11000061035156, 115.00487518310547, 119.89974975585938, 124.79461669921875, 129.68948364257812, 134.58436584472656, 139.47923278808594, 144.3740997314453, 149.26898193359375, 154.16384887695312]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 13.0, 21.0, 28.0, 36.0, 78.0, 73.0, 176.0, 270.0, 476.0, 902.0, 1887.0, 4420.0, 12349.0, 37975.0, 125270.0, 212674.0, 85924.0, 26423.0, 8819.0, 3320.0, 1504.0, 699.0, 372.0, 201.0, 134.0, 67.0, 50.0, 29.0, 23.0, 17.0, 5.0, 9.0, 1.0, 0.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-62.90625, -61.1259765625, -59.345703125, -57.5654296875, -55.78515625, -54.0048828125, -52.224609375, -50.4443359375, -48.6640625, -46.8837890625, -45.103515625, -43.3232421875, -41.54296875, -39.7626953125, -37.982421875, -36.2021484375, -34.421875, -32.6416015625, -30.861328125, -29.0810546875, -27.30078125, -25.5205078125, -23.740234375, -21.9599609375, -20.1796875, -18.3994140625, -16.619140625, -14.8388671875, -13.05859375, -11.2783203125, -9.498046875, -7.7177734375, -5.9375, -4.1572265625, -2.376953125, -0.5966796875, 1.18359375, 2.9638671875, 4.744140625, 6.5244140625, 8.3046875, 10.0849609375, 11.865234375, 13.6455078125, 15.42578125, 17.2060546875, 18.986328125, 20.7666015625, 22.546875, 24.3271484375, 26.107421875, 27.8876953125, 29.66796875, 31.4482421875, 33.228515625, 35.0087890625, 36.7890625, 38.5693359375, 40.349609375, 42.1298828125, 43.91015625, 45.6904296875, 47.470703125, 49.2509765625, 51.03125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 15.0, 20.0, 29.0, 45.0, 59.0, 80.0, 100.0, 127.0, 133.0, 81.0, 78.0, 63.0, 45.0, 37.0, 20.0, 24.0, 11.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.611328125, -10.24609375, -9.880859375, -9.515625, -9.150390625, -8.78515625, -8.419921875, -8.0546875, -7.689453125, -7.32421875, -6.958984375, -6.59375, -6.228515625, -5.86328125, -5.498046875, -5.1328125, -4.767578125, -4.40234375, -4.037109375, -3.671875, -3.306640625, -2.94140625, -2.576171875, -2.2109375, -1.845703125, -1.48046875, -1.115234375, -0.75, -0.384765625, -0.01953125, 0.345703125, 0.7109375, 1.076171875, 1.44140625, 1.806640625, 2.171875, 2.537109375, 2.90234375, 3.267578125, 3.6328125, 3.998046875, 4.36328125, 4.728515625, 5.09375, 5.458984375, 5.82421875, 6.189453125, 6.5546875, 6.919921875, 7.28515625, 7.650390625, 8.015625, 8.380859375, 8.74609375, 9.111328125, 9.4765625, 9.841796875, 10.20703125, 10.572265625, 10.9375, 11.302734375, 11.66796875, 12.033203125, 12.3984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 4.0, 1.0, 6.0, 7.0, 4.0, 15.0, 25.0, 14.0, 31.0, 65.0, 58.0, 75.0, 59.0, 34.0, 27.0, 18.0, 3.0, 8.0, 4.0, 4.0, 2.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.72188949584961, -53.93724060058594, -52.152591705322266, -50.367942810058594, -48.58329391479492, -46.79864501953125, -45.01399230957031, -43.229347229003906, -41.44469451904297, -39.6600456237793, -37.875396728515625, -36.09074783325195, -34.30609893798828, -32.52145004272461, -30.736799240112305, -28.952150344848633, -27.167503356933594, -25.382854461669922, -23.59820556640625, -21.813556671142578, -20.028907775878906, -18.244258880615234, -16.45960807800293, -14.674959182739258, -12.890310287475586, -11.105661392211914, -9.321012496948242, -7.536362648010254, -5.751713752746582, -3.96706485748291, -2.182415008544922, -0.39776611328125, 1.3868827819824219, 3.171531915664673, 4.956181049346924, 6.740830421447754, 8.525479316711426, 10.310128211975098, 12.094778060913086, 13.879426956176758, 15.66407585144043, 17.4487247467041, 19.233373641967773, 21.018024444580078, 22.80267333984375, 24.587322235107422, 26.371971130371094, 28.156620025634766, 29.941268920898438, 31.72591781616211, 33.51056671142578, 35.29521560668945, 37.079864501953125, 38.8645133972168, 40.64916229248047, 42.433815002441406, 44.21846008300781, 46.003108978271484, 47.787757873535156, 49.57240676879883, 51.3570556640625, 53.14170455932617, 54.926353454589844, 56.71100616455078, 58.49565505981445]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 7.0, 4.0, 8.0, 16.0, 9.0, 19.0, 37.0, 55.0, 71.0, 70.0, 65.0, 43.0, 17.0, 15.0, 9.0, 5.0, 7.0, 6.0, 2.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.547569274902344, -40.342533111572266, -39.13750076293945, -37.932464599609375, -36.72743225097656, -35.522396087646484, -34.317359924316406, -33.112327575683594, -31.907291412353516, -30.70225715637207, -29.497222900390625, -28.292186737060547, -27.0871524810791, -25.882118225097656, -24.677082061767578, -23.472047805786133, -22.267013549804688, -21.061979293823242, -19.856945037841797, -18.65190887451172, -17.446874618530273, -16.241840362548828, -15.036805152893066, -13.831769943237305, -12.62673568725586, -11.421701431274414, -10.216666221618652, -9.01163101196289, -7.806596755981445, -6.601562023162842, -5.396527290344238, -4.191492080688477, -2.9864578247070312, -1.7814230918884277, -0.5763883590698242, 0.6286463737487793, 1.8336811065673828, 3.0387158393859863, 4.24375057220459, 5.448785781860352, 6.653820037841797, 7.8588547706604, 9.063889503479004, 10.268924713134766, 11.473958969116211, 12.678993225097656, 13.884028434753418, 15.08906364440918, 16.294097900390625, 17.49913215637207, 18.704166412353516, 19.909202575683594, 21.11423683166504, 22.319271087646484, 23.524307250976562, 24.729341506958008, 25.934375762939453, 27.1394100189209, 28.344444274902344, 29.549480438232422, 30.754514694213867, 31.959548950195312, 33.16458511352539, 34.36962127685547, 35.57465362548828]}, "eval/loss": 1.8364678621292114, "eval/wer": 0.2812376041253471, "eval/runtime": 832.195, "eval/samples_per_second": 3.175, "eval/steps_per_second": 0.398, "train/train_runtime": 108037.8512, "train/train_samples_per_second": 5.283, "train/train_steps_per_second": 0.165, "train/total_flos": 0.0, "train/train_loss": 2.302149100206905} \ No newline at end of file +{"train/loss": 0.0162, "train/learning_rate": 8.907363420427554e-09, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 109258, "_timestamp": 1647483800, "_step": 17852, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 8.0, 12.0, 6.0, 8.0, 6.0, 12.0, 15.0, 17.0, 22.0, 35.0, 43.0, 41.0, 53.0, 54.0, 47.0, 56.0, 65.0, 50.0, 58.0, 50.0, 53.0, 44.0, 45.0, 43.0, 38.0, 23.0, 22.0, 17.0, 19.0, 12.0, 9.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.21875762939453, -88.52344512939453, -86.828125, -85.1328125, -83.43749237060547, -81.74217987060547, -80.04685974121094, -78.35154724121094, -76.65623474121094, -74.96092224121094, -73.2656021118164, -71.5702896118164, -69.87496948242188, -68.17965698242188, -66.48433685302734, -64.78902435302734, -63.09370422363281, -61.39838790893555, -59.70307159423828, -58.007755279541016, -56.31243896484375, -54.61712646484375, -52.921810150146484, -51.22649383544922, -49.53117752075195, -47.83586120605469, -46.14054489135742, -44.445228576660156, -42.749916076660156, -41.054595947265625, -39.359283447265625, -37.66396713256836, -35.96865463256836, -34.273338317871094, -32.57802200317383, -30.882707595825195, -29.18739128112793, -27.492074966430664, -25.79676055908203, -24.101444244384766, -22.4061279296875, -20.710811614990234, -19.01549530029297, -17.320180892944336, -15.62486457824707, -13.929548263549805, -12.234232902526855, -10.538917541503906, -8.84360122680664, -7.148285388946533, -5.452969551086426, -3.7576537132263184, -2.062337875366211, -0.3670215606689453, 1.328293800354004, 3.023609161376953, 4.718925476074219, 6.414241313934326, 8.109557151794434, 9.804872512817383, 11.500188827514648, 13.195505142211914, 14.890820503234863, 16.586135864257812, 18.281452178955078]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 6.0, 3.0, 2.0, 7.0, 7.0, 12.0, 14.0, 7.0, 15.0, 15.0, 26.0, 24.0, 24.0, 22.0, 35.0, 31.0, 23.0, 37.0, 38.0, 36.0, 32.0, 50.0, 48.0, 40.0, 41.0, 39.0, 35.0, 33.0, 49.0, 19.0, 29.0, 29.0, 18.0, 25.0, 19.0, 16.0, 24.0, 9.0, 14.0, 16.0, 9.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.85319900512695, -38.5408935546875, -37.22859191894531, -35.91628646850586, -34.60398483276367, -33.29167938232422, -31.9793758392334, -30.667072296142578, -29.354766845703125, -28.042463302612305, -26.730159759521484, -25.41785430908203, -24.10555076599121, -22.79324722290039, -21.48094367980957, -20.16864013671875, -18.85633659362793, -17.54403305053711, -16.23172950744629, -14.919425010681152, -13.607120513916016, -12.294816970825195, -10.982513427734375, -9.670208930969238, -8.357905387878418, -7.0456013679504395, -5.733297348022461, -4.420993804931641, -3.108689785003662, -1.7963857650756836, -0.4840822219848633, 0.8282222747802734, 2.1405258178710938, 3.4528298377990723, 4.765133857727051, 6.077437400817871, 7.38974142074585, 8.702045440673828, 10.014348983764648, 11.326653480529785, 12.638957023620605, 13.951260566711426, 15.263565063476562, 16.575868606567383, 17.888172149658203, 19.200477600097656, 20.512779235839844, 21.825084686279297, 23.137388229370117, 24.449691772460938, 25.761995315551758, 27.074298858642578, 28.38660430908203, 29.69890785217285, 31.011211395263672, 32.323516845703125, 33.63581848144531, 34.948123931884766, 36.26042556762695, 37.572731018066406, 38.885032653808594, 40.19733810424805, 41.5096435546875, 42.82194519042969, 44.13425064086914]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 10.0, 14.0, 25.0, 40.0, 47.0, 82.0, 141.0, 254.0, 401.0, 613.0, 991.0, 1579.0, 2531.0, 4057.0, 6334.0, 10190.0, 15867.0, 25238.0, 39251.0, 60422.0, 93260.0, 140151.0, 206561.0, 294505.0, 398751.0, 495048.0, 539183.0, 503644.0, 412134.0, 306321.0, 215690.0, 146820.0, 97775.0, 62907.0, 41042.0, 26517.0, 16954.0, 10778.0, 6679.0, 4275.0, 2650.0, 1652.0, 1122.0, 678.0, 415.0, 250.0, 173.0, 99.0, 64.0, 38.0, 33.0, 10.0, 9.0, 4.0, 6.0, 1.0, 2.0, 1.0], "bins": [-69.375, -67.244140625, -65.11328125, -62.982421875, -60.8515625, -58.720703125, -56.58984375, -54.458984375, -52.328125, -50.197265625, -48.06640625, -45.935546875, -43.8046875, -41.673828125, -39.54296875, -37.412109375, -35.28125, -33.150390625, -31.01953125, -28.888671875, -26.7578125, -24.626953125, -22.49609375, -20.365234375, -18.234375, -16.103515625, -13.97265625, -11.841796875, -9.7109375, -7.580078125, -5.44921875, -3.318359375, -1.1875, 0.943359375, 3.07421875, 5.205078125, 7.3359375, 9.466796875, 11.59765625, 13.728515625, 15.859375, 17.990234375, 20.12109375, 22.251953125, 24.3828125, 26.513671875, 28.64453125, 30.775390625, 32.90625, 35.037109375, 37.16796875, 39.298828125, 41.4296875, 43.560546875, 45.69140625, 47.822265625, 49.953125, 52.083984375, 54.21484375, 56.345703125, 58.4765625, 60.607421875, 62.73828125, 64.869140625, 67.0]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 8.0, 3.0, 8.0, 12.0, 9.0, 7.0, 7.0, 9.0, 20.0, 23.0, 17.0, 19.0, 19.0, 32.0, 23.0, 21.0, 29.0, 28.0, 30.0, 42.0, 37.0, 47.0, 35.0, 42.0, 34.0, 29.0, 32.0, 33.0, 40.0, 29.0, 17.0, 22.0, 24.0, 28.0, 23.0, 16.0, 8.0, 15.0, 16.0, 24.0, 10.0, 10.0, 10.0, 11.0, 8.0, 7.0, 4.0, 4.0, 5.0, 1.0, 4.0, 1.0, 6.0], "bins": [-44.59375, -43.29345703125, -41.9931640625, -40.69287109375, -39.392578125, -38.09228515625, -36.7919921875, -35.49169921875, -34.19140625, -32.89111328125, -31.5908203125, -30.29052734375, -28.990234375, -27.68994140625, -26.3896484375, -25.08935546875, -23.7890625, -22.48876953125, -21.1884765625, -19.88818359375, -18.587890625, -17.28759765625, -15.9873046875, -14.68701171875, -13.38671875, -12.08642578125, -10.7861328125, -9.48583984375, -8.185546875, -6.88525390625, -5.5849609375, -4.28466796875, -2.984375, -1.68408203125, -0.3837890625, 0.91650390625, 2.216796875, 3.51708984375, 4.8173828125, 6.11767578125, 7.41796875, 8.71826171875, 10.0185546875, 11.31884765625, 12.619140625, 13.91943359375, 15.2197265625, 16.52001953125, 17.8203125, 19.12060546875, 20.4208984375, 21.72119140625, 23.021484375, 24.32177734375, 25.6220703125, 26.92236328125, 28.22265625, 29.52294921875, 30.8232421875, 32.12353515625, 33.423828125, 34.72412109375, 36.0244140625, 37.32470703125, 38.625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 2.0, 11.0, 12.0, 27.0, 26.0, 44.0, 74.0, 134.0, 188.0, 283.0, 516.0, 890.0, 1421.0, 2352.0, 3865.0, 6632.0, 11175.0, 18153.0, 29958.0, 48549.0, 76983.0, 119442.0, 180406.0, 259012.0, 353465.0, 443011.0, 505307.0, 508941.0, 454892.0, 365317.0, 272535.0, 189286.0, 126771.0, 81705.0, 51802.0, 31955.0, 19354.0, 11873.0, 7158.0, 4307.0, 2539.0, 1601.0, 909.0, 554.0, 342.0, 180.0, 125.0, 80.0, 47.0, 28.0, 18.0, 12.0, 11.0, 3.0, 3.0, 3.0], "bins": [-63.9375, -62.1142578125, -60.291015625, -58.4677734375, -56.64453125, -54.8212890625, -52.998046875, -51.1748046875, -49.3515625, -47.5283203125, -45.705078125, -43.8818359375, -42.05859375, -40.2353515625, -38.412109375, -36.5888671875, -34.765625, -32.9423828125, -31.119140625, -29.2958984375, -27.47265625, -25.6494140625, -23.826171875, -22.0029296875, -20.1796875, -18.3564453125, -16.533203125, -14.7099609375, -12.88671875, -11.0634765625, -9.240234375, -7.4169921875, -5.59375, -3.7705078125, -1.947265625, -0.1240234375, 1.69921875, 3.5224609375, 5.345703125, 7.1689453125, 8.9921875, 10.8154296875, 12.638671875, 14.4619140625, 16.28515625, 18.1083984375, 19.931640625, 21.7548828125, 23.578125, 25.4013671875, 27.224609375, 29.0478515625, 30.87109375, 32.6943359375, 34.517578125, 36.3408203125, 38.1640625, 39.9873046875, 41.810546875, 43.6337890625, 45.45703125, 47.2802734375, 49.103515625, 50.9267578125, 52.75]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 8.0, 4.0, 6.0, 13.0, 10.0, 21.0, 16.0, 24.0, 26.0, 31.0, 30.0, 48.0, 58.0, 77.0, 75.0, 86.0, 118.0, 124.0, 114.0, 150.0, 153.0, 144.0, 208.0, 194.0, 204.0, 208.0, 216.0, 222.0, 181.0, 174.0, 173.0, 137.0, 132.0, 109.0, 109.0, 89.0, 70.0, 64.0, 50.0, 41.0, 39.0, 36.0, 20.0, 16.0, 10.0, 15.0, 5.0, 6.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.765625, -21.989013671875, -21.21240234375, -20.435791015625, -19.6591796875, -18.882568359375, -18.10595703125, -17.329345703125, -16.552734375, -15.776123046875, -14.99951171875, -14.222900390625, -13.4462890625, -12.669677734375, -11.89306640625, -11.116455078125, -10.33984375, -9.563232421875, -8.78662109375, -8.010009765625, -7.2333984375, -6.456787109375, -5.68017578125, -4.903564453125, -4.126953125, -3.350341796875, -2.57373046875, -1.797119140625, -1.0205078125, -0.243896484375, 0.53271484375, 1.309326171875, 2.0859375, 2.862548828125, 3.63916015625, 4.415771484375, 5.1923828125, 5.968994140625, 6.74560546875, 7.522216796875, 8.298828125, 9.075439453125, 9.85205078125, 10.628662109375, 11.4052734375, 12.181884765625, 12.95849609375, 13.735107421875, 14.51171875, 15.288330078125, 16.06494140625, 16.841552734375, 17.6181640625, 18.394775390625, 19.17138671875, 19.947998046875, 20.724609375, 21.501220703125, 22.27783203125, 23.054443359375, 23.8310546875, 24.607666015625, 25.38427734375, 26.160888671875, 26.9375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 9.0, 9.0, 13.0, 25.0, 20.0, 19.0, 29.0, 29.0, 32.0, 37.0, 40.0, 34.0, 62.0, 40.0, 40.0, 39.0, 40.0, 51.0, 46.0, 42.0, 44.0, 35.0, 44.0, 26.0, 29.0, 25.0, 25.0, 21.0, 17.0, 14.0, 16.0, 10.0, 12.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-78.66213989257812, -76.70450592041016, -74.74687957763672, -72.78924560546875, -70.83161163330078, -68.87398529052734, -66.91635131835938, -64.9587173461914, -63.00109100341797, -61.043460845947266, -59.0858268737793, -57.128196716308594, -55.17056655883789, -53.21293640136719, -51.25530242919922, -49.297672271728516, -47.34003829956055, -45.382408142089844, -43.424774169921875, -41.46714401245117, -39.50951385498047, -37.5518798828125, -35.5942497253418, -33.636619567871094, -31.678987503051758, -29.721355438232422, -27.76372528076172, -25.806093215942383, -23.848461151123047, -21.890830993652344, -19.933198928833008, -17.975566864013672, -16.01793670654297, -14.06030559539795, -12.10267448425293, -10.145042419433594, -8.187411308288574, -6.229780197143555, -4.272148132324219, -2.314517021179199, -0.3568859100341797, 1.600745439529419, 3.5583767890930176, 5.516008377075195, 7.473639488220215, 9.431270599365234, 11.38890266418457, 13.34653377532959, 15.30416488647461, 17.261796951293945, 19.21942710876465, 21.177059173583984, 23.134689331054688, 25.092321395874023, 27.04995346069336, 29.007583618164062, 30.9652156829834, 32.922847747802734, 34.88047790527344, 36.838111877441406, 38.79574203491211, 40.75337219238281, 42.71100616455078, 44.668636322021484, 46.62626647949219]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 10.0, 10.0, 15.0, 9.0, 19.0, 19.0, 17.0, 25.0, 30.0, 20.0, 25.0, 38.0, 39.0, 30.0, 35.0, 28.0, 41.0, 38.0, 50.0, 41.0, 42.0, 46.0, 35.0, 28.0, 31.0, 26.0, 42.0, 27.0, 34.0, 23.0, 19.0, 18.0, 13.0, 10.0, 10.0, 7.0, 12.0, 9.0, 8.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.91980743408203, -60.128684997558594, -58.33755874633789, -56.54643630981445, -54.75531005859375, -52.96418762207031, -51.173065185546875, -49.38194274902344, -47.590816497802734, -45.7996940612793, -44.008567810058594, -42.217445373535156, -40.42632293701172, -38.635196685791016, -36.84407424926758, -35.052947998046875, -33.26182556152344, -31.470701217651367, -29.679576873779297, -27.88845443725586, -26.09733009338379, -24.30620574951172, -22.51508331298828, -20.72395896911621, -18.93283462524414, -17.14171028137207, -15.350586891174316, -13.559463500976562, -11.768339157104492, -9.977214813232422, -8.186091423034668, -6.394968032836914, -4.603847503662109, -2.8127236366271973, -1.0215997695922852, 0.769524097442627, 2.560647964477539, 4.351772308349609, 6.142895698547363, 7.934019088745117, 9.725143432617188, 11.516267776489258, 13.307391166687012, 15.098514556884766, 16.889638900756836, 18.680763244628906, 20.471885681152344, 22.263010025024414, 24.054134368896484, 25.845258712768555, 27.636383056640625, 29.427505493164062, 31.218629837036133, 33.0097541809082, 34.80087661743164, 36.592002868652344, 38.38312530517578, 40.17424774169922, 41.96537399291992, 43.75649642944336, 45.54762268066406, 47.3387451171875, 49.12986755371094, 50.920989990234375, 52.71211624145508]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 9.0, 12.0, 13.0, 28.0, 43.0, 55.0, 60.0, 123.0, 208.0, 287.0, 476.0, 743.0, 1171.0, 1851.0, 3053.0, 4997.0, 8039.0, 13451.0, 22545.0, 37176.0, 60395.0, 93730.0, 133593.0, 161822.0, 156923.0, 124441.0, 85225.0, 54203.0, 32889.0, 20007.0, 11904.0, 7386.0, 4376.0, 2726.0, 1632.0, 1085.0, 678.0, 388.0, 297.0, 198.0, 110.0, 84.0, 41.0, 29.0, 19.0, 16.0, 6.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-27.84375, -26.970458984375, -26.09716796875, -25.223876953125, -24.3505859375, -23.477294921875, -22.60400390625, -21.730712890625, -20.857421875, -19.984130859375, -19.11083984375, -18.237548828125, -17.3642578125, -16.490966796875, -15.61767578125, -14.744384765625, -13.87109375, -12.997802734375, -12.12451171875, -11.251220703125, -10.3779296875, -9.504638671875, -8.63134765625, -7.758056640625, -6.884765625, -6.011474609375, -5.13818359375, -4.264892578125, -3.3916015625, -2.518310546875, -1.64501953125, -0.771728515625, 0.1015625, 0.974853515625, 1.84814453125, 2.721435546875, 3.5947265625, 4.468017578125, 5.34130859375, 6.214599609375, 7.087890625, 7.961181640625, 8.83447265625, 9.707763671875, 10.5810546875, 11.454345703125, 12.32763671875, 13.200927734375, 14.07421875, 14.947509765625, 15.82080078125, 16.694091796875, 17.5673828125, 18.440673828125, 19.31396484375, 20.187255859375, 21.060546875, 21.933837890625, 22.80712890625, 23.680419921875, 24.5537109375, 25.427001953125, 26.30029296875, 27.173583984375, 28.046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 7.0, 9.0, 8.0, 13.0, 16.0, 16.0, 17.0, 18.0, 24.0, 34.0, 16.0, 21.0, 36.0, 40.0, 31.0, 25.0, 36.0, 38.0, 41.0, 40.0, 41.0, 43.0, 41.0, 38.0, 33.0, 30.0, 24.0, 37.0, 34.0, 29.0, 27.0, 22.0, 16.0, 17.0, 15.0, 9.0, 7.0, 9.0, 8.0, 11.0, 8.0, 8.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-63.125, -61.3271484375, -59.529296875, -57.7314453125, -55.93359375, -54.1357421875, -52.337890625, -50.5400390625, -48.7421875, -46.9443359375, -45.146484375, -43.3486328125, -41.55078125, -39.7529296875, -37.955078125, -36.1572265625, -34.359375, -32.5615234375, -30.763671875, -28.9658203125, -27.16796875, -25.3701171875, -23.572265625, -21.7744140625, -19.9765625, -18.1787109375, -16.380859375, -14.5830078125, -12.78515625, -10.9873046875, -9.189453125, -7.3916015625, -5.59375, -3.7958984375, -1.998046875, -0.2001953125, 1.59765625, 3.3955078125, 5.193359375, 6.9912109375, 8.7890625, 10.5869140625, 12.384765625, 14.1826171875, 15.98046875, 17.7783203125, 19.576171875, 21.3740234375, 23.171875, 24.9697265625, 26.767578125, 28.5654296875, 30.36328125, 32.1611328125, 33.958984375, 35.7568359375, 37.5546875, 39.3525390625, 41.150390625, 42.9482421875, 44.74609375, 46.5439453125, 48.341796875, 50.1396484375, 51.9375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 9.0, 10.0, 19.0, 30.0, 36.0, 43.0, 67.0, 76.0, 119.0, 172.0, 235.0, 322.0, 479.0, 715.0, 1129.0, 1667.0, 2723.0, 4209.0, 7163.0, 12027.0, 22436.0, 56611.0, 843408.0, 44976.0, 20407.0, 11344.0, 6641.0, 4013.0, 2580.0, 1604.0, 1038.0, 692.0, 449.0, 321.0, 250.0, 138.0, 88.0, 87.0, 58.0, 37.0, 32.0, 31.0, 16.0, 11.0, 10.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-58.9375, -57.1201171875, -55.302734375, -53.4853515625, -51.66796875, -49.8505859375, -48.033203125, -46.2158203125, -44.3984375, -42.5810546875, -40.763671875, -38.9462890625, -37.12890625, -35.3115234375, -33.494140625, -31.6767578125, -29.859375, -28.0419921875, -26.224609375, -24.4072265625, -22.58984375, -20.7724609375, -18.955078125, -17.1376953125, -15.3203125, -13.5029296875, -11.685546875, -9.8681640625, -8.05078125, -6.2333984375, -4.416015625, -2.5986328125, -0.78125, 1.0361328125, 2.853515625, 4.6708984375, 6.48828125, 8.3056640625, 10.123046875, 11.9404296875, 13.7578125, 15.5751953125, 17.392578125, 19.2099609375, 21.02734375, 22.8447265625, 24.662109375, 26.4794921875, 28.296875, 30.1142578125, 31.931640625, 33.7490234375, 35.56640625, 37.3837890625, 39.201171875, 41.0185546875, 42.8359375, 44.6533203125, 46.470703125, 48.2880859375, 50.10546875, 51.9228515625, 53.740234375, 55.5576171875, 57.375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 9.0, 8.0, 6.0, 15.0, 10.0, 16.0, 14.0, 22.0, 14.0, 21.0, 20.0, 23.0, 38.0, 34.0, 42.0, 29.0, 44.0, 37.0, 40.0, 54.0, 45.0, 39.0, 27.0, 46.0, 40.0, 33.0, 40.0, 28.0, 40.0, 28.0, 28.0, 17.0, 13.0, 22.0, 14.0, 8.0, 8.0, 8.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.65625, -39.41064453125, -38.1650390625, -36.91943359375, -35.673828125, -34.42822265625, -33.1826171875, -31.93701171875, -30.69140625, -29.44580078125, -28.2001953125, -26.95458984375, -25.708984375, -24.46337890625, -23.2177734375, -21.97216796875, -20.7265625, -19.48095703125, -18.2353515625, -16.98974609375, -15.744140625, -14.49853515625, -13.2529296875, -12.00732421875, -10.76171875, -9.51611328125, -8.2705078125, -7.02490234375, -5.779296875, -4.53369140625, -3.2880859375, -2.04248046875, -0.796875, 0.44873046875, 1.6943359375, 2.93994140625, 4.185546875, 5.43115234375, 6.6767578125, 7.92236328125, 9.16796875, 10.41357421875, 11.6591796875, 12.90478515625, 14.150390625, 15.39599609375, 16.6416015625, 17.88720703125, 19.1328125, 20.37841796875, 21.6240234375, 22.86962890625, 24.115234375, 25.36083984375, 26.6064453125, 27.85205078125, 29.09765625, 30.34326171875, 31.5888671875, 32.83447265625, 34.080078125, 35.32568359375, 36.5712890625, 37.81689453125, 39.0625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 3.0, 7.0, 5.0, 13.0, 11.0, 19.0, 49.0, 39.0, 72.0, 85.0, 142.0, 213.0, 415.0, 938.0, 2470.0, 10350.0, 92506.0, 916821.0, 18308.0, 3572.0, 1174.0, 541.0, 275.0, 138.0, 118.0, 61.0, 46.0, 39.0, 20.0, 18.0, 23.0, 11.0, 11.0, 6.0, 4.0, 1.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.0859375, -11.721435546875, -11.35693359375, -10.992431640625, -10.6279296875, -10.263427734375, -9.89892578125, -9.534423828125, -9.169921875, -8.805419921875, -8.44091796875, -8.076416015625, -7.7119140625, -7.347412109375, -6.98291015625, -6.618408203125, -6.25390625, -5.889404296875, -5.52490234375, -5.160400390625, -4.7958984375, -4.431396484375, -4.06689453125, -3.702392578125, -3.337890625, -2.973388671875, -2.60888671875, -2.244384765625, -1.8798828125, -1.515380859375, -1.15087890625, -0.786376953125, -0.421875, -0.057373046875, 0.30712890625, 0.671630859375, 1.0361328125, 1.400634765625, 1.76513671875, 2.129638671875, 2.494140625, 2.858642578125, 3.22314453125, 3.587646484375, 3.9521484375, 4.316650390625, 4.68115234375, 5.045654296875, 5.41015625, 5.774658203125, 6.13916015625, 6.503662109375, 6.8681640625, 7.232666015625, 7.59716796875, 7.961669921875, 8.326171875, 8.690673828125, 9.05517578125, 9.419677734375, 9.7841796875, 10.148681640625, 10.51318359375, 10.877685546875, 11.2421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 23.0, 30.0, 33.0, 54.0, 77.0, 108.0, 137.0, 147.0, 102.0, 86.0, 60.0, 36.0, 18.0, 17.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005898475646972656, -0.0005728527903556824, -0.0005558580160140991, -0.0005388632416725159, -0.0005218684673309326, -0.0005048736929893494, -0.0004878789186477661, -0.00047088414430618286, -0.0004538893699645996, -0.00043689459562301636, -0.0004198998212814331, -0.00040290504693984985, -0.0003859102725982666, -0.00036891549825668335, -0.0003519207239151001, -0.00033492594957351685, -0.0003179311752319336, -0.00030093640089035034, -0.0002839416265487671, -0.00026694685220718384, -0.0002499520778656006, -0.00023295730352401733, -0.00021596252918243408, -0.00019896775484085083, -0.00018197298049926758, -0.00016497820615768433, -0.00014798343181610107, -0.00013098865747451782, -0.00011399388313293457, -9.699910879135132e-05, -8.000433444976807e-05, -6.300956010818481e-05, -4.601478576660156e-05, -2.902001142501831e-05, -1.2025237083435059e-05, 4.969537258148193e-06, 2.1964311599731445e-05, 3.89590859413147e-05, 5.595386028289795e-05, 7.29486346244812e-05, 8.994340896606445e-05, 0.0001069381833076477, 0.00012393295764923096, 0.0001409277319908142, 0.00015792250633239746, 0.0001749172806739807, 0.00019191205501556396, 0.00020890682935714722, 0.00022590160369873047, 0.00024289637804031372, 0.00025989115238189697, 0.0002768859267234802, 0.0002938807010650635, 0.00031087547540664673, 0.00032787024974823, 0.00034486502408981323, 0.0003618597984313965, 0.00037885457277297974, 0.000395849347114563, 0.00041284412145614624, 0.0004298388957977295, 0.00044683367013931274, 0.000463828444480896, 0.00048082321882247925, 0.0004978179931640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 12.0, 18.0, 26.0, 27.0, 44.0, 60.0, 74.0, 151.0, 212.0, 399.0, 745.0, 1475.0, 3388.0, 8242.0, 20828.0, 54635.0, 139127.0, 277642.0, 290147.0, 151537.0, 60375.0, 22905.0, 9126.0, 3815.0, 1639.0, 815.0, 402.0, 230.0, 156.0, 92.0, 59.0, 43.0, 22.0, 17.0, 21.0, 11.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -8.02288818359375, -7.7801513671875, -7.53741455078125, -7.294677734375, -7.05194091796875, -6.8092041015625, -6.56646728515625, -6.32373046875, -6.08099365234375, -5.8382568359375, -5.59552001953125, -5.352783203125, -5.11004638671875, -4.8673095703125, -4.62457275390625, -4.3818359375, -4.13909912109375, -3.8963623046875, -3.65362548828125, -3.410888671875, -3.16815185546875, -2.9254150390625, -2.68267822265625, -2.43994140625, -2.19720458984375, -1.9544677734375, -1.71173095703125, -1.468994140625, -1.22625732421875, -0.9835205078125, -0.74078369140625, -0.498046875, -0.25531005859375, -0.0125732421875, 0.23016357421875, 0.472900390625, 0.71563720703125, 0.9583740234375, 1.20111083984375, 1.44384765625, 1.68658447265625, 1.9293212890625, 2.17205810546875, 2.414794921875, 2.65753173828125, 2.9002685546875, 3.14300537109375, 3.3857421875, 3.62847900390625, 3.8712158203125, 4.11395263671875, 4.356689453125, 4.59942626953125, 4.8421630859375, 5.08489990234375, 5.32763671875, 5.57037353515625, 5.8131103515625, 6.05584716796875, 6.298583984375, 6.54132080078125, 6.7840576171875, 7.02679443359375, 7.26953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 9.0, 7.0, 8.0, 8.0, 15.0, 13.0, 17.0, 19.0, 17.0, 25.0, 38.0, 31.0, 42.0, 46.0, 71.0, 58.0, 50.0, 58.0, 52.0, 47.0, 55.0, 43.0, 30.0, 33.0, 31.0, 27.0, 27.0, 15.0, 13.0, 18.0, 16.0, 14.0, 10.0, 6.0, 6.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4169921875, -1.37042236328125, -1.3238525390625, -1.27728271484375, -1.230712890625, -1.18414306640625, -1.1375732421875, -1.09100341796875, -1.04443359375, -0.99786376953125, -0.9512939453125, -0.90472412109375, -0.858154296875, -0.81158447265625, -0.7650146484375, -0.71844482421875, -0.671875, -0.62530517578125, -0.5787353515625, -0.53216552734375, -0.485595703125, -0.43902587890625, -0.3924560546875, -0.34588623046875, -0.29931640625, -0.25274658203125, -0.2061767578125, -0.15960693359375, -0.113037109375, -0.06646728515625, -0.0198974609375, 0.02667236328125, 0.0732421875, 0.11981201171875, 0.1663818359375, 0.21295166015625, 0.259521484375, 0.30609130859375, 0.3526611328125, 0.39923095703125, 0.44580078125, 0.49237060546875, 0.5389404296875, 0.58551025390625, 0.632080078125, 0.67864990234375, 0.7252197265625, 0.77178955078125, 0.818359375, 0.86492919921875, 0.9114990234375, 0.95806884765625, 1.004638671875, 1.05120849609375, 1.0977783203125, 1.14434814453125, 1.19091796875, 1.23748779296875, 1.2840576171875, 1.33062744140625, 1.377197265625, 1.42376708984375, 1.4703369140625, 1.51690673828125, 1.5634765625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 12.0, 5.0, 6.0, 14.0, 18.0, 22.0, 26.0, 22.0, 29.0, 34.0, 46.0, 41.0, 53.0, 47.0, 45.0, 44.0, 46.0, 47.0, 47.0, 51.0, 54.0, 42.0, 46.0, 25.0, 28.0, 29.0, 18.0, 20.0, 20.0, 15.0, 9.0, 12.0, 10.0, 5.0, 7.0, 4.0, 2.0, 4.0], "bins": [-92.06939697265625, -89.90866088867188, -87.7479248046875, -85.5871810913086, -83.42644500732422, -81.26570892333984, -79.10497283935547, -76.9442367553711, -74.78349304199219, -72.62275695800781, -70.46202087402344, -68.30127716064453, -66.14054107666016, -63.97980499267578, -61.819068908691406, -59.65833282470703, -57.497596740722656, -55.33686065673828, -53.17612075805664, -51.015384674072266, -48.854644775390625, -46.69390869140625, -44.533172607421875, -42.3724365234375, -40.21169662475586, -38.050960540771484, -35.890220642089844, -33.72948455810547, -31.56874656677246, -29.408008575439453, -27.247272491455078, -25.08653450012207, -22.925800323486328, -20.76506233215332, -18.604324340820312, -16.443588256835938, -14.28285026550293, -12.122112274169922, -9.96137523651123, -7.800638198852539, -5.639900207519531, -3.4791626930236816, -1.318425178527832, 0.8423123359680176, 3.003049850463867, 5.163787841796875, 7.324524879455566, 9.485261917114258, 11.645999908447266, 13.806737899780273, 15.967474937438965, 18.128211975097656, 20.288949966430664, 22.449687957763672, 24.610424041748047, 26.771162033081055, 28.931900024414062, 31.09263801574707, 33.25337600708008, 35.41411209106445, 37.574851989746094, 39.73558807373047, 41.896324157714844, 44.05706024169922, 46.21780014038086]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 12.0, 8.0, 18.0, 7.0, 12.0, 22.0, 16.0, 24.0, 35.0, 20.0, 23.0, 29.0, 36.0, 37.0, 25.0, 31.0, 38.0, 38.0, 39.0, 46.0, 34.0, 45.0, 39.0, 37.0, 28.0, 22.0, 33.0, 40.0, 29.0, 27.0, 22.0, 19.0, 15.0, 14.0, 14.0, 9.0, 3.0, 12.0, 8.0, 11.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-62.82893371582031, -61.046478271484375, -59.2640266418457, -57.481571197509766, -55.69911575317383, -53.916664123535156, -52.13420867919922, -50.35175323486328, -48.569297790527344, -46.786842346191406, -45.004390716552734, -43.2219352722168, -41.43947982788086, -39.65702819824219, -37.87457275390625, -36.09211730957031, -34.30966567993164, -32.5272102355957, -30.7447566986084, -28.962303161621094, -27.179847717285156, -25.39739418029785, -23.614940643310547, -21.83248519897461, -20.050031661987305, -18.267578125, -16.485122680664062, -14.702669143676758, -12.920214653015137, -11.137760162353516, -9.355306625366211, -7.57285213470459, -5.790393829345703, -4.007939338684082, -2.225485324859619, -0.44303131103515625, 1.3394231796264648, 3.121877670288086, 4.904331207275391, 6.686785697937012, 8.469240188598633, 10.251694679260254, 12.034149169921875, 13.81660270690918, 15.5990571975708, 17.381511688232422, 19.163965225219727, 20.94641876220703, 22.72887420654297, 24.511327743530273, 26.29378318786621, 28.076236724853516, 29.858692169189453, 31.641145706176758, 33.42359924316406, 35.2060546875, 36.98851013183594, 38.770965576171875, 40.55341720581055, 42.335872650146484, 44.11832809448242, 45.900779724121094, 47.68323516845703, 49.46569061279297, 51.24814224243164]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 13.0, 22.0, 31.0, 34.0, 80.0, 111.0, 177.0, 265.0, 400.0, 644.0, 1055.0, 1798.0, 2974.0, 5285.0, 9544.0, 16776.0, 29014.0, 48286.0, 75929.0, 107305.0, 135026.0, 147042.0, 139357.0, 114342.0, 82199.0, 53526.0, 32988.0, 19083.0, 10638.0, 6040.0, 3380.0, 2016.0, 1126.0, 741.0, 468.0, 260.0, 184.0, 118.0, 97.0, 62.0, 49.0, 22.0, 13.0, 9.0, 7.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.9375, -68.693359375, -66.44921875, -64.205078125, -61.9609375, -59.716796875, -57.47265625, -55.228515625, -52.984375, -50.740234375, -48.49609375, -46.251953125, -44.0078125, -41.763671875, -39.51953125, -37.275390625, -35.03125, -32.787109375, -30.54296875, -28.298828125, -26.0546875, -23.810546875, -21.56640625, -19.322265625, -17.078125, -14.833984375, -12.58984375, -10.345703125, -8.1015625, -5.857421875, -3.61328125, -1.369140625, 0.875, 3.119140625, 5.36328125, 7.607421875, 9.8515625, 12.095703125, 14.33984375, 16.583984375, 18.828125, 21.072265625, 23.31640625, 25.560546875, 27.8046875, 30.048828125, 32.29296875, 34.537109375, 36.78125, 39.025390625, 41.26953125, 43.513671875, 45.7578125, 48.001953125, 50.24609375, 52.490234375, 54.734375, 56.978515625, 59.22265625, 61.466796875, 63.7109375, 65.955078125, 68.19921875, 70.443359375, 72.6875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 6.0, 11.0, 10.0, 13.0, 12.0, 13.0, 20.0, 20.0, 22.0, 34.0, 22.0, 20.0, 33.0, 39.0, 34.0, 25.0, 36.0, 39.0, 43.0, 37.0, 44.0, 35.0, 47.0, 43.0, 26.0, 31.0, 29.0, 37.0, 36.0, 29.0, 25.0, 18.0, 14.0, 17.0, 15.0, 12.0, 4.0, 10.0, 9.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-63.15625, -61.34814453125, -59.5400390625, -57.73193359375, -55.923828125, -54.11572265625, -52.3076171875, -50.49951171875, -48.69140625, -46.88330078125, -45.0751953125, -43.26708984375, -41.458984375, -39.65087890625, -37.8427734375, -36.03466796875, -34.2265625, -32.41845703125, -30.6103515625, -28.80224609375, -26.994140625, -25.18603515625, -23.3779296875, -21.56982421875, -19.76171875, -17.95361328125, -16.1455078125, -14.33740234375, -12.529296875, -10.72119140625, -8.9130859375, -7.10498046875, -5.296875, -3.48876953125, -1.6806640625, 0.12744140625, 1.935546875, 3.74365234375, 5.5517578125, 7.35986328125, 9.16796875, 10.97607421875, 12.7841796875, 14.59228515625, 16.400390625, 18.20849609375, 20.0166015625, 21.82470703125, 23.6328125, 25.44091796875, 27.2490234375, 29.05712890625, 30.865234375, 32.67333984375, 34.4814453125, 36.28955078125, 38.09765625, 39.90576171875, 41.7138671875, 43.52197265625, 45.330078125, 47.13818359375, 48.9462890625, 50.75439453125, 52.5625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 5.0, 5.0, 24.0, 25.0, 48.0, 56.0, 94.0, 140.0, 191.0, 276.0, 448.0, 636.0, 996.0, 1483.0, 2353.0, 3777.0, 6082.0, 10086.0, 17115.0, 28073.0, 45244.0, 69942.0, 98908.0, 126951.0, 142416.0, 138377.0, 115862.0, 85563.0, 58079.0, 37091.0, 22561.0, 13524.0, 8290.0, 5013.0, 3177.0, 1963.0, 1259.0, 763.0, 566.0, 363.0, 240.0, 158.0, 115.0, 68.0, 58.0, 28.0, 18.0, 12.0, 8.0, 6.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0], "bins": [-79.75, -77.3173828125, -74.884765625, -72.4521484375, -70.01953125, -67.5869140625, -65.154296875, -62.7216796875, -60.2890625, -57.8564453125, -55.423828125, -52.9912109375, -50.55859375, -48.1259765625, -45.693359375, -43.2607421875, -40.828125, -38.3955078125, -35.962890625, -33.5302734375, -31.09765625, -28.6650390625, -26.232421875, -23.7998046875, -21.3671875, -18.9345703125, -16.501953125, -14.0693359375, -11.63671875, -9.2041015625, -6.771484375, -4.3388671875, -1.90625, 0.5263671875, 2.958984375, 5.3916015625, 7.82421875, 10.2568359375, 12.689453125, 15.1220703125, 17.5546875, 19.9873046875, 22.419921875, 24.8525390625, 27.28515625, 29.7177734375, 32.150390625, 34.5830078125, 37.015625, 39.4482421875, 41.880859375, 44.3134765625, 46.74609375, 49.1787109375, 51.611328125, 54.0439453125, 56.4765625, 58.9091796875, 61.341796875, 63.7744140625, 66.20703125, 68.6396484375, 71.072265625, 73.5048828125, 75.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 10.0, 7.0, 14.0, 9.0, 17.0, 14.0, 14.0, 27.0, 32.0, 30.0, 33.0, 37.0, 34.0, 48.0, 46.0, 35.0, 39.0, 51.0, 42.0, 35.0, 46.0, 42.0, 33.0, 33.0, 36.0, 33.0, 21.0, 25.0, 16.0, 21.0, 20.0, 23.0, 10.0, 13.0, 7.0, 13.0, 4.0, 5.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.15625, -34.94482421875, -33.7333984375, -32.52197265625, -31.310546875, -30.09912109375, -28.8876953125, -27.67626953125, -26.46484375, -25.25341796875, -24.0419921875, -22.83056640625, -21.619140625, -20.40771484375, -19.1962890625, -17.98486328125, -16.7734375, -15.56201171875, -14.3505859375, -13.13916015625, -11.927734375, -10.71630859375, -9.5048828125, -8.29345703125, -7.08203125, -5.87060546875, -4.6591796875, -3.44775390625, -2.236328125, -1.02490234375, 0.1865234375, 1.39794921875, 2.609375, 3.82080078125, 5.0322265625, 6.24365234375, 7.455078125, 8.66650390625, 9.8779296875, 11.08935546875, 12.30078125, 13.51220703125, 14.7236328125, 15.93505859375, 17.146484375, 18.35791015625, 19.5693359375, 20.78076171875, 21.9921875, 23.20361328125, 24.4150390625, 25.62646484375, 26.837890625, 28.04931640625, 29.2607421875, 30.47216796875, 31.68359375, 32.89501953125, 34.1064453125, 35.31787109375, 36.529296875, 37.74072265625, 38.9521484375, 40.16357421875, 41.375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 5.0, 6.0, 14.0, 23.0, 24.0, 40.0, 68.0, 90.0, 123.0, 202.0, 323.0, 467.0, 684.0, 1080.0, 1618.0, 2529.0, 3866.0, 6005.0, 9517.0, 14857.0, 23139.0, 35281.0, 52759.0, 74891.0, 99049.0, 119334.0, 128011.0, 121432.0, 104619.0, 80654.0, 57572.0, 39025.0, 25472.0, 16312.0, 10361.0, 6739.0, 4398.0, 2716.0, 1773.0, 1172.0, 785.0, 504.0, 354.0, 219.0, 171.0, 86.0, 70.0, 42.0, 23.0, 27.0, 12.0, 10.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0625, -13.587646484375, -13.11279296875, -12.637939453125, -12.1630859375, -11.688232421875, -11.21337890625, -10.738525390625, -10.263671875, -9.788818359375, -9.31396484375, -8.839111328125, -8.3642578125, -7.889404296875, -7.41455078125, -6.939697265625, -6.46484375, -5.989990234375, -5.51513671875, -5.040283203125, -4.5654296875, -4.090576171875, -3.61572265625, -3.140869140625, -2.666015625, -2.191162109375, -1.71630859375, -1.241455078125, -0.7666015625, -0.291748046875, 0.18310546875, 0.657958984375, 1.1328125, 1.607666015625, 2.08251953125, 2.557373046875, 3.0322265625, 3.507080078125, 3.98193359375, 4.456787109375, 4.931640625, 5.406494140625, 5.88134765625, 6.356201171875, 6.8310546875, 7.305908203125, 7.78076171875, 8.255615234375, 8.73046875, 9.205322265625, 9.68017578125, 10.155029296875, 10.6298828125, 11.104736328125, 11.57958984375, 12.054443359375, 12.529296875, 13.004150390625, 13.47900390625, 13.953857421875, 14.4287109375, 14.903564453125, 15.37841796875, 15.853271484375, 16.328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 3.0, 13.0, 8.0, 14.0, 17.0, 23.0, 30.0, 35.0, 42.0, 53.0, 64.0, 63.0, 71.0, 73.0, 69.0, 69.0, 72.0, 53.0, 49.0, 44.0, 31.0, 23.0, 19.0, 11.0, 19.0, 8.0, 7.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028591156005859375, -0.0027809441089630127, -0.002702772617340088, -0.002624601125717163, -0.0025464296340942383, -0.0024682581424713135, -0.0023900866508483887, -0.002311915159225464, -0.002233743667602539, -0.0021555721759796143, -0.0020774006843566895, -0.0019992291927337646, -0.0019210577011108398, -0.001842886209487915, -0.0017647147178649902, -0.0016865432262420654, -0.0016083717346191406, -0.0015302002429962158, -0.001452028751373291, -0.0013738572597503662, -0.0012956857681274414, -0.0012175142765045166, -0.0011393427848815918, -0.001061171293258667, -0.0009829998016357422, -0.0009048283100128174, -0.0008266568183898926, -0.0007484853267669678, -0.000670313835144043, -0.0005921423435211182, -0.0005139708518981934, -0.00043579936027526855, -0.00035762786865234375, -0.00027945637702941895, -0.00020128488540649414, -0.00012311339378356934, -4.494190216064453e-05, 3.3229589462280273e-05, 0.00011140108108520508, 0.00018957257270812988, 0.0002677440643310547, 0.0003459155559539795, 0.0004240870475769043, 0.0005022585391998291, 0.0005804300308227539, 0.0006586015224456787, 0.0007367730140686035, 0.0008149445056915283, 0.0008931159973144531, 0.0009712874889373779, 0.0010494589805603027, 0.0011276304721832275, 0.0012058019638061523, 0.0012839734554290771, 0.001362144947052002, 0.0014403164386749268, 0.0015184879302978516, 0.0015966594219207764, 0.0016748309135437012, 0.001753002405166626, 0.0018311738967895508, 0.0019093453884124756, 0.0019875168800354004, 0.002065688371658325, 0.00214385986328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 8.0, 9.0, 11.0, 32.0, 32.0, 61.0, 74.0, 99.0, 155.0, 256.0, 351.0, 579.0, 893.0, 1343.0, 2156.0, 3288.0, 5144.0, 8244.0, 12763.0, 19728.0, 29843.0, 44074.0, 61781.0, 82483.0, 102674.0, 116517.0, 119695.0, 110736.0, 93304.0, 73067.0, 53043.0, 36491.0, 24690.0, 16037.0, 10327.0, 6573.0, 4262.0, 2800.0, 1752.0, 1113.0, 721.0, 430.0, 313.0, 214.0, 122.0, 82.0, 65.0, 33.0, 32.0, 26.0, 15.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.828125, -13.3712158203125, -12.914306640625, -12.4573974609375, -12.00048828125, -11.5435791015625, -11.086669921875, -10.6297607421875, -10.1728515625, -9.7159423828125, -9.259033203125, -8.8021240234375, -8.34521484375, -7.8883056640625, -7.431396484375, -6.9744873046875, -6.517578125, -6.0606689453125, -5.603759765625, -5.1468505859375, -4.68994140625, -4.2330322265625, -3.776123046875, -3.3192138671875, -2.8623046875, -2.4053955078125, -1.948486328125, -1.4915771484375, -1.03466796875, -0.5777587890625, -0.120849609375, 0.3360595703125, 0.79296875, 1.2498779296875, 1.706787109375, 2.1636962890625, 2.62060546875, 3.0775146484375, 3.534423828125, 3.9913330078125, 4.4482421875, 4.9051513671875, 5.362060546875, 5.8189697265625, 6.27587890625, 6.7327880859375, 7.189697265625, 7.6466064453125, 8.103515625, 8.5604248046875, 9.017333984375, 9.4742431640625, 9.93115234375, 10.3880615234375, 10.844970703125, 11.3018798828125, 11.7587890625, 12.2156982421875, 12.672607421875, 13.1295166015625, 13.58642578125, 14.0433349609375, 14.500244140625, 14.9571533203125, 15.4140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 0.0, 3.0, 11.0, 11.0, 7.0, 7.0, 15.0, 10.0, 16.0, 27.0, 16.0, 33.0, 33.0, 44.0, 45.0, 28.0, 49.0, 54.0, 56.0, 41.0, 48.0, 55.0, 50.0, 45.0, 44.0, 41.0, 39.0, 30.0, 17.0, 26.0, 22.0, 14.0, 9.0, 11.0, 13.0, 8.0, 10.0, 1.0, 5.0, 2.0, 0.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.34375, -8.1080322265625, -7.872314453125, -7.6365966796875, -7.40087890625, -7.1651611328125, -6.929443359375, -6.6937255859375, -6.4580078125, -6.2222900390625, -5.986572265625, -5.7508544921875, -5.51513671875, -5.2794189453125, -5.043701171875, -4.8079833984375, -4.572265625, -4.3365478515625, -4.100830078125, -3.8651123046875, -3.62939453125, -3.3936767578125, -3.157958984375, -2.9222412109375, -2.6865234375, -2.4508056640625, -2.215087890625, -1.9793701171875, -1.74365234375, -1.5079345703125, -1.272216796875, -1.0364990234375, -0.80078125, -0.5650634765625, -0.329345703125, -0.0936279296875, 0.14208984375, 0.3778076171875, 0.613525390625, 0.8492431640625, 1.0849609375, 1.3206787109375, 1.556396484375, 1.7921142578125, 2.02783203125, 2.2635498046875, 2.499267578125, 2.7349853515625, 2.970703125, 3.2064208984375, 3.442138671875, 3.6778564453125, 3.91357421875, 4.1492919921875, 4.385009765625, 4.6207275390625, 4.8564453125, 5.0921630859375, 5.327880859375, 5.5635986328125, 5.79931640625, 6.0350341796875, 6.270751953125, 6.5064697265625, 6.7421875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 7.0, 7.0, 6.0, 10.0, 12.0, 13.0, 15.0, 14.0, 19.0, 25.0, 26.0, 29.0, 27.0, 35.0, 35.0, 34.0, 45.0, 44.0, 59.0, 38.0, 37.0, 48.0, 39.0, 39.0, 41.0, 33.0, 28.0, 37.0, 34.0, 27.0, 15.0, 20.0, 19.0, 13.0, 15.0, 12.0, 14.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.18128967285156, -63.26628494262695, -61.351280212402344, -59.436275482177734, -57.521270751953125, -55.606266021728516, -53.691261291503906, -51.7762565612793, -49.86125183105469, -47.94624710083008, -46.03124237060547, -44.11623764038086, -42.20123291015625, -40.28622817993164, -38.37122344970703, -36.45621871948242, -34.54121398925781, -32.6262092590332, -30.711204528808594, -28.796199798583984, -26.881195068359375, -24.966190338134766, -23.051185607910156, -21.136180877685547, -19.221176147460938, -17.306171417236328, -15.391166687011719, -13.47616195678711, -11.5611572265625, -9.64615249633789, -7.731147766113281, -5.816143035888672, -3.9011383056640625, -1.9861335754394531, -0.07112884521484375, 1.8438758850097656, 3.758880615234375, 5.673885345458984, 7.588890075683594, 9.503894805908203, 11.418899536132812, 13.333904266357422, 15.248908996582031, 17.16391372680664, 19.07891845703125, 20.99392318725586, 22.90892791748047, 24.823932647705078, 26.738937377929688, 28.653942108154297, 30.568946838378906, 32.483951568603516, 34.398956298828125, 36.313961029052734, 38.228965759277344, 40.14397048950195, 42.05897521972656, 43.97397994995117, 45.88898468017578, 47.80398941040039, 49.718994140625, 51.63399887084961, 53.54900360107422, 55.46400833129883, 57.37901306152344]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 8.0, 5.0, 13.0, 13.0, 14.0, 14.0, 15.0, 18.0, 18.0, 24.0, 24.0, 15.0, 28.0, 25.0, 27.0, 43.0, 40.0, 26.0, 43.0, 38.0, 35.0, 33.0, 44.0, 37.0, 33.0, 30.0, 36.0, 37.0, 27.0, 28.0, 33.0, 20.0, 28.0, 18.0, 16.0, 14.0, 13.0, 11.0, 8.0, 10.0, 7.0, 11.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.16705322265625, -54.35741424560547, -52.54777908325195, -50.73814010620117, -48.92850112915039, -47.118865966796875, -45.309226989746094, -43.49958801269531, -41.68994903564453, -39.88031005859375, -38.070674896240234, -36.26103591918945, -34.45139694213867, -32.641761779785156, -30.832122802734375, -29.022483825683594, -27.212848663330078, -25.40321159362793, -23.59357261657715, -21.783935546875, -19.97429656982422, -18.16465950012207, -16.355022430419922, -14.545384407043457, -12.735746383666992, -10.926108360290527, -9.116470336914062, -7.306833267211914, -5.497195243835449, -3.6875572204589844, -1.877920150756836, -0.0682821273803711, 1.7413597106933594, 3.550997495651245, 5.360635280609131, 7.1702728271484375, 8.979910850524902, 10.789548873901367, 12.599185943603516, 14.40882396697998, 16.218461990356445, 18.028099060058594, 19.837738037109375, 21.647375106811523, 23.457012176513672, 25.266651153564453, 27.0762882232666, 28.88592529296875, 30.69556427001953, 32.50520324707031, 34.31483840942383, 36.12447738647461, 37.93411636352539, 39.743751525878906, 41.55339050292969, 43.36302947998047, 45.17266845703125, 46.98230743408203, 48.79194259643555, 50.60158157348633, 52.41122055053711, 54.220855712890625, 56.030494689941406, 57.84013366699219, 59.6497688293457]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 5.0, 5.0, 8.0, 17.0, 24.0, 38.0, 61.0, 70.0, 136.0, 198.0, 348.0, 498.0, 784.0, 1193.0, 1968.0, 3114.0, 4883.0, 7999.0, 12563.0, 19346.0, 30379.0, 47212.0, 73457.0, 111603.0, 166203.0, 239627.0, 329306.0, 422832.0, 494039.0, 510119.0, 465316.0, 379643.0, 282874.0, 200389.0, 135679.0, 89448.0, 58529.0, 37780.0, 23956.0, 15367.0, 9803.0, 6309.0, 3970.0, 2620.0, 1659.0, 1086.0, 631.0, 419.0, 276.0, 182.0, 121.0, 71.0, 35.0, 31.0, 21.0, 19.0, 12.0, 6.0, 5.0, 4.0, 1.0], "bins": [-56.96875, -55.2021484375, -53.435546875, -51.6689453125, -49.90234375, -48.1357421875, -46.369140625, -44.6025390625, -42.8359375, -41.0693359375, -39.302734375, -37.5361328125, -35.76953125, -34.0029296875, -32.236328125, -30.4697265625, -28.703125, -26.9365234375, -25.169921875, -23.4033203125, -21.63671875, -19.8701171875, -18.103515625, -16.3369140625, -14.5703125, -12.8037109375, -11.037109375, -9.2705078125, -7.50390625, -5.7373046875, -3.970703125, -2.2041015625, -0.4375, 1.3291015625, 3.095703125, 4.8623046875, 6.62890625, 8.3955078125, 10.162109375, 11.9287109375, 13.6953125, 15.4619140625, 17.228515625, 18.9951171875, 20.76171875, 22.5283203125, 24.294921875, 26.0615234375, 27.828125, 29.5947265625, 31.361328125, 33.1279296875, 34.89453125, 36.6611328125, 38.427734375, 40.1943359375, 41.9609375, 43.7275390625, 45.494140625, 47.2607421875, 49.02734375, 50.7939453125, 52.560546875, 54.3271484375, 56.09375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 6.0, 4.0, 10.0, 7.0, 10.0, 12.0, 15.0, 15.0, 17.0, 16.0, 13.0, 31.0, 17.0, 26.0, 23.0, 20.0, 30.0, 40.0, 40.0, 28.0, 38.0, 44.0, 25.0, 36.0, 43.0, 35.0, 35.0, 30.0, 37.0, 35.0, 27.0, 27.0, 29.0, 27.0, 25.0, 21.0, 18.0, 12.0, 12.0, 12.0, 7.0, 10.0, 11.0, 10.0, 6.0, 6.0, 3.0, 6.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-49.03125, -47.46875, -45.90625, -44.34375, -42.78125, -41.21875, -39.65625, -38.09375, -36.53125, -34.96875, -33.40625, -31.84375, -30.28125, -28.71875, -27.15625, -25.59375, -24.03125, -22.46875, -20.90625, -19.34375, -17.78125, -16.21875, -14.65625, -13.09375, -11.53125, -9.96875, -8.40625, -6.84375, -5.28125, -3.71875, -2.15625, -0.59375, 0.96875, 2.53125, 4.09375, 5.65625, 7.21875, 8.78125, 10.34375, 11.90625, 13.46875, 15.03125, 16.59375, 18.15625, 19.71875, 21.28125, 22.84375, 24.40625, 25.96875, 27.53125, 29.09375, 30.65625, 32.21875, 33.78125, 35.34375, 36.90625, 38.46875, 40.03125, 41.59375, 43.15625, 44.71875, 46.28125, 47.84375, 49.40625, 50.96875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 10.0, 9.0, 14.0, 21.0, 30.0, 42.0, 69.0, 120.0, 155.0, 246.0, 378.0, 726.0, 1250.0, 2134.0, 3834.0, 6950.0, 12806.0, 23908.0, 43825.0, 80598.0, 143223.0, 241744.0, 380137.0, 535252.0, 646465.0, 640993.0, 524491.0, 367146.0, 231874.0, 136760.0, 76565.0, 42223.0, 22903.0, 12034.0, 6843.0, 3637.0, 2009.0, 1158.0, 621.0, 378.0, 268.0, 152.0, 87.0, 56.0, 44.0, 31.0, 22.0, 17.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0], "bins": [-74.125, -71.8056640625, -69.486328125, -67.1669921875, -64.84765625, -62.5283203125, -60.208984375, -57.8896484375, -55.5703125, -53.2509765625, -50.931640625, -48.6123046875, -46.29296875, -43.9736328125, -41.654296875, -39.3349609375, -37.015625, -34.6962890625, -32.376953125, -30.0576171875, -27.73828125, -25.4189453125, -23.099609375, -20.7802734375, -18.4609375, -16.1416015625, -13.822265625, -11.5029296875, -9.18359375, -6.8642578125, -4.544921875, -2.2255859375, 0.09375, 2.4130859375, 4.732421875, 7.0517578125, 9.37109375, 11.6904296875, 14.009765625, 16.3291015625, 18.6484375, 20.9677734375, 23.287109375, 25.6064453125, 27.92578125, 30.2451171875, 32.564453125, 34.8837890625, 37.203125, 39.5224609375, 41.841796875, 44.1611328125, 46.48046875, 48.7998046875, 51.119140625, 53.4384765625, 55.7578125, 58.0771484375, 60.396484375, 62.7158203125, 65.03515625, 67.3544921875, 69.673828125, 71.9931640625, 74.3125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 9.0, 8.0, 17.0, 13.0, 32.0, 34.0, 30.0, 48.0, 48.0, 69.0, 83.0, 83.0, 102.0, 106.0, 141.0, 160.0, 180.0, 184.0, 201.0, 223.0, 196.0, 224.0, 235.0, 209.0, 191.0, 180.0, 146.0, 154.0, 130.0, 107.0, 84.0, 81.0, 72.0, 68.0, 51.0, 42.0, 32.0, 23.0, 21.0, 18.0, 9.0, 3.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.265625, -26.41650390625, -25.5673828125, -24.71826171875, -23.869140625, -23.02001953125, -22.1708984375, -21.32177734375, -20.47265625, -19.62353515625, -18.7744140625, -17.92529296875, -17.076171875, -16.22705078125, -15.3779296875, -14.52880859375, -13.6796875, -12.83056640625, -11.9814453125, -11.13232421875, -10.283203125, -9.43408203125, -8.5849609375, -7.73583984375, -6.88671875, -6.03759765625, -5.1884765625, -4.33935546875, -3.490234375, -2.64111328125, -1.7919921875, -0.94287109375, -0.09375, 0.75537109375, 1.6044921875, 2.45361328125, 3.302734375, 4.15185546875, 5.0009765625, 5.85009765625, 6.69921875, 7.54833984375, 8.3974609375, 9.24658203125, 10.095703125, 10.94482421875, 11.7939453125, 12.64306640625, 13.4921875, 14.34130859375, 15.1904296875, 16.03955078125, 16.888671875, 17.73779296875, 18.5869140625, 19.43603515625, 20.28515625, 21.13427734375, 21.9833984375, 22.83251953125, 23.681640625, 24.53076171875, 25.3798828125, 26.22900390625, 27.078125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 5.0, 5.0, 6.0, 8.0, 9.0, 14.0, 13.0, 22.0, 18.0, 23.0, 32.0, 27.0, 35.0, 30.0, 42.0, 47.0, 44.0, 38.0, 49.0, 43.0, 48.0, 37.0, 33.0, 32.0, 46.0, 43.0, 30.0, 44.0, 34.0, 18.0, 20.0, 18.0, 13.0, 17.0, 9.0, 9.0, 5.0, 12.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-66.95327758789062, -64.97203826904297, -62.99079132080078, -61.00954818725586, -59.02830505371094, -57.04706573486328, -55.06582260131836, -53.08457946777344, -51.103336334228516, -49.122093200683594, -47.14085006713867, -45.15960693359375, -43.178367614746094, -41.197120666503906, -39.21588134765625, -37.23463821411133, -35.253395080566406, -33.272151947021484, -31.290908813476562, -29.309667587280273, -27.32842445373535, -25.34718132019043, -23.36594009399414, -21.38469696044922, -19.403453826904297, -17.422210693359375, -15.44096851348877, -13.459726333618164, -11.478483200073242, -9.49724006652832, -7.515997886657715, -5.534755706787109, -3.5535125732421875, -1.5722699165344238, 0.40897274017333984, 2.3902153968811035, 4.371458053588867, 6.352701187133789, 8.333943367004395, 10.315185546875, 12.296428680419922, 14.277671813964844, 16.258914947509766, 18.240156173706055, 20.221399307250977, 22.2026424407959, 24.183883666992188, 26.16512680053711, 28.14636993408203, 30.127613067626953, 32.108856201171875, 34.0900993347168, 36.07134246826172, 38.052581787109375, 40.0338249206543, 42.01506805419922, 43.99631118774414, 45.97755432128906, 47.958797454833984, 49.940040588378906, 51.92127990722656, 53.90252685546875, 55.883766174316406, 57.86500930786133, 59.84625244140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 4.0, 7.0, 6.0, 10.0, 14.0, 12.0, 13.0, 15.0, 17.0, 11.0, 22.0, 29.0, 30.0, 28.0, 35.0, 36.0, 34.0, 43.0, 29.0, 42.0, 45.0, 40.0, 49.0, 46.0, 30.0, 37.0, 36.0, 25.0, 38.0, 31.0, 31.0, 19.0, 22.0, 22.0, 14.0, 17.0, 12.0, 6.0, 9.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.89384078979492, -53.91671371459961, -51.9395866394043, -49.96245574951172, -47.985328674316406, -46.008201599121094, -44.03107452392578, -42.05394744873047, -40.076820373535156, -38.099693298339844, -36.12256622314453, -34.14543914794922, -32.16830825805664, -30.191181182861328, -28.214054107666016, -26.236927032470703, -24.259796142578125, -22.282669067382812, -20.305540084838867, -18.328413009643555, -16.35128402709961, -14.374156951904297, -12.397029876708984, -10.419901847839355, -8.442773818969727, -6.465645790100098, -4.488518238067627, -2.5113906860351562, -0.5342626571655273, 1.4428653717041016, 3.419992446899414, 5.397120475769043, 7.3742523193359375, 9.351380348205566, 11.328508377075195, 13.305635452270508, 15.282763481140137, 17.259891510009766, 19.237018585205078, 21.21414566040039, 23.191274642944336, 25.16840171813965, 27.145530700683594, 29.122657775878906, 31.09978485107422, 33.07691192626953, 35.054039001464844, 37.03116989135742, 39.008296966552734, 40.98542404174805, 42.96255111694336, 44.93968200683594, 46.91680908203125, 48.89393615722656, 50.871063232421875, 52.84819030761719, 54.8253173828125, 56.80244445800781, 58.779571533203125, 60.75669860839844, 62.733829498291016, 64.71095275878906, 66.68807983398438, 68.66521453857422, 70.64234161376953]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 4.0, 2.0, 20.0, 28.0, 31.0, 60.0, 80.0, 117.0, 189.0, 346.0, 494.0, 725.0, 1171.0, 1862.0, 2890.0, 4407.0, 7115.0, 11148.0, 17391.0, 26691.0, 39669.0, 57090.0, 77675.0, 99170.0, 115209.0, 121406.0, 115026.0, 99080.0, 78407.0, 57105.0, 39580.0, 26534.0, 17482.0, 11035.0, 7010.0, 4471.0, 2827.0, 1746.0, 1219.0, 720.0, 460.0, 304.0, 196.0, 116.0, 85.0, 50.0, 41.0, 22.0, 15.0, 8.0, 14.0, 10.0, 8.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.71875, -26.74609375, -25.7734375, -24.80078125, -23.828125, -22.85546875, -21.8828125, -20.91015625, -19.9375, -18.96484375, -17.9921875, -17.01953125, -16.046875, -15.07421875, -14.1015625, -13.12890625, -12.15625, -11.18359375, -10.2109375, -9.23828125, -8.265625, -7.29296875, -6.3203125, -5.34765625, -4.375, -3.40234375, -2.4296875, -1.45703125, -0.484375, 0.48828125, 1.4609375, 2.43359375, 3.40625, 4.37890625, 5.3515625, 6.32421875, 7.296875, 8.26953125, 9.2421875, 10.21484375, 11.1875, 12.16015625, 13.1328125, 14.10546875, 15.078125, 16.05078125, 17.0234375, 17.99609375, 18.96875, 19.94140625, 20.9140625, 21.88671875, 22.859375, 23.83203125, 24.8046875, 25.77734375, 26.75, 27.72265625, 28.6953125, 29.66796875, 30.640625, 31.61328125, 32.5859375, 33.55859375, 34.53125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 8.0, 3.0, 12.0, 13.0, 13.0, 9.0, 17.0, 13.0, 20.0, 19.0, 21.0, 30.0, 34.0, 29.0, 34.0, 42.0, 39.0, 29.0, 40.0, 49.0, 32.0, 44.0, 41.0, 47.0, 36.0, 29.0, 35.0, 32.0, 33.0, 29.0, 24.0, 24.0, 17.0, 18.0, 13.0, 15.0, 10.0, 6.0, 7.0, 13.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.03125, -53.98583984375, -51.9404296875, -49.89501953125, -47.849609375, -45.80419921875, -43.7587890625, -41.71337890625, -39.66796875, -37.62255859375, -35.5771484375, -33.53173828125, -31.486328125, -29.44091796875, -27.3955078125, -25.35009765625, -23.3046875, -21.25927734375, -19.2138671875, -17.16845703125, -15.123046875, -13.07763671875, -11.0322265625, -8.98681640625, -6.94140625, -4.89599609375, -2.8505859375, -0.80517578125, 1.240234375, 3.28564453125, 5.3310546875, 7.37646484375, 9.421875, 11.46728515625, 13.5126953125, 15.55810546875, 17.603515625, 19.64892578125, 21.6943359375, 23.73974609375, 25.78515625, 27.83056640625, 29.8759765625, 31.92138671875, 33.966796875, 36.01220703125, 38.0576171875, 40.10302734375, 42.1484375, 44.19384765625, 46.2392578125, 48.28466796875, 50.330078125, 52.37548828125, 54.4208984375, 56.46630859375, 58.51171875, 60.55712890625, 62.6025390625, 64.64794921875, 66.693359375, 68.73876953125, 70.7841796875, 72.82958984375, 74.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 9.0, 4.0, 3.0, 17.0, 16.0, 27.0, 42.0, 41.0, 55.0, 82.0, 117.0, 139.0, 230.0, 351.0, 422.0, 685.0, 1009.0, 1491.0, 2145.0, 3177.0, 4888.0, 7677.0, 11506.0, 17810.0, 29831.0, 287047.0, 587386.0, 34705.0, 19876.0, 12723.0, 8289.0, 5356.0, 3622.0, 2416.0, 1625.0, 1155.0, 782.0, 561.0, 351.0, 248.0, 172.0, 139.0, 100.0, 67.0, 63.0, 31.0, 28.0, 12.0, 9.0, 8.0, 4.0, 6.0, 4.0, 0.0, 2.0, 3.0], "bins": [-66.5, -64.55029296875, -62.6005859375, -60.65087890625, -58.701171875, -56.75146484375, -54.8017578125, -52.85205078125, -50.90234375, -48.95263671875, -47.0029296875, -45.05322265625, -43.103515625, -41.15380859375, -39.2041015625, -37.25439453125, -35.3046875, -33.35498046875, -31.4052734375, -29.45556640625, -27.505859375, -25.55615234375, -23.6064453125, -21.65673828125, -19.70703125, -17.75732421875, -15.8076171875, -13.85791015625, -11.908203125, -9.95849609375, -8.0087890625, -6.05908203125, -4.109375, -2.15966796875, -0.2099609375, 1.73974609375, 3.689453125, 5.63916015625, 7.5888671875, 9.53857421875, 11.48828125, 13.43798828125, 15.3876953125, 17.33740234375, 19.287109375, 21.23681640625, 23.1865234375, 25.13623046875, 27.0859375, 29.03564453125, 30.9853515625, 32.93505859375, 34.884765625, 36.83447265625, 38.7841796875, 40.73388671875, 42.68359375, 44.63330078125, 46.5830078125, 48.53271484375, 50.482421875, 52.43212890625, 54.3818359375, 56.33154296875, 58.28125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 8.0, 8.0, 6.0, 16.0, 12.0, 12.0, 8.0, 34.0, 29.0, 28.0, 30.0, 35.0, 32.0, 34.0, 45.0, 32.0, 46.0, 48.0, 34.0, 42.0, 43.0, 44.0, 43.0, 44.0, 46.0, 38.0, 33.0, 24.0, 16.0, 20.0, 14.0, 8.0, 15.0, 13.0, 10.0, 13.0, 6.0, 7.0, 9.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.6875, -51.0751953125, -49.462890625, -47.8505859375, -46.23828125, -44.6259765625, -43.013671875, -41.4013671875, -39.7890625, -38.1767578125, -36.564453125, -34.9521484375, -33.33984375, -31.7275390625, -30.115234375, -28.5029296875, -26.890625, -25.2783203125, -23.666015625, -22.0537109375, -20.44140625, -18.8291015625, -17.216796875, -15.6044921875, -13.9921875, -12.3798828125, -10.767578125, -9.1552734375, -7.54296875, -5.9306640625, -4.318359375, -2.7060546875, -1.09375, 0.5185546875, 2.130859375, 3.7431640625, 5.35546875, 6.9677734375, 8.580078125, 10.1923828125, 11.8046875, 13.4169921875, 15.029296875, 16.6416015625, 18.25390625, 19.8662109375, 21.478515625, 23.0908203125, 24.703125, 26.3154296875, 27.927734375, 29.5400390625, 31.15234375, 32.7646484375, 34.376953125, 35.9892578125, 37.6015625, 39.2138671875, 40.826171875, 42.4384765625, 44.05078125, 45.6630859375, 47.275390625, 48.8876953125, 50.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 10.0, 4.0, 6.0, 21.0, 22.0, 29.0, 41.0, 59.0, 82.0, 132.0, 185.0, 287.0, 467.0, 708.0, 1050.0, 1867.0, 3127.0, 5640.0, 10474.0, 20405.0, 51378.0, 804085.0, 94663.0, 24992.0, 12572.0, 6808.0, 3780.0, 2033.0, 1248.0, 847.0, 497.0, 328.0, 217.0, 132.0, 95.0, 82.0, 54.0, 29.0, 29.0, 18.0, 9.0, 10.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.08984375, -5.877197265625, -5.66455078125, -5.451904296875, -5.2392578125, -5.026611328125, -4.81396484375, -4.601318359375, -4.388671875, -4.176025390625, -3.96337890625, -3.750732421875, -3.5380859375, -3.325439453125, -3.11279296875, -2.900146484375, -2.6875, -2.474853515625, -2.26220703125, -2.049560546875, -1.8369140625, -1.624267578125, -1.41162109375, -1.198974609375, -0.986328125, -0.773681640625, -0.56103515625, -0.348388671875, -0.1357421875, 0.076904296875, 0.28955078125, 0.502197265625, 0.71484375, 0.927490234375, 1.14013671875, 1.352783203125, 1.5654296875, 1.778076171875, 1.99072265625, 2.203369140625, 2.416015625, 2.628662109375, 2.84130859375, 3.053955078125, 3.2666015625, 3.479248046875, 3.69189453125, 3.904541015625, 4.1171875, 4.329833984375, 4.54248046875, 4.755126953125, 4.9677734375, 5.180419921875, 5.39306640625, 5.605712890625, 5.818359375, 6.031005859375, 6.24365234375, 6.456298828125, 6.6689453125, 6.881591796875, 7.09423828125, 7.306884765625, 7.51953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 4.0, 12.0, 8.0, 10.0, 16.0, 4.0, 16.0, 22.0, 22.0, 31.0, 31.0, 33.0, 41.0, 55.0, 66.0, 53.0, 54.0, 52.0, 55.0, 61.0, 54.0, 43.0, 34.0, 42.0, 28.0, 30.0, 25.0, 19.0, 15.0, 4.0, 12.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0009131431579589844, -0.0008829161524772644, -0.0008526891469955444, -0.0008224621415138245, -0.0007922351360321045, -0.0007620081305503845, -0.0007317811250686646, -0.0007015541195869446, -0.0006713271141052246, -0.0006411001086235046, -0.0006108731031417847, -0.0005806460976600647, -0.0005504190921783447, -0.0005201920866966248, -0.0004899650812149048, -0.0004597380757331848, -0.00042951107025146484, -0.0003992840647697449, -0.0003690570592880249, -0.00033883005380630493, -0.00030860304832458496, -0.000278376042842865, -0.000248149037361145, -0.00021792203187942505, -0.00018769502639770508, -0.0001574680209159851, -0.00012724101543426514, -9.701400995254517e-05, -6.67870044708252e-05, -3.6559998989105225e-05, -6.332993507385254e-06, 2.3894011974334717e-05, 5.412101745605469e-05, 8.434802293777466e-05, 0.00011457502841949463, 0.0001448020339012146, 0.00017502903938293457, 0.00020525604486465454, 0.0002354830503463745, 0.0002657100558280945, 0.00029593706130981445, 0.0003261640667915344, 0.0003563910722732544, 0.00038661807775497437, 0.00041684508323669434, 0.0004470720887184143, 0.0004772990942001343, 0.0005075260996818542, 0.0005377531051635742, 0.0005679801106452942, 0.0005982071161270142, 0.0006284341216087341, 0.0006586611270904541, 0.0006888881325721741, 0.000719115138053894, 0.000749342143535614, 0.000779569149017334, 0.000809796154499054, 0.0008400231599807739, 0.0008702501654624939, 0.0009004771709442139, 0.0009307041764259338, 0.0009609311819076538, 0.0009911581873893738, 0.0010213851928710938]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 9.0, 9.0, 20.0, 24.0, 36.0, 40.0, 66.0, 108.0, 154.0, 211.0, 303.0, 480.0, 743.0, 1007.0, 1552.0, 2364.0, 3465.0, 5076.0, 7742.0, 11775.0, 17454.0, 26043.0, 37878.0, 52949.0, 71034.0, 90389.0, 105971.0, 114173.0, 111468.0, 99676.0, 81631.0, 62521.0, 45205.0, 31775.0, 21804.0, 14410.0, 9751.0, 6430.0, 4269.0, 2806.0, 1830.0, 1235.0, 880.0, 577.0, 396.0, 265.0, 198.0, 111.0, 96.0, 61.0, 41.0, 27.0, 10.0, 6.0, 9.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.09375, -2.023406982421875, -1.95306396484375, -1.882720947265625, -1.8123779296875, -1.742034912109375, -1.67169189453125, -1.601348876953125, -1.531005859375, -1.460662841796875, -1.39031982421875, -1.319976806640625, -1.2496337890625, -1.179290771484375, -1.10894775390625, -1.038604736328125, -0.96826171875, -0.897918701171875, -0.82757568359375, -0.757232666015625, -0.6868896484375, -0.616546630859375, -0.54620361328125, -0.475860595703125, -0.405517578125, -0.335174560546875, -0.26483154296875, -0.194488525390625, -0.1241455078125, -0.053802490234375, 0.01654052734375, 0.086883544921875, 0.1572265625, 0.227569580078125, 0.29791259765625, 0.368255615234375, 0.4385986328125, 0.508941650390625, 0.57928466796875, 0.649627685546875, 0.719970703125, 0.790313720703125, 0.86065673828125, 0.930999755859375, 1.0013427734375, 1.071685791015625, 1.14202880859375, 1.212371826171875, 1.28271484375, 1.353057861328125, 1.42340087890625, 1.493743896484375, 1.5640869140625, 1.634429931640625, 1.70477294921875, 1.775115966796875, 1.845458984375, 1.915802001953125, 1.98614501953125, 2.056488037109375, 2.1268310546875, 2.197174072265625, 2.26751708984375, 2.337860107421875, 2.408203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 3.0, 5.0, 3.0, 11.0, 12.0, 22.0, 21.0, 11.0, 35.0, 39.0, 44.0, 36.0, 43.0, 52.0, 48.0, 56.0, 66.0, 47.0, 52.0, 62.0, 43.0, 39.0, 44.0, 34.0, 35.0, 21.0, 27.0, 16.0, 11.0, 14.0, 6.0, 9.0, 6.0, 5.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.353515625, -1.3142852783203125, -1.275054931640625, -1.2358245849609375, -1.19659423828125, -1.1573638916015625, -1.118133544921875, -1.0789031982421875, -1.0396728515625, -1.0004425048828125, -0.961212158203125, -0.9219818115234375, -0.88275146484375, -0.8435211181640625, -0.804290771484375, -0.7650604248046875, -0.725830078125, -0.6865997314453125, -0.647369384765625, -0.6081390380859375, -0.56890869140625, -0.5296783447265625, -0.490447998046875, -0.4512176513671875, -0.4119873046875, -0.3727569580078125, -0.333526611328125, -0.2942962646484375, -0.25506591796875, -0.2158355712890625, -0.176605224609375, -0.1373748779296875, -0.09814453125, -0.0589141845703125, -0.019683837890625, 0.0195465087890625, 0.05877685546875, 0.0980072021484375, 0.137237548828125, 0.1764678955078125, 0.2156982421875, 0.2549285888671875, 0.294158935546875, 0.3333892822265625, 0.37261962890625, 0.4118499755859375, 0.451080322265625, 0.4903106689453125, 0.529541015625, 0.5687713623046875, 0.608001708984375, 0.6472320556640625, 0.68646240234375, 0.7256927490234375, 0.764923095703125, 0.8041534423828125, 0.8433837890625, 0.8826141357421875, 0.921844482421875, 0.9610748291015625, 1.00030517578125, 1.0395355224609375, 1.078765869140625, 1.1179962158203125, 1.1572265625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 10.0, 11.0, 11.0, 12.0, 17.0, 18.0, 24.0, 35.0, 32.0, 32.0, 41.0, 44.0, 48.0, 48.0, 51.0, 44.0, 46.0, 50.0, 33.0, 36.0, 38.0, 42.0, 38.0, 39.0, 31.0, 23.0, 22.0, 26.0, 11.0, 10.0, 11.0, 10.0, 10.0, 8.0, 5.0, 4.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-75.80357360839844, -73.64806365966797, -71.4925537109375, -69.33704376220703, -67.18153381347656, -65.0260238647461, -62.87051773071289, -60.71500778198242, -58.55949783325195, -56.403987884521484, -54.248477935791016, -52.09296798706055, -49.937461853027344, -47.781951904296875, -45.626441955566406, -43.47093200683594, -41.31542205810547, -39.159912109375, -37.00440216064453, -34.84889221191406, -32.693382263183594, -30.537874221801758, -28.382366180419922, -26.226856231689453, -24.071346282958984, -21.915836334228516, -19.760326385498047, -17.60481834411621, -15.449308395385742, -13.293798446655273, -11.138289451599121, -8.982780456542969, -6.827274322509766, -4.671764850616455, -2.5162553787231445, -0.360745906829834, 1.7947635650634766, 3.9502735137939453, 6.105782508850098, 8.26129150390625, 10.416801452636719, 12.572311401367188, 14.72782039642334, 16.883329391479492, 19.03883934020996, 21.19434928894043, 23.349857330322266, 25.505367279052734, 27.660877227783203, 29.816387176513672, 31.97189712524414, 34.12740707397461, 36.28291320800781, 38.43842315673828, 40.59393310546875, 42.74944305419922, 44.90495300292969, 47.060462951660156, 49.215972900390625, 51.371482849121094, 53.52699279785156, 55.68250274658203, 57.838008880615234, 59.9935188293457, 62.14902877807617]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 7.0, 6.0, 7.0, 13.0, 14.0, 10.0, 13.0, 16.0, 19.0, 20.0, 22.0, 26.0, 32.0, 31.0, 38.0, 37.0, 39.0, 37.0, 30.0, 49.0, 40.0, 45.0, 41.0, 43.0, 36.0, 33.0, 36.0, 27.0, 37.0, 30.0, 24.0, 20.0, 18.0, 22.0, 11.0, 16.0, 15.0, 2.0, 9.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.99536895751953, -54.92876434326172, -52.862159729003906, -50.795555114746094, -48.72895050048828, -46.66234588623047, -44.595741271972656, -42.529136657714844, -40.46253204345703, -38.39592742919922, -36.329322814941406, -34.262718200683594, -32.19611358642578, -30.12950897216797, -28.062902450561523, -25.99629783630371, -23.929691314697266, -21.863086700439453, -19.79648208618164, -17.729877471923828, -15.6632719039917, -13.596667289733887, -11.530061721801758, -9.463457107543945, -7.396852493286133, -5.33024787902832, -3.2636427879333496, -1.197037696838379, 0.8695669174194336, 2.936171531677246, 5.002777099609375, 7.0693817138671875, 9.135986328125, 11.202590942382812, 13.269195556640625, 15.335801124572754, 17.40240478515625, 19.469009399414062, 21.535615921020508, 23.60222053527832, 25.668825149536133, 27.735429763793945, 29.802034378051758, 31.868640899658203, 33.935245513916016, 36.00185012817383, 38.06845474243164, 40.13505935668945, 42.201663970947266, 44.26826858520508, 46.33487319946289, 48.4014778137207, 50.468082427978516, 52.53468704223633, 54.601295471191406, 56.66790008544922, 58.73450469970703, 60.801109313964844, 62.867713928222656, 64.93431854248047, 67.00092315673828, 69.0675277709961, 71.1341323852539, 73.20073699951172, 75.26734161376953]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 9.0, 14.0, 21.0, 14.0, 30.0, 44.0, 57.0, 98.0, 128.0, 182.0, 293.0, 411.0, 679.0, 972.0, 1577.0, 2398.0, 3848.0, 6403.0, 10704.0, 17835.0, 29680.0, 47745.0, 73195.0, 102486.0, 129782.0, 142976.0, 136751.0, 113332.0, 82471.0, 55658.0, 34748.0, 21023.0, 12751.0, 7532.0, 4548.0, 2908.0, 1751.0, 1160.0, 759.0, 483.0, 350.0, 241.0, 148.0, 108.0, 77.0, 60.0, 37.0, 26.0, 18.0, 12.0, 10.0, 4.0, 8.0, 4.0, 3.0, 0.0, 1.0], "bins": [-68.6875, -66.5849609375, -64.482421875, -62.3798828125, -60.27734375, -58.1748046875, -56.072265625, -53.9697265625, -51.8671875, -49.7646484375, -47.662109375, -45.5595703125, -43.45703125, -41.3544921875, -39.251953125, -37.1494140625, -35.046875, -32.9443359375, -30.841796875, -28.7392578125, -26.63671875, -24.5341796875, -22.431640625, -20.3291015625, -18.2265625, -16.1240234375, -14.021484375, -11.9189453125, -9.81640625, -7.7138671875, -5.611328125, -3.5087890625, -1.40625, 0.6962890625, 2.798828125, 4.9013671875, 7.00390625, 9.1064453125, 11.208984375, 13.3115234375, 15.4140625, 17.5166015625, 19.619140625, 21.7216796875, 23.82421875, 25.9267578125, 28.029296875, 30.1318359375, 32.234375, 34.3369140625, 36.439453125, 38.5419921875, 40.64453125, 42.7470703125, 44.849609375, 46.9521484375, 49.0546875, 51.1572265625, 53.259765625, 55.3623046875, 57.46484375, 59.5673828125, 61.669921875, 63.7724609375, 65.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 7.0, 0.0, 5.0, 5.0, 4.0, 8.0, 5.0, 8.0, 14.0, 16.0, 15.0, 14.0, 11.0, 22.0, 23.0, 23.0, 24.0, 31.0, 37.0, 38.0, 37.0, 34.0, 42.0, 35.0, 52.0, 35.0, 47.0, 43.0, 35.0, 38.0, 30.0, 34.0, 31.0, 34.0, 27.0, 18.0, 25.0, 18.0, 19.0, 12.0, 8.0, 12.0, 7.0, 8.0, 12.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.625, -52.7490234375, -50.873046875, -48.9970703125, -47.12109375, -45.2451171875, -43.369140625, -41.4931640625, -39.6171875, -37.7412109375, -35.865234375, -33.9892578125, -32.11328125, -30.2373046875, -28.361328125, -26.4853515625, -24.609375, -22.7333984375, -20.857421875, -18.9814453125, -17.10546875, -15.2294921875, -13.353515625, -11.4775390625, -9.6015625, -7.7255859375, -5.849609375, -3.9736328125, -2.09765625, -0.2216796875, 1.654296875, 3.5302734375, 5.40625, 7.2822265625, 9.158203125, 11.0341796875, 12.91015625, 14.7861328125, 16.662109375, 18.5380859375, 20.4140625, 22.2900390625, 24.166015625, 26.0419921875, 27.91796875, 29.7939453125, 31.669921875, 33.5458984375, 35.421875, 37.2978515625, 39.173828125, 41.0498046875, 42.92578125, 44.8017578125, 46.677734375, 48.5537109375, 50.4296875, 52.3056640625, 54.181640625, 56.0576171875, 57.93359375, 59.8095703125, 61.685546875, 63.5615234375, 65.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 12.0, 19.0, 24.0, 56.0, 81.0, 115.0, 156.0, 259.0, 389.0, 579.0, 859.0, 1403.0, 2429.0, 3838.0, 6484.0, 11297.0, 20446.0, 35294.0, 60573.0, 95516.0, 135745.0, 163314.0, 160509.0, 129149.0, 88265.0, 55305.0, 32340.0, 18194.0, 10479.0, 6011.0, 3540.0, 2165.0, 1318.0, 820.0, 558.0, 322.0, 214.0, 150.0, 109.0, 67.0, 44.0, 30.0, 27.0, 17.0, 7.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-82.625, -79.9521484375, -77.279296875, -74.6064453125, -71.93359375, -69.2607421875, -66.587890625, -63.9150390625, -61.2421875, -58.5693359375, -55.896484375, -53.2236328125, -50.55078125, -47.8779296875, -45.205078125, -42.5322265625, -39.859375, -37.1865234375, -34.513671875, -31.8408203125, -29.16796875, -26.4951171875, -23.822265625, -21.1494140625, -18.4765625, -15.8037109375, -13.130859375, -10.4580078125, -7.78515625, -5.1123046875, -2.439453125, 0.2333984375, 2.90625, 5.5791015625, 8.251953125, 10.9248046875, 13.59765625, 16.2705078125, 18.943359375, 21.6162109375, 24.2890625, 26.9619140625, 29.634765625, 32.3076171875, 34.98046875, 37.6533203125, 40.326171875, 42.9990234375, 45.671875, 48.3447265625, 51.017578125, 53.6904296875, 56.36328125, 59.0361328125, 61.708984375, 64.3818359375, 67.0546875, 69.7275390625, 72.400390625, 75.0732421875, 77.74609375, 80.4189453125, 83.091796875, 85.7646484375, 88.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 9.0, 6.0, 12.0, 15.0, 17.0, 18.0, 14.0, 21.0, 37.0, 27.0, 36.0, 32.0, 41.0, 49.0, 53.0, 45.0, 42.0, 45.0, 40.0, 46.0, 52.0, 44.0, 36.0, 44.0, 31.0, 32.0, 23.0, 17.0, 24.0, 18.0, 8.0, 12.0, 14.0, 16.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-43.5625, -42.216796875, -40.87109375, -39.525390625, -38.1796875, -36.833984375, -35.48828125, -34.142578125, -32.796875, -31.451171875, -30.10546875, -28.759765625, -27.4140625, -26.068359375, -24.72265625, -23.376953125, -22.03125, -20.685546875, -19.33984375, -17.994140625, -16.6484375, -15.302734375, -13.95703125, -12.611328125, -11.265625, -9.919921875, -8.57421875, -7.228515625, -5.8828125, -4.537109375, -3.19140625, -1.845703125, -0.5, 0.845703125, 2.19140625, 3.537109375, 4.8828125, 6.228515625, 7.57421875, 8.919921875, 10.265625, 11.611328125, 12.95703125, 14.302734375, 15.6484375, 16.994140625, 18.33984375, 19.685546875, 21.03125, 22.376953125, 23.72265625, 25.068359375, 26.4140625, 27.759765625, 29.10546875, 30.451171875, 31.796875, 33.142578125, 34.48828125, 35.833984375, 37.1796875, 38.525390625, 39.87109375, 41.216796875, 42.5625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 10.0, 15.0, 20.0, 25.0, 35.0, 60.0, 90.0, 155.0, 266.0, 440.0, 766.0, 1254.0, 2036.0, 3736.0, 6529.0, 11717.0, 20416.0, 34799.0, 57247.0, 87455.0, 120736.0, 146029.0, 150679.0, 132084.0, 101420.0, 68222.0, 42752.0, 25298.0, 14590.0, 8432.0, 4807.0, 2667.0, 1525.0, 890.0, 541.0, 312.0, 169.0, 124.0, 69.0, 54.0, 32.0, 21.0, 12.0, 10.0, 5.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.90625, -18.30029296875, -17.6943359375, -17.08837890625, -16.482421875, -15.87646484375, -15.2705078125, -14.66455078125, -14.05859375, -13.45263671875, -12.8466796875, -12.24072265625, -11.634765625, -11.02880859375, -10.4228515625, -9.81689453125, -9.2109375, -8.60498046875, -7.9990234375, -7.39306640625, -6.787109375, -6.18115234375, -5.5751953125, -4.96923828125, -4.36328125, -3.75732421875, -3.1513671875, -2.54541015625, -1.939453125, -1.33349609375, -0.7275390625, -0.12158203125, 0.484375, 1.09033203125, 1.6962890625, 2.30224609375, 2.908203125, 3.51416015625, 4.1201171875, 4.72607421875, 5.33203125, 5.93798828125, 6.5439453125, 7.14990234375, 7.755859375, 8.36181640625, 8.9677734375, 9.57373046875, 10.1796875, 10.78564453125, 11.3916015625, 11.99755859375, 12.603515625, 13.20947265625, 13.8154296875, 14.42138671875, 15.02734375, 15.63330078125, 16.2392578125, 16.84521484375, 17.451171875, 18.05712890625, 18.6630859375, 19.26904296875, 19.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 7.0, 7.0, 10.0, 11.0, 28.0, 20.0, 25.0, 32.0, 34.0, 37.0, 42.0, 49.0, 51.0, 51.0, 42.0, 63.0, 51.0, 45.0, 55.0, 41.0, 35.0, 35.0, 34.0, 34.0, 26.0, 29.0, 11.0, 21.0, 12.0, 14.0, 8.0, 11.0, 4.0, 4.0, 5.0, 2.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019254684448242188, -0.0018616467714309692, -0.0017978250980377197, -0.0017340034246444702, -0.0016701817512512207, -0.0016063600778579712, -0.0015425384044647217, -0.0014787167310714722, -0.0014148950576782227, -0.0013510733842849731, -0.0012872517108917236, -0.0012234300374984741, -0.0011596083641052246, -0.001095786690711975, -0.0010319650173187256, -0.0009681433439254761, -0.0009043216705322266, -0.000840499997138977, -0.0007766783237457275, -0.000712856650352478, -0.0006490349769592285, -0.000585213303565979, -0.0005213916301727295, -0.00045756995677948, -0.00039374828338623047, -0.00032992660999298096, -0.00026610493659973145, -0.00020228326320648193, -0.00013846158981323242, -7.463991641998291e-05, -1.0818243026733398e-05, 5.300343036651611e-05, 0.00011682510375976562, 0.00018064677715301514, 0.00024446845054626465, 0.00030829012393951416, 0.00037211179733276367, 0.0004359334707260132, 0.0004997551441192627, 0.0005635768175125122, 0.0006273984909057617, 0.0006912201642990112, 0.0007550418376922607, 0.0008188635110855103, 0.0008826851844787598, 0.0009465068578720093, 0.0010103285312652588, 0.0010741502046585083, 0.0011379718780517578, 0.0012017935514450073, 0.0012656152248382568, 0.0013294368982315063, 0.0013932585716247559, 0.0014570802450180054, 0.0015209019184112549, 0.0015847235918045044, 0.001648545265197754, 0.0017123669385910034, 0.001776188611984253, 0.0018400102853775024, 0.001903831958770752, 0.0019676536321640015, 0.002031475305557251, 0.0020952969789505005, 0.00215911865234375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 18.0, 34.0, 37.0, 41.0, 90.0, 118.0, 176.0, 264.0, 391.0, 599.0, 844.0, 1382.0, 1991.0, 3005.0, 4867.0, 7403.0, 11499.0, 17803.0, 27030.0, 40146.0, 57317.0, 79016.0, 100157.0, 116513.0, 122690.0, 114808.0, 97569.0, 76024.0, 54754.0, 37952.0, 25858.0, 16797.0, 11065.0, 7125.0, 4483.0, 2996.0, 1931.0, 1288.0, 836.0, 507.0, 380.0, 224.0, 165.0, 105.0, 76.0, 49.0, 39.0, 25.0, 17.0, 13.0, 9.0, 6.0, 3.0, 9.0, 3.0, 1.0], "bins": [-16.25, -15.7490234375, -15.248046875, -14.7470703125, -14.24609375, -13.7451171875, -13.244140625, -12.7431640625, -12.2421875, -11.7412109375, -11.240234375, -10.7392578125, -10.23828125, -9.7373046875, -9.236328125, -8.7353515625, -8.234375, -7.7333984375, -7.232421875, -6.7314453125, -6.23046875, -5.7294921875, -5.228515625, -4.7275390625, -4.2265625, -3.7255859375, -3.224609375, -2.7236328125, -2.22265625, -1.7216796875, -1.220703125, -0.7197265625, -0.21875, 0.2822265625, 0.783203125, 1.2841796875, 1.78515625, 2.2861328125, 2.787109375, 3.2880859375, 3.7890625, 4.2900390625, 4.791015625, 5.2919921875, 5.79296875, 6.2939453125, 6.794921875, 7.2958984375, 7.796875, 8.2978515625, 8.798828125, 9.2998046875, 9.80078125, 10.3017578125, 10.802734375, 11.3037109375, 11.8046875, 12.3056640625, 12.806640625, 13.3076171875, 13.80859375, 14.3095703125, 14.810546875, 15.3115234375, 15.8125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 3.0, 10.0, 16.0, 15.0, 24.0, 16.0, 25.0, 20.0, 39.0, 42.0, 41.0, 41.0, 45.0, 60.0, 58.0, 48.0, 66.0, 53.0, 46.0, 36.0, 31.0, 38.0, 38.0, 38.0, 22.0, 24.0, 13.0, 16.0, 16.0, 6.0, 6.0, 9.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.24609375, -7.018798828125, -6.79150390625, -6.564208984375, -6.3369140625, -6.109619140625, -5.88232421875, -5.655029296875, -5.427734375, -5.200439453125, -4.97314453125, -4.745849609375, -4.5185546875, -4.291259765625, -4.06396484375, -3.836669921875, -3.609375, -3.382080078125, -3.15478515625, -2.927490234375, -2.7001953125, -2.472900390625, -2.24560546875, -2.018310546875, -1.791015625, -1.563720703125, -1.33642578125, -1.109130859375, -0.8818359375, -0.654541015625, -0.42724609375, -0.199951171875, 0.02734375, 0.254638671875, 0.48193359375, 0.709228515625, 0.9365234375, 1.163818359375, 1.39111328125, 1.618408203125, 1.845703125, 2.072998046875, 2.30029296875, 2.527587890625, 2.7548828125, 2.982177734375, 3.20947265625, 3.436767578125, 3.6640625, 3.891357421875, 4.11865234375, 4.345947265625, 4.5732421875, 4.800537109375, 5.02783203125, 5.255126953125, 5.482421875, 5.709716796875, 5.93701171875, 6.164306640625, 6.3916015625, 6.618896484375, 6.84619140625, 7.073486328125, 7.30078125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 5.0, 13.0, 9.0, 9.0, 12.0, 12.0, 18.0, 20.0, 29.0, 33.0, 32.0, 41.0, 37.0, 45.0, 36.0, 39.0, 42.0, 33.0, 48.0, 44.0, 35.0, 45.0, 39.0, 42.0, 30.0, 36.0, 26.0, 31.0, 16.0, 22.0, 20.0, 18.0, 12.0, 12.0, 6.0, 14.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-62.189083099365234, -60.27553939819336, -58.361995697021484, -56.44845199584961, -54.534908294677734, -52.621360778808594, -50.70781707763672, -48.794273376464844, -46.88072967529297, -44.967185974121094, -43.05364227294922, -41.140098571777344, -39.22655487060547, -37.313011169433594, -35.39946746826172, -33.48591995239258, -31.572378158569336, -29.65883445739746, -27.745290756225586, -25.831745147705078, -23.918201446533203, -22.004657745361328, -20.091114044189453, -18.177570343017578, -16.264026641845703, -14.350482940673828, -12.436938285827637, -10.523394584655762, -8.60984992980957, -6.696306228637695, -4.78276252746582, -2.869217872619629, -0.9556732177734375, 0.9578708410263062, 2.87141489982605, 4.784958839416504, 6.698503017425537, 8.61204719543457, 10.525590896606445, 12.439135551452637, 14.352679252624512, 16.266223907470703, 18.179767608642578, 20.093311309814453, 22.006855010986328, 23.920398712158203, 25.833942413330078, 27.747488021850586, 29.66103172302246, 31.574575424194336, 33.488121032714844, 35.40166473388672, 37.315208435058594, 39.22875213623047, 41.142295837402344, 43.05583953857422, 44.969383239746094, 46.88292694091797, 48.796470642089844, 50.71001434326172, 52.623558044433594, 54.53710174560547, 56.450645446777344, 58.364192962646484, 60.27773666381836]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 6.0, 5.0, 9.0, 12.0, 14.0, 12.0, 28.0, 14.0, 15.0, 17.0, 21.0, 32.0, 37.0, 31.0, 25.0, 33.0, 27.0, 35.0, 42.0, 37.0, 33.0, 38.0, 43.0, 35.0, 47.0, 33.0, 27.0, 25.0, 30.0, 26.0, 33.0, 33.0, 23.0, 12.0, 18.0, 16.0, 7.0, 13.0, 8.0, 12.0, 7.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.026329040527344, -50.16587829589844, -48.30542755126953, -46.444976806640625, -44.584529876708984, -42.72407913208008, -40.86362838745117, -39.003177642822266, -37.142730712890625, -35.28227996826172, -33.42182922363281, -31.56138038635254, -29.700931549072266, -27.84048080444336, -25.980030059814453, -24.119579315185547, -22.25912857055664, -20.398677825927734, -18.53822898864746, -16.677778244018555, -14.817328453063965, -12.956878662109375, -11.096427917480469, -9.235978126525879, -7.375528335571289, -5.515078544616699, -3.654628276824951, -1.7941780090332031, 0.06627178192138672, 1.9267215728759766, 3.787172317504883, 5.647622108459473, 7.5080718994140625, 9.368521690368652, 11.228971481323242, 13.089422225952148, 14.949872016906738, 16.810321807861328, 18.670772552490234, 20.53122329711914, 22.391672134399414, 24.25212287902832, 26.112571716308594, 27.9730224609375, 29.833473205566406, 31.69392204284668, 33.55437469482422, 35.41482162475586, 37.275272369384766, 39.13572311401367, 40.99617385864258, 42.85662078857422, 44.717071533203125, 46.57752227783203, 48.43797302246094, 50.298423767089844, 52.15887451171875, 54.019325256347656, 55.87977600097656, 57.74022674560547, 59.60067367553711, 61.461124420166016, 63.32157516479492, 65.18202209472656, 67.04247283935547]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 5.0, 11.0, 18.0, 28.0, 42.0, 76.0, 121.0, 200.0, 316.0, 589.0, 952.0, 1492.0, 2526.0, 4350.0, 7005.0, 11884.0, 19751.0, 32830.0, 53605.0, 87683.0, 139074.0, 214626.0, 316454.0, 430625.0, 526383.0, 562820.0, 518340.0, 417305.0, 301483.0, 203956.0, 130892.0, 81386.0, 49896.0, 30420.0, 18512.0, 11151.0, 6719.0, 4072.0, 2501.0, 1595.0, 911.0, 659.0, 373.0, 229.0, 146.0, 86.0, 72.0, 44.0, 24.0, 14.0, 12.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0], "bins": [-58.125, -56.3330078125, -54.541015625, -52.7490234375, -50.95703125, -49.1650390625, -47.373046875, -45.5810546875, -43.7890625, -41.9970703125, -40.205078125, -38.4130859375, -36.62109375, -34.8291015625, -33.037109375, -31.2451171875, -29.453125, -27.6611328125, -25.869140625, -24.0771484375, -22.28515625, -20.4931640625, -18.701171875, -16.9091796875, -15.1171875, -13.3251953125, -11.533203125, -9.7412109375, -7.94921875, -6.1572265625, -4.365234375, -2.5732421875, -0.78125, 1.0107421875, 2.802734375, 4.5947265625, 6.38671875, 8.1787109375, 9.970703125, 11.7626953125, 13.5546875, 15.3466796875, 17.138671875, 18.9306640625, 20.72265625, 22.5146484375, 24.306640625, 26.0986328125, 27.890625, 29.6826171875, 31.474609375, 33.2666015625, 35.05859375, 36.8505859375, 38.642578125, 40.4345703125, 42.2265625, 44.0185546875, 45.810546875, 47.6025390625, 49.39453125, 51.1865234375, 52.978515625, 54.7705078125, 56.5625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 7.0, 7.0, 7.0, 11.0, 15.0, 13.0, 18.0, 19.0, 16.0, 21.0, 30.0, 24.0, 34.0, 34.0, 34.0, 26.0, 30.0, 31.0, 46.0, 47.0, 45.0, 35.0, 45.0, 31.0, 36.0, 35.0, 23.0, 25.0, 38.0, 36.0, 23.0, 23.0, 22.0, 15.0, 12.0, 16.0, 12.0, 9.0, 7.0, 11.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.78125, -43.15576171875, -41.5302734375, -39.90478515625, -38.279296875, -36.65380859375, -35.0283203125, -33.40283203125, -31.77734375, -30.15185546875, -28.5263671875, -26.90087890625, -25.275390625, -23.64990234375, -22.0244140625, -20.39892578125, -18.7734375, -17.14794921875, -15.5224609375, -13.89697265625, -12.271484375, -10.64599609375, -9.0205078125, -7.39501953125, -5.76953125, -4.14404296875, -2.5185546875, -0.89306640625, 0.732421875, 2.35791015625, 3.9833984375, 5.60888671875, 7.234375, 8.85986328125, 10.4853515625, 12.11083984375, 13.736328125, 15.36181640625, 16.9873046875, 18.61279296875, 20.23828125, 21.86376953125, 23.4892578125, 25.11474609375, 26.740234375, 28.36572265625, 29.9912109375, 31.61669921875, 33.2421875, 34.86767578125, 36.4931640625, 38.11865234375, 39.744140625, 41.36962890625, 42.9951171875, 44.62060546875, 46.24609375, 47.87158203125, 49.4970703125, 51.12255859375, 52.748046875, 54.37353515625, 55.9990234375, 57.62451171875, 59.25]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 11.0, 33.0, 44.0, 100.0, 147.0, 256.0, 409.0, 626.0, 1168.0, 1943.0, 3359.0, 5957.0, 10396.0, 17840.0, 31373.0, 53585.0, 89492.0, 143184.0, 221088.0, 322262.0, 431006.0, 518071.0, 550668.0, 510450.0, 418899.0, 309558.0, 212385.0, 136791.0, 83564.0, 50257.0, 29121.0, 16935.0, 9979.0, 5594.0, 3229.0, 1856.0, 1100.0, 592.0, 392.0, 238.0, 120.0, 72.0, 44.0, 22.0, 13.0, 13.0, 8.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-63.75, -61.84375, -59.9375, -58.03125, -56.125, -54.21875, -52.3125, -50.40625, -48.5, -46.59375, -44.6875, -42.78125, -40.875, -38.96875, -37.0625, -35.15625, -33.25, -31.34375, -29.4375, -27.53125, -25.625, -23.71875, -21.8125, -19.90625, -18.0, -16.09375, -14.1875, -12.28125, -10.375, -8.46875, -6.5625, -4.65625, -2.75, -0.84375, 1.0625, 2.96875, 4.875, 6.78125, 8.6875, 10.59375, 12.5, 14.40625, 16.3125, 18.21875, 20.125, 22.03125, 23.9375, 25.84375, 27.75, 29.65625, 31.5625, 33.46875, 35.375, 37.28125, 39.1875, 41.09375, 43.0, 44.90625, 46.8125, 48.71875, 50.625, 52.53125, 54.4375, 56.34375, 58.25]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 3.0, 5.0, 7.0, 7.0, 10.0, 10.0, 24.0, 27.0, 23.0, 42.0, 56.0, 82.0, 86.0, 119.0, 119.0, 140.0, 180.0, 174.0, 202.0, 220.0, 207.0, 214.0, 250.0, 230.0, 255.0, 214.0, 206.0, 167.0, 140.0, 129.0, 106.0, 94.0, 61.0, 64.0, 53.0, 41.0, 32.0, 21.0, 12.0, 19.0, 9.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.640625, -26.752197265625, -25.86376953125, -24.975341796875, -24.0869140625, -23.198486328125, -22.31005859375, -21.421630859375, -20.533203125, -19.644775390625, -18.75634765625, -17.867919921875, -16.9794921875, -16.091064453125, -15.20263671875, -14.314208984375, -13.42578125, -12.537353515625, -11.64892578125, -10.760498046875, -9.8720703125, -8.983642578125, -8.09521484375, -7.206787109375, -6.318359375, -5.429931640625, -4.54150390625, -3.653076171875, -2.7646484375, -1.876220703125, -0.98779296875, -0.099365234375, 0.7890625, 1.677490234375, 2.56591796875, 3.454345703125, 4.3427734375, 5.231201171875, 6.11962890625, 7.008056640625, 7.896484375, 8.784912109375, 9.67333984375, 10.561767578125, 11.4501953125, 12.338623046875, 13.22705078125, 14.115478515625, 15.00390625, 15.892333984375, 16.78076171875, 17.669189453125, 18.5576171875, 19.446044921875, 20.33447265625, 21.222900390625, 22.111328125, 22.999755859375, 23.88818359375, 24.776611328125, 25.6650390625, 26.553466796875, 27.44189453125, 28.330322265625, 29.21875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 6.0, 6.0, 13.0, 7.0, 8.0, 14.0, 9.0, 17.0, 25.0, 24.0, 29.0, 32.0, 38.0, 41.0, 44.0, 45.0, 47.0, 34.0, 47.0, 38.0, 34.0, 48.0, 40.0, 50.0, 34.0, 34.0, 38.0, 26.0, 24.0, 29.0, 19.0, 14.0, 18.0, 11.0, 9.0, 12.0, 5.0, 3.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-64.0414810180664, -62.051815032958984, -60.06214904785156, -58.072479248046875, -56.08281326293945, -54.09314727783203, -52.10348129272461, -50.11381530761719, -48.1241455078125, -46.13447952270508, -44.144813537597656, -42.15514373779297, -40.16547775268555, -38.175811767578125, -36.1861457824707, -34.19647979736328, -32.20681381225586, -30.217147827148438, -28.227479934692383, -26.23781394958496, -24.248146057128906, -22.258480072021484, -20.268814086914062, -18.27914810180664, -16.289480209350586, -14.299813270568848, -12.31014633178711, -10.320480346679688, -8.33081340789795, -6.341146469116211, -4.351480484008789, -2.361813545227051, -0.3721427917480469, 1.6175239086151123, 3.6071906089782715, 5.596857070922852, 7.58652400970459, 9.576190948486328, 11.56585693359375, 13.555523872375488, 15.545190811157227, 17.53485679626465, 19.524524688720703, 21.514190673828125, 23.503856658935547, 25.4935245513916, 27.483190536499023, 29.472858428955078, 31.4625244140625, 33.45219039916992, 35.441856384277344, 37.43152618408203, 39.42119216918945, 41.410858154296875, 43.4005241394043, 45.39019012451172, 47.379859924316406, 49.36952590942383, 51.35919189453125, 53.34886169433594, 55.33852767944336, 57.32819366455078, 59.3178596496582, 61.307525634765625, 63.29719161987305]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 9.0, 12.0, 17.0, 13.0, 13.0, 21.0, 21.0, 20.0, 30.0, 29.0, 30.0, 43.0, 33.0, 43.0, 34.0, 37.0, 35.0, 47.0, 42.0, 44.0, 56.0, 39.0, 28.0, 33.0, 35.0, 31.0, 32.0, 21.0, 18.0, 27.0, 17.0, 18.0, 12.0, 16.0, 8.0, 5.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.1981086730957, -50.17898178100586, -48.159854888916016, -46.14072799682617, -44.12159729003906, -42.10247039794922, -40.083343505859375, -38.06421661376953, -36.04508972167969, -34.025962829589844, -32.0068359375, -29.987707138061523, -27.96858024597168, -25.949453353881836, -23.93032455444336, -21.911197662353516, -19.892070770263672, -17.872943878173828, -15.853816032409668, -13.834688186645508, -11.815561294555664, -9.79643440246582, -7.77730655670166, -5.7581787109375, -3.7390518188476562, -1.7199244499206543, 0.29920291900634766, 2.3183302879333496, 4.337457656860352, 6.356584548950195, 8.375712394714355, 10.394840240478516, 12.413963317871094, 14.433090209960938, 16.45221710205078, 18.471345901489258, 20.4904727935791, 22.509599685668945, 24.528728485107422, 26.547855377197266, 28.56698226928711, 30.586109161376953, 32.6052360534668, 34.62436294555664, 36.64349365234375, 38.662620544433594, 40.68174743652344, 42.70087432861328, 44.720001220703125, 46.73912811279297, 48.75825500488281, 50.777381896972656, 52.7965087890625, 54.815635681152344, 56.83476638793945, 58.8538932800293, 60.87302017211914, 62.892147064208984, 64.9112777709961, 66.93040466308594, 68.94953155517578, 70.96865844726562, 72.98778533935547, 75.00691223144531, 77.02603912353516]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 10.0, 18.0, 26.0, 32.0, 62.0, 99.0, 123.0, 190.0, 332.0, 512.0, 805.0, 1310.0, 1936.0, 2922.0, 4618.0, 6983.0, 10573.0, 15849.0, 23310.0, 33445.0, 46418.0, 61905.0, 77733.0, 92309.0, 101624.0, 104860.0, 100458.0, 89157.0, 74347.0, 58061.0, 43335.0, 31382.0, 21663.0, 14597.0, 9589.0, 6322.0, 4161.0, 2599.0, 1713.0, 1105.0, 701.0, 478.0, 330.0, 185.0, 125.0, 98.0, 55.0, 38.0, 19.0, 14.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-28.078125, -27.18359375, -26.2890625, -25.39453125, -24.5, -23.60546875, -22.7109375, -21.81640625, -20.921875, -20.02734375, -19.1328125, -18.23828125, -17.34375, -16.44921875, -15.5546875, -14.66015625, -13.765625, -12.87109375, -11.9765625, -11.08203125, -10.1875, -9.29296875, -8.3984375, -7.50390625, -6.609375, -5.71484375, -4.8203125, -3.92578125, -3.03125, -2.13671875, -1.2421875, -0.34765625, 0.546875, 1.44140625, 2.3359375, 3.23046875, 4.125, 5.01953125, 5.9140625, 6.80859375, 7.703125, 8.59765625, 9.4921875, 10.38671875, 11.28125, 12.17578125, 13.0703125, 13.96484375, 14.859375, 15.75390625, 16.6484375, 17.54296875, 18.4375, 19.33203125, 20.2265625, 21.12109375, 22.015625, 22.91015625, 23.8046875, 24.69921875, 25.59375, 26.48828125, 27.3828125, 28.27734375, 29.171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 9.0, 16.0, 15.0, 15.0, 22.0, 21.0, 18.0, 30.0, 31.0, 30.0, 43.0, 35.0, 39.0, 33.0, 41.0, 33.0, 43.0, 42.0, 47.0, 54.0, 41.0, 27.0, 31.0, 34.0, 32.0, 34.0, 23.0, 19.0, 23.0, 19.0, 14.0, 15.0, 14.0, 11.0, 7.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.75, -50.712890625, -48.67578125, -46.638671875, -44.6015625, -42.564453125, -40.52734375, -38.490234375, -36.453125, -34.416015625, -32.37890625, -30.341796875, -28.3046875, -26.267578125, -24.23046875, -22.193359375, -20.15625, -18.119140625, -16.08203125, -14.044921875, -12.0078125, -9.970703125, -7.93359375, -5.896484375, -3.859375, -1.822265625, 0.21484375, 2.251953125, 4.2890625, 6.326171875, 8.36328125, 10.400390625, 12.4375, 14.474609375, 16.51171875, 18.548828125, 20.5859375, 22.623046875, 24.66015625, 26.697265625, 28.734375, 30.771484375, 32.80859375, 34.845703125, 36.8828125, 38.919921875, 40.95703125, 42.994140625, 45.03125, 47.068359375, 49.10546875, 51.142578125, 53.1796875, 55.216796875, 57.25390625, 59.291015625, 61.328125, 63.365234375, 65.40234375, 67.439453125, 69.4765625, 71.513671875, 73.55078125, 75.587890625, 77.625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 13.0, 8.0, 11.0, 23.0, 42.0, 40.0, 66.0, 96.0, 123.0, 178.0, 230.0, 337.0, 462.0, 608.0, 912.0, 1204.0, 1691.0, 2282.0, 3206.0, 4328.0, 5954.0, 8307.0, 11384.0, 15689.0, 22526.0, 64395.0, 673006.0, 142752.0, 25810.0, 17002.0, 12508.0, 9026.0, 6700.0, 4899.0, 3575.0, 2543.0, 1775.0, 1353.0, 950.0, 754.0, 491.0, 381.0, 250.0, 199.0, 146.0, 99.0, 81.0, 47.0, 37.0, 15.0, 13.0, 12.0, 5.0, 4.0, 4.0, 2.0, 1.0, 5.0], "bins": [-47.9375, -46.46875, -45.0, -43.53125, -42.0625, -40.59375, -39.125, -37.65625, -36.1875, -34.71875, -33.25, -31.78125, -30.3125, -28.84375, -27.375, -25.90625, -24.4375, -22.96875, -21.5, -20.03125, -18.5625, -17.09375, -15.625, -14.15625, -12.6875, -11.21875, -9.75, -8.28125, -6.8125, -5.34375, -3.875, -2.40625, -0.9375, 0.53125, 2.0, 3.46875, 4.9375, 6.40625, 7.875, 9.34375, 10.8125, 12.28125, 13.75, 15.21875, 16.6875, 18.15625, 19.625, 21.09375, 22.5625, 24.03125, 25.5, 26.96875, 28.4375, 29.90625, 31.375, 32.84375, 34.3125, 35.78125, 37.25, 38.71875, 40.1875, 41.65625, 43.125, 44.59375, 46.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 10.0, 3.0, 11.0, 7.0, 7.0, 18.0, 13.0, 20.0, 16.0, 16.0, 18.0, 31.0, 39.0, 37.0, 42.0, 43.0, 43.0, 49.0, 43.0, 63.0, 36.0, 46.0, 41.0, 48.0, 37.0, 27.0, 31.0, 38.0, 31.0, 24.0, 22.0, 17.0, 19.0, 18.0, 10.0, 9.0, 3.0, 6.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.78125, -42.1962890625, -40.611328125, -39.0263671875, -37.44140625, -35.8564453125, -34.271484375, -32.6865234375, -31.1015625, -29.5166015625, -27.931640625, -26.3466796875, -24.76171875, -23.1767578125, -21.591796875, -20.0068359375, -18.421875, -16.8369140625, -15.251953125, -13.6669921875, -12.08203125, -10.4970703125, -8.912109375, -7.3271484375, -5.7421875, -4.1572265625, -2.572265625, -0.9873046875, 0.59765625, 2.1826171875, 3.767578125, 5.3525390625, 6.9375, 8.5224609375, 10.107421875, 11.6923828125, 13.27734375, 14.8623046875, 16.447265625, 18.0322265625, 19.6171875, 21.2021484375, 22.787109375, 24.3720703125, 25.95703125, 27.5419921875, 29.126953125, 30.7119140625, 32.296875, 33.8818359375, 35.466796875, 37.0517578125, 38.63671875, 40.2216796875, 41.806640625, 43.3916015625, 44.9765625, 46.5615234375, 48.146484375, 49.7314453125, 51.31640625, 52.9013671875, 54.486328125, 56.0712890625, 57.65625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 20.0, 16.0, 22.0, 27.0, 45.0, 47.0, 65.0, 80.0, 110.0, 145.0, 194.0, 284.0, 369.0, 591.0, 705.0, 1040.0, 1513.0, 2240.0, 3047.0, 4776.0, 6969.0, 10614.0, 16690.0, 30278.0, 148299.0, 679154.0, 72873.0, 24596.0, 14626.0, 9452.0, 6087.0, 4114.0, 2833.0, 1871.0, 1361.0, 913.0, 658.0, 480.0, 338.0, 256.0, 193.0, 132.0, 124.0, 83.0, 52.0, 44.0, 31.0, 24.0, 12.0, 22.0, 5.0, 14.0, 6.0, 3.0, 4.0, 1.0, 3.0], "bins": [-4.98046875, -4.8265380859375, -4.672607421875, -4.5186767578125, -4.36474609375, -4.2108154296875, -4.056884765625, -3.9029541015625, -3.7490234375, -3.5950927734375, -3.441162109375, -3.2872314453125, -3.13330078125, -2.9793701171875, -2.825439453125, -2.6715087890625, -2.517578125, -2.3636474609375, -2.209716796875, -2.0557861328125, -1.90185546875, -1.7479248046875, -1.593994140625, -1.4400634765625, -1.2861328125, -1.1322021484375, -0.978271484375, -0.8243408203125, -0.67041015625, -0.5164794921875, -0.362548828125, -0.2086181640625, -0.0546875, 0.0992431640625, 0.253173828125, 0.4071044921875, 0.56103515625, 0.7149658203125, 0.868896484375, 1.0228271484375, 1.1767578125, 1.3306884765625, 1.484619140625, 1.6385498046875, 1.79248046875, 1.9464111328125, 2.100341796875, 2.2542724609375, 2.408203125, 2.5621337890625, 2.716064453125, 2.8699951171875, 3.02392578125, 3.1778564453125, 3.331787109375, 3.4857177734375, 3.6396484375, 3.7935791015625, 3.947509765625, 4.1014404296875, 4.25537109375, 4.4093017578125, 4.563232421875, 4.7171630859375, 4.87109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 6.0, 6.0, 4.0, 9.0, 7.0, 12.0, 14.0, 7.0, 15.0, 16.0, 27.0, 29.0, 19.0, 29.0, 28.0, 38.0, 40.0, 42.0, 47.0, 44.0, 42.0, 43.0, 52.0, 46.0, 53.0, 41.0, 40.0, 41.0, 25.0, 26.0, 21.0, 24.0, 22.0, 17.0, 9.0, 11.0, 11.0, 4.0, 6.0, 10.0, 6.0, 1.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0011510848999023438, -0.0011145174503326416, -0.0010779500007629395, -0.0010413825511932373, -0.0010048151016235352, -0.000968247652053833, -0.0009316802024841309, -0.0008951127529144287, -0.0008585453033447266, -0.0008219778537750244, -0.0007854104042053223, -0.0007488429546356201, -0.000712275505065918, -0.0006757080554962158, -0.0006391406059265137, -0.0006025731563568115, -0.0005660057067871094, -0.0005294382572174072, -0.0004928708076477051, -0.00045630335807800293, -0.0004197359085083008, -0.00038316845893859863, -0.0003466010093688965, -0.00031003355979919434, -0.0002734661102294922, -0.00023689866065979004, -0.0002003312110900879, -0.00016376376152038574, -0.0001271963119506836, -9.062886238098145e-05, -5.40614128112793e-05, -1.749396324157715e-05, 1.9073486328125e-05, 5.564093589782715e-05, 9.22083854675293e-05, 0.00012877583503723145, 0.0001653432846069336, 0.00020191073417663574, 0.0002384781837463379, 0.00027504563331604004, 0.0003116130828857422, 0.00034818053245544434, 0.0003847479820251465, 0.00042131543159484863, 0.0004578828811645508, 0.0004944503307342529, 0.0005310177803039551, 0.0005675852298736572, 0.0006041526794433594, 0.0006407201290130615, 0.0006772875785827637, 0.0007138550281524658, 0.000750422477722168, 0.0007869899272918701, 0.0008235573768615723, 0.0008601248264312744, 0.0008966922760009766, 0.0009332597255706787, 0.0009698271751403809, 0.001006394624710083, 0.0010429620742797852, 0.0010795295238494873, 0.0011160969734191895, 0.0011526644229888916, 0.0011892318725585938]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 4.0, 9.0, 6.0, 12.0, 17.0, 31.0, 42.0, 61.0, 82.0, 158.0, 176.0, 338.0, 453.0, 696.0, 993.0, 1501.0, 2310.0, 3416.0, 5375.0, 8284.0, 12780.0, 19713.0, 30933.0, 46364.0, 68397.0, 93987.0, 119371.0, 134051.0, 129967.0, 111039.0, 83812.0, 59623.0, 40182.0, 26158.0, 16721.0, 10956.0, 7068.0, 4629.0, 2926.0, 1983.0, 1275.0, 918.0, 592.0, 380.0, 268.0, 178.0, 111.0, 65.0, 62.0, 35.0, 16.0, 15.0, 11.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0], "bins": [-2.68359375, -2.5992431640625, -2.514892578125, -2.4305419921875, -2.34619140625, -2.2618408203125, -2.177490234375, -2.0931396484375, -2.0087890625, -1.9244384765625, -1.840087890625, -1.7557373046875, -1.67138671875, -1.5870361328125, -1.502685546875, -1.4183349609375, -1.333984375, -1.2496337890625, -1.165283203125, -1.0809326171875, -0.99658203125, -0.9122314453125, -0.827880859375, -0.7435302734375, -0.6591796875, -0.5748291015625, -0.490478515625, -0.4061279296875, -0.32177734375, -0.2374267578125, -0.153076171875, -0.0687255859375, 0.015625, 0.0999755859375, 0.184326171875, 0.2686767578125, 0.35302734375, 0.4373779296875, 0.521728515625, 0.6060791015625, 0.6904296875, 0.7747802734375, 0.859130859375, 0.9434814453125, 1.02783203125, 1.1121826171875, 1.196533203125, 1.2808837890625, 1.365234375, 1.4495849609375, 1.533935546875, 1.6182861328125, 1.70263671875, 1.7869873046875, 1.871337890625, 1.9556884765625, 2.0400390625, 2.1243896484375, 2.208740234375, 2.2930908203125, 2.37744140625, 2.4617919921875, 2.546142578125, 2.6304931640625, 2.71484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 5.0, 2.0, 7.0, 3.0, 21.0, 13.0, 12.0, 23.0, 19.0, 30.0, 29.0, 36.0, 43.0, 41.0, 49.0, 43.0, 49.0, 56.0, 49.0, 54.0, 59.0, 44.0, 54.0, 42.0, 35.0, 38.0, 20.0, 14.0, 21.0, 15.0, 16.0, 5.0, 13.0, 11.0, 4.0, 10.0, 6.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.078125, -1.0448760986328125, -1.011627197265625, -0.9783782958984375, -0.94512939453125, -0.9118804931640625, -0.878631591796875, -0.8453826904296875, -0.8121337890625, -0.7788848876953125, -0.745635986328125, -0.7123870849609375, -0.67913818359375, -0.6458892822265625, -0.612640380859375, -0.5793914794921875, -0.546142578125, -0.5128936767578125, -0.479644775390625, -0.4463958740234375, -0.41314697265625, -0.3798980712890625, -0.346649169921875, -0.3134002685546875, -0.2801513671875, -0.2469024658203125, -0.213653564453125, -0.1804046630859375, -0.14715576171875, -0.1139068603515625, -0.080657958984375, -0.0474090576171875, -0.01416015625, 0.0190887451171875, 0.052337646484375, 0.0855865478515625, 0.11883544921875, 0.1520843505859375, 0.185333251953125, 0.2185821533203125, 0.2518310546875, 0.2850799560546875, 0.318328857421875, 0.3515777587890625, 0.38482666015625, 0.4180755615234375, 0.451324462890625, 0.4845733642578125, 0.517822265625, 0.5510711669921875, 0.584320068359375, 0.6175689697265625, 0.65081787109375, 0.6840667724609375, 0.717315673828125, 0.7505645751953125, 0.7838134765625, 0.8170623779296875, 0.850311279296875, 0.8835601806640625, 0.91680908203125, 0.9500579833984375, 0.983306884765625, 1.0165557861328125, 1.0498046875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 5.0, 9.0, 7.0, 14.0, 13.0, 22.0, 16.0, 27.0, 34.0, 44.0, 25.0, 27.0, 46.0, 45.0, 53.0, 58.0, 55.0, 48.0, 45.0, 46.0, 37.0, 39.0, 51.0, 36.0, 39.0, 31.0, 18.0, 12.0, 24.0, 17.0, 13.0, 12.0, 2.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-76.9545669555664, -74.69002532958984, -72.42549133300781, -70.16094970703125, -67.89641571044922, -65.63187408447266, -63.36733627319336, -61.10279846191406, -58.838260650634766, -56.57372283935547, -54.30918502807617, -52.044647216796875, -49.78010559082031, -47.51557159423828, -45.25102996826172, -42.98649215698242, -40.721954345703125, -38.45741653442383, -36.19287872314453, -33.928340911865234, -31.663801193237305, -29.399263381958008, -27.134723663330078, -24.87018585205078, -22.605648040771484, -20.341110229492188, -18.07657241821289, -15.812032699584961, -13.547494888305664, -11.282957077026367, -9.018418312072754, -6.753879547119141, -4.4893341064453125, -2.2247958183288574, 0.039742469787597656, 2.3042807579040527, 4.568819046020508, 6.833356857299805, 9.097895622253418, 11.362434387207031, 13.626972198486328, 15.891510009765625, 18.156047821044922, 20.42058753967285, 22.68512535095215, 24.949663162231445, 27.214202880859375, 29.478740692138672, 31.74327850341797, 34.007816314697266, 36.27235412597656, 38.53689193725586, 40.801429748535156, 43.06597137451172, 45.330509185791016, 47.59504699707031, 49.85958480834961, 52.124122619628906, 54.3886604309082, 56.6531982421875, 58.91773986816406, 61.182273864746094, 63.446815490722656, 65.71134948730469, 67.97589111328125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 7.0, 6.0, 7.0, 10.0, 11.0, 13.0, 20.0, 12.0, 27.0, 18.0, 29.0, 23.0, 34.0, 39.0, 39.0, 33.0, 43.0, 34.0, 31.0, 44.0, 45.0, 44.0, 53.0, 47.0, 34.0, 28.0, 35.0, 37.0, 27.0, 26.0, 22.0, 20.0, 25.0, 15.0, 14.0, 14.0, 9.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.366737365722656, -52.296630859375, -50.22652816772461, -48.15642166137695, -46.08631896972656, -44.016212463378906, -41.94610595703125, -39.875999450683594, -37.8058967590332, -35.73579025268555, -33.665687561035156, -31.5955810546875, -29.525476455688477, -27.455371856689453, -25.385265350341797, -23.315160751342773, -21.24505615234375, -19.174951553344727, -17.104846954345703, -15.034740447998047, -12.964635848999023, -10.89453125, -8.82442569732666, -6.75432014465332, -4.684215545654297, -2.6141104698181152, -0.5440053939819336, 1.526099681854248, 3.5962047576904297, 5.666309356689453, 7.736414909362793, 9.806520462036133, 11.876617431640625, 13.946722030639648, 16.016826629638672, 18.086933135986328, 20.15703773498535, 22.227142333984375, 24.29724884033203, 26.367353439331055, 28.437458038330078, 30.5075626373291, 32.577667236328125, 34.64777374267578, 36.71788024902344, 38.78798294067383, 40.858089447021484, 42.928192138671875, 44.99829864501953, 47.06840515136719, 49.13850784301758, 51.208614349365234, 53.278717041015625, 55.34882354736328, 57.41893005371094, 59.489036560058594, 61.559139251708984, 63.62924575805664, 65.69934844970703, 67.76945495605469, 69.83956146240234, 71.90966796875, 73.97976684570312, 76.04987335205078, 78.11997985839844]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 12.0, 30.0, 54.0, 54.0, 92.0, 157.0, 224.0, 417.0, 633.0, 1040.0, 1811.0, 3028.0, 4995.0, 8713.0, 14132.0, 23245.0, 36536.0, 54820.0, 78354.0, 100563.0, 119748.0, 127566.0, 122210.0, 104890.0, 82340.0, 58774.0, 39752.0, 25528.0, 15418.0, 9606.0, 5499.0, 3240.0, 1958.0, 1195.0, 739.0, 464.0, 268.0, 164.0, 106.0, 66.0, 39.0, 21.0, 16.0, 12.0, 8.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.21875, -51.42041015625, -49.6220703125, -47.82373046875, -46.025390625, -44.22705078125, -42.4287109375, -40.63037109375, -38.83203125, -37.03369140625, -35.2353515625, -33.43701171875, -31.638671875, -29.84033203125, -28.0419921875, -26.24365234375, -24.4453125, -22.64697265625, -20.8486328125, -19.05029296875, -17.251953125, -15.45361328125, -13.6552734375, -11.85693359375, -10.05859375, -8.26025390625, -6.4619140625, -4.66357421875, -2.865234375, -1.06689453125, 0.7314453125, 2.52978515625, 4.328125, 6.12646484375, 7.9248046875, 9.72314453125, 11.521484375, 13.31982421875, 15.1181640625, 16.91650390625, 18.71484375, 20.51318359375, 22.3115234375, 24.10986328125, 25.908203125, 27.70654296875, 29.5048828125, 31.30322265625, 33.1015625, 34.89990234375, 36.6982421875, 38.49658203125, 40.294921875, 42.09326171875, 43.8916015625, 45.68994140625, 47.48828125, 49.28662109375, 51.0849609375, 52.88330078125, 54.681640625, 56.47998046875, 58.2783203125, 60.07666015625, 61.875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 6.0, 7.0, 10.0, 12.0, 17.0, 12.0, 20.0, 20.0, 28.0, 28.0, 24.0, 39.0, 40.0, 43.0, 37.0, 39.0, 42.0, 41.0, 45.0, 38.0, 53.0, 48.0, 42.0, 35.0, 26.0, 32.0, 42.0, 22.0, 19.0, 27.0, 23.0, 17.0, 14.0, 9.0, 17.0, 3.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.59375, -51.58349609375, -49.5732421875, -47.56298828125, -45.552734375, -43.54248046875, -41.5322265625, -39.52197265625, -37.51171875, -35.50146484375, -33.4912109375, -31.48095703125, -29.470703125, -27.46044921875, -25.4501953125, -23.43994140625, -21.4296875, -19.41943359375, -17.4091796875, -15.39892578125, -13.388671875, -11.37841796875, -9.3681640625, -7.35791015625, -5.34765625, -3.33740234375, -1.3271484375, 0.68310546875, 2.693359375, 4.70361328125, 6.7138671875, 8.72412109375, 10.734375, 12.74462890625, 14.7548828125, 16.76513671875, 18.775390625, 20.78564453125, 22.7958984375, 24.80615234375, 26.81640625, 28.82666015625, 30.8369140625, 32.84716796875, 34.857421875, 36.86767578125, 38.8779296875, 40.88818359375, 42.8984375, 44.90869140625, 46.9189453125, 48.92919921875, 50.939453125, 52.94970703125, 54.9599609375, 56.97021484375, 58.98046875, 60.99072265625, 63.0009765625, 65.01123046875, 67.021484375, 69.03173828125, 71.0419921875, 73.05224609375, 75.0625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 9.0, 20.0, 15.0, 28.0, 50.0, 58.0, 95.0, 175.0, 232.0, 394.0, 696.0, 1147.0, 1897.0, 3335.0, 5858.0, 10277.0, 17876.0, 30313.0, 49846.0, 76312.0, 106124.0, 132568.0, 144737.0, 136808.0, 112506.0, 82177.0, 54129.0, 33830.0, 19925.0, 11495.0, 6673.0, 3649.0, 2164.0, 1221.0, 720.0, 430.0, 254.0, 165.0, 137.0, 72.0, 46.0, 30.0, 15.0, 15.0, 11.0, 7.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0, 3.0], "bins": [-70.5625, -68.46240234375, -66.3623046875, -64.26220703125, -62.162109375, -60.06201171875, -57.9619140625, -55.86181640625, -53.76171875, -51.66162109375, -49.5615234375, -47.46142578125, -45.361328125, -43.26123046875, -41.1611328125, -39.06103515625, -36.9609375, -34.86083984375, -32.7607421875, -30.66064453125, -28.560546875, -26.46044921875, -24.3603515625, -22.26025390625, -20.16015625, -18.06005859375, -15.9599609375, -13.85986328125, -11.759765625, -9.65966796875, -7.5595703125, -5.45947265625, -3.359375, -1.25927734375, 0.8408203125, 2.94091796875, 5.041015625, 7.14111328125, 9.2412109375, 11.34130859375, 13.44140625, 15.54150390625, 17.6416015625, 19.74169921875, 21.841796875, 23.94189453125, 26.0419921875, 28.14208984375, 30.2421875, 32.34228515625, 34.4423828125, 36.54248046875, 38.642578125, 40.74267578125, 42.8427734375, 44.94287109375, 47.04296875, 49.14306640625, 51.2431640625, 53.34326171875, 55.443359375, 57.54345703125, 59.6435546875, 61.74365234375, 63.84375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 4.0, 10.0, 16.0, 17.0, 15.0, 22.0, 17.0, 24.0, 33.0, 29.0, 29.0, 35.0, 25.0, 44.0, 52.0, 46.0, 48.0, 48.0, 63.0, 37.0, 40.0, 34.0, 33.0, 36.0, 37.0, 29.0, 17.0, 21.0, 25.0, 24.0, 11.0, 18.0, 8.0, 9.0, 5.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-44.625, -43.2900390625, -41.955078125, -40.6201171875, -39.28515625, -37.9501953125, -36.615234375, -35.2802734375, -33.9453125, -32.6103515625, -31.275390625, -29.9404296875, -28.60546875, -27.2705078125, -25.935546875, -24.6005859375, -23.265625, -21.9306640625, -20.595703125, -19.2607421875, -17.92578125, -16.5908203125, -15.255859375, -13.9208984375, -12.5859375, -11.2509765625, -9.916015625, -8.5810546875, -7.24609375, -5.9111328125, -4.576171875, -3.2412109375, -1.90625, -0.5712890625, 0.763671875, 2.0986328125, 3.43359375, 4.7685546875, 6.103515625, 7.4384765625, 8.7734375, 10.1083984375, 11.443359375, 12.7783203125, 14.11328125, 15.4482421875, 16.783203125, 18.1181640625, 19.453125, 20.7880859375, 22.123046875, 23.4580078125, 24.79296875, 26.1279296875, 27.462890625, 28.7978515625, 30.1328125, 31.4677734375, 32.802734375, 34.1376953125, 35.47265625, 36.8076171875, 38.142578125, 39.4775390625, 40.8125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 9.0, 21.0, 21.0, 33.0, 69.0, 89.0, 150.0, 244.0, 399.0, 649.0, 997.0, 1658.0, 3078.0, 5311.0, 9758.0, 18873.0, 36113.0, 66712.0, 116137.0, 167339.0, 191749.0, 168234.0, 115608.0, 67664.0, 36050.0, 18911.0, 9883.0, 5299.0, 3039.0, 1727.0, 1047.0, 603.0, 379.0, 233.0, 164.0, 90.0, 75.0, 45.0, 26.0, 21.0, 21.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.578125, -24.711181640625, -23.84423828125, -22.977294921875, -22.1103515625, -21.243408203125, -20.37646484375, -19.509521484375, -18.642578125, -17.775634765625, -16.90869140625, -16.041748046875, -15.1748046875, -14.307861328125, -13.44091796875, -12.573974609375, -11.70703125, -10.840087890625, -9.97314453125, -9.106201171875, -8.2392578125, -7.372314453125, -6.50537109375, -5.638427734375, -4.771484375, -3.904541015625, -3.03759765625, -2.170654296875, -1.3037109375, -0.436767578125, 0.43017578125, 1.297119140625, 2.1640625, 3.031005859375, 3.89794921875, 4.764892578125, 5.6318359375, 6.498779296875, 7.36572265625, 8.232666015625, 9.099609375, 9.966552734375, 10.83349609375, 11.700439453125, 12.5673828125, 13.434326171875, 14.30126953125, 15.168212890625, 16.03515625, 16.902099609375, 17.76904296875, 18.635986328125, 19.5029296875, 20.369873046875, 21.23681640625, 22.103759765625, 22.970703125, 23.837646484375, 24.70458984375, 25.571533203125, 26.4384765625, 27.305419921875, 28.17236328125, 29.039306640625, 29.90625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 6.0, 6.0, 9.0, 5.0, 22.0, 17.0, 14.0, 22.0, 29.0, 27.0, 34.0, 34.0, 50.0, 35.0, 54.0, 51.0, 64.0, 55.0, 52.0, 50.0, 56.0, 43.0, 39.0, 33.0, 26.0, 24.0, 32.0, 21.0, 17.0, 12.0, 10.0, 8.0, 10.0, 6.0, 5.0, 10.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0024166107177734375, -0.0023413002490997314, -0.0022659897804260254, -0.0021906793117523193, -0.0021153688430786133, -0.0020400583744049072, -0.001964747905731201, -0.0018894374370574951, -0.001814126968383789, -0.001738816499710083, -0.001663506031036377, -0.001588195562362671, -0.0015128850936889648, -0.0014375746250152588, -0.0013622641563415527, -0.0012869536876678467, -0.0012116432189941406, -0.0011363327503204346, -0.0010610222816467285, -0.0009857118129730225, -0.0009104013442993164, -0.0008350908756256104, -0.0007597804069519043, -0.0006844699382781982, -0.0006091594696044922, -0.0005338490009307861, -0.0004585385322570801, -0.000383228063583374, -0.00030791759490966797, -0.00023260712623596191, -0.00015729665756225586, -8.19861888885498e-05, -6.67572021484375e-06, 6.86347484588623e-05, 0.00014394521713256836, 0.00021925568580627441, 0.00029456615447998047, 0.0003698766231536865, 0.0004451870918273926, 0.0005204975605010986, 0.0005958080291748047, 0.0006711184978485107, 0.0007464289665222168, 0.0008217394351959229, 0.0008970499038696289, 0.000972360372543335, 0.001047670841217041, 0.001122981309890747, 0.0011982917785644531, 0.0012736022472381592, 0.0013489127159118652, 0.0014242231845855713, 0.0014995336532592773, 0.0015748441219329834, 0.0016501545906066895, 0.0017254650592803955, 0.0018007755279541016, 0.0018760859966278076, 0.0019513964653015137, 0.0020267069339752197, 0.0021020174026489258, 0.002177327871322632, 0.002252638339996338, 0.002327948808670044, 0.00240325927734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 9.0, 8.0, 13.0, 21.0, 33.0, 44.0, 88.0, 134.0, 213.0, 312.0, 465.0, 740.0, 1141.0, 1815.0, 2802.0, 4334.0, 6985.0, 10980.0, 17648.0, 27088.0, 41986.0, 61827.0, 85937.0, 110041.0, 127232.0, 129828.0, 117323.0, 95160.0, 69609.0, 47287.0, 31578.0, 20409.0, 12921.0, 8158.0, 5285.0, 3249.0, 2050.0, 1320.0, 874.0, 577.0, 377.0, 220.0, 138.0, 102.0, 70.0, 51.0, 24.0, 20.0, 14.0, 10.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.234375, -16.6435546875, -16.052734375, -15.4619140625, -14.87109375, -14.2802734375, -13.689453125, -13.0986328125, -12.5078125, -11.9169921875, -11.326171875, -10.7353515625, -10.14453125, -9.5537109375, -8.962890625, -8.3720703125, -7.78125, -7.1904296875, -6.599609375, -6.0087890625, -5.41796875, -4.8271484375, -4.236328125, -3.6455078125, -3.0546875, -2.4638671875, -1.873046875, -1.2822265625, -0.69140625, -0.1005859375, 0.490234375, 1.0810546875, 1.671875, 2.2626953125, 2.853515625, 3.4443359375, 4.03515625, 4.6259765625, 5.216796875, 5.8076171875, 6.3984375, 6.9892578125, 7.580078125, 8.1708984375, 8.76171875, 9.3525390625, 9.943359375, 10.5341796875, 11.125, 11.7158203125, 12.306640625, 12.8974609375, 13.48828125, 14.0791015625, 14.669921875, 15.2607421875, 15.8515625, 16.4423828125, 17.033203125, 17.6240234375, 18.21484375, 18.8056640625, 19.396484375, 19.9873046875, 20.578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 8.0, 8.0, 12.0, 10.0, 9.0, 14.0, 16.0, 23.0, 31.0, 26.0, 28.0, 47.0, 38.0, 36.0, 53.0, 57.0, 41.0, 45.0, 43.0, 47.0, 51.0, 41.0, 41.0, 39.0, 34.0, 39.0, 23.0, 24.0, 20.0, 15.0, 11.0, 12.0, 8.0, 6.0, 9.0, 5.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.96875, -7.7108154296875, -7.452880859375, -7.1949462890625, -6.93701171875, -6.6790771484375, -6.421142578125, -6.1632080078125, -5.9052734375, -5.6473388671875, -5.389404296875, -5.1314697265625, -4.87353515625, -4.6156005859375, -4.357666015625, -4.0997314453125, -3.841796875, -3.5838623046875, -3.325927734375, -3.0679931640625, -2.81005859375, -2.5521240234375, -2.294189453125, -2.0362548828125, -1.7783203125, -1.5203857421875, -1.262451171875, -1.0045166015625, -0.74658203125, -0.4886474609375, -0.230712890625, 0.0272216796875, 0.28515625, 0.5430908203125, 0.801025390625, 1.0589599609375, 1.31689453125, 1.5748291015625, 1.832763671875, 2.0906982421875, 2.3486328125, 2.6065673828125, 2.864501953125, 3.1224365234375, 3.38037109375, 3.6383056640625, 3.896240234375, 4.1541748046875, 4.412109375, 4.6700439453125, 4.927978515625, 5.1859130859375, 5.44384765625, 5.7017822265625, 5.959716796875, 6.2176513671875, 6.4755859375, 6.7335205078125, 6.991455078125, 7.2493896484375, 7.50732421875, 7.7652587890625, 8.023193359375, 8.2811279296875, 8.5390625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 13.0, 6.0, 3.0, 7.0, 20.0, 25.0, 27.0, 26.0, 29.0, 51.0, 37.0, 53.0, 43.0, 51.0, 48.0, 46.0, 64.0, 52.0, 40.0, 43.0, 41.0, 43.0, 38.0, 30.0, 35.0, 21.0, 22.0, 18.0, 15.0, 8.0, 9.0, 9.0, 5.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-80.9693832397461, -78.72274780273438, -76.47611999511719, -74.22948455810547, -71.98284912109375, -69.73622131347656, -67.48958587646484, -65.24295043945312, -62.99632263183594, -60.749691009521484, -58.503055572509766, -56.25642395019531, -54.00979232788086, -51.763160705566406, -49.51652526855469, -47.269893646240234, -45.023258209228516, -42.77662658691406, -40.529991149902344, -38.28335952758789, -36.03672790527344, -33.79009246826172, -31.543460845947266, -29.296829223632812, -27.050195693969727, -24.80356216430664, -22.556930541992188, -20.3102970123291, -18.063663482666016, -15.817031860351562, -13.570398330688477, -11.323765754699707, -9.077136993408203, -6.830504417419434, -4.583871364593506, -2.337238311767578, -0.0906057357788086, 2.156026840209961, 4.402660369873047, 6.649292945861816, 8.895925521850586, 11.142558097839355, 13.389190673828125, 15.635824203491211, 17.882457733154297, 20.12908935546875, 22.375722885131836, 24.622356414794922, 26.868988037109375, 29.11562156677246, 31.362253189086914, 33.60888671875, 35.85551834106445, 38.102149963378906, 40.348785400390625, 42.59541702270508, 44.84204864501953, 47.088680267333984, 49.3353157043457, 51.581947326660156, 53.82857894897461, 56.07521057128906, 58.32184600830078, 60.568477630615234, 62.81511306762695]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 0.0, 7.0, 5.0, 6.0, 11.0, 10.0, 14.0, 14.0, 19.0, 20.0, 16.0, 24.0, 19.0, 29.0, 25.0, 28.0, 41.0, 28.0, 32.0, 34.0, 38.0, 34.0, 35.0, 50.0, 42.0, 32.0, 40.0, 52.0, 38.0, 32.0, 20.0, 30.0, 22.0, 21.0, 20.0, 17.0, 11.0, 20.0, 7.0, 14.0, 8.0, 6.0, 9.0, 14.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.210289001464844, -47.3166389465332, -45.42298889160156, -43.52933883666992, -41.63568878173828, -39.74203872680664, -37.848388671875, -35.95473861694336, -34.06108856201172, -32.16743850708008, -30.273788452148438, -28.380138397216797, -26.486488342285156, -24.592838287353516, -22.699188232421875, -20.805538177490234, -18.911888122558594, -17.018238067626953, -15.124588012695312, -13.230937957763672, -11.337287902832031, -9.44363784790039, -7.54998779296875, -5.656337738037109, -3.7626876831054688, -1.8690376281738281, 0.0246124267578125, 1.9182624816894531, 3.8119125366210938, 5.705562591552734, 7.599212646484375, 9.492862701416016, 11.386512756347656, 13.280162811279297, 15.173812866210938, 17.067462921142578, 18.96111297607422, 20.85476303100586, 22.7484130859375, 24.64206314086914, 26.53571319580078, 28.429363250732422, 30.323013305664062, 32.2166633605957, 34.110313415527344, 36.003963470458984, 37.897613525390625, 39.791263580322266, 41.684913635253906, 43.57856369018555, 45.47221374511719, 47.36586380004883, 49.25951385498047, 51.15316390991211, 53.04681396484375, 54.94046401977539, 56.83411407470703, 58.72776412963867, 60.62141418457031, 62.51506423950195, 64.4087142944336, 66.3023681640625, 68.19601440429688, 70.08966064453125, 71.98331451416016]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 4.0, 8.0, 14.0, 37.0, 78.0, 105.0, 185.0, 367.0, 622.0, 1072.0, 1786.0, 3272.0, 5462.0, 9482.0, 16255.0, 27320.0, 46254.0, 76401.0, 123816.0, 192599.0, 287775.0, 396848.0, 494906.0, 548059.0, 528717.0, 449178.0, 342064.0, 238779.0, 156122.0, 97683.0, 60333.0, 36029.0, 21283.0, 12538.0, 7570.0, 4350.0, 2751.0, 1596.0, 989.0, 585.0, 392.0, 231.0, 124.0, 77.0, 65.0, 42.0, 21.0, 13.0, 13.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-49.21875, -47.56494140625, -45.9111328125, -44.25732421875, -42.603515625, -40.94970703125, -39.2958984375, -37.64208984375, -35.98828125, -34.33447265625, -32.6806640625, -31.02685546875, -29.373046875, -27.71923828125, -26.0654296875, -24.41162109375, -22.7578125, -21.10400390625, -19.4501953125, -17.79638671875, -16.142578125, -14.48876953125, -12.8349609375, -11.18115234375, -9.52734375, -7.87353515625, -6.2197265625, -4.56591796875, -2.912109375, -1.25830078125, 0.3955078125, 2.04931640625, 3.703125, 5.35693359375, 7.0107421875, 8.66455078125, 10.318359375, 11.97216796875, 13.6259765625, 15.27978515625, 16.93359375, 18.58740234375, 20.2412109375, 21.89501953125, 23.548828125, 25.20263671875, 26.8564453125, 28.51025390625, 30.1640625, 31.81787109375, 33.4716796875, 35.12548828125, 36.779296875, 38.43310546875, 40.0869140625, 41.74072265625, 43.39453125, 45.04833984375, 46.7021484375, 48.35595703125, 50.009765625, 51.66357421875, 53.3173828125, 54.97119140625, 56.625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 2.0, 9.0, 12.0, 18.0, 12.0, 15.0, 18.0, 26.0, 22.0, 19.0, 28.0, 32.0, 31.0, 33.0, 34.0, 41.0, 39.0, 37.0, 34.0, 50.0, 42.0, 40.0, 33.0, 58.0, 36.0, 32.0, 37.0, 24.0, 25.0, 27.0, 15.0, 16.0, 16.0, 14.0, 16.0, 11.0, 4.0, 11.0, 8.0, 9.0, 7.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0, -45.2353515625, -43.470703125, -41.7060546875, -39.94140625, -38.1767578125, -36.412109375, -34.6474609375, -32.8828125, -31.1181640625, -29.353515625, -27.5888671875, -25.82421875, -24.0595703125, -22.294921875, -20.5302734375, -18.765625, -17.0009765625, -15.236328125, -13.4716796875, -11.70703125, -9.9423828125, -8.177734375, -6.4130859375, -4.6484375, -2.8837890625, -1.119140625, 0.6455078125, 2.41015625, 4.1748046875, 5.939453125, 7.7041015625, 9.46875, 11.2333984375, 12.998046875, 14.7626953125, 16.52734375, 18.2919921875, 20.056640625, 21.8212890625, 23.5859375, 25.3505859375, 27.115234375, 28.8798828125, 30.64453125, 32.4091796875, 34.173828125, 35.9384765625, 37.703125, 39.4677734375, 41.232421875, 42.9970703125, 44.76171875, 46.5263671875, 48.291015625, 50.0556640625, 51.8203125, 53.5849609375, 55.349609375, 57.1142578125, 58.87890625, 60.6435546875, 62.408203125, 64.1728515625, 65.9375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 18.0, 20.0, 38.0, 61.0, 70.0, 127.0, 217.0, 347.0, 554.0, 850.0, 1461.0, 2496.0, 4118.0, 6591.0, 10900.0, 17607.0, 28185.0, 45196.0, 70206.0, 106360.0, 158942.0, 222483.0, 298108.0, 376806.0, 437719.0, 467376.0, 452248.0, 398707.0, 324433.0, 246083.0, 176631.0, 121236.0, 80127.0, 51918.0, 33282.0, 20410.0, 12422.0, 7885.0, 4689.0, 2832.0, 1783.0, 1063.0, 658.0, 394.0, 230.0, 159.0, 94.0, 50.0, 29.0, 26.0, 14.0, 11.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-50.625, -49.02587890625, -47.4267578125, -45.82763671875, -44.228515625, -42.62939453125, -41.0302734375, -39.43115234375, -37.83203125, -36.23291015625, -34.6337890625, -33.03466796875, -31.435546875, -29.83642578125, -28.2373046875, -26.63818359375, -25.0390625, -23.43994140625, -21.8408203125, -20.24169921875, -18.642578125, -17.04345703125, -15.4443359375, -13.84521484375, -12.24609375, -10.64697265625, -9.0478515625, -7.44873046875, -5.849609375, -4.25048828125, -2.6513671875, -1.05224609375, 0.546875, 2.14599609375, 3.7451171875, 5.34423828125, 6.943359375, 8.54248046875, 10.1416015625, 11.74072265625, 13.33984375, 14.93896484375, 16.5380859375, 18.13720703125, 19.736328125, 21.33544921875, 22.9345703125, 24.53369140625, 26.1328125, 27.73193359375, 29.3310546875, 30.93017578125, 32.529296875, 34.12841796875, 35.7275390625, 37.32666015625, 38.92578125, 40.52490234375, 42.1240234375, 43.72314453125, 45.322265625, 46.92138671875, 48.5205078125, 50.11962890625, 51.71875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 4.0, 12.0, 20.0, 21.0, 23.0, 23.0, 43.0, 38.0, 53.0, 57.0, 57.0, 84.0, 103.0, 105.0, 154.0, 161.0, 150.0, 206.0, 198.0, 199.0, 214.0, 258.0, 215.0, 197.0, 197.0, 190.0, 143.0, 144.0, 143.0, 114.0, 108.0, 83.0, 76.0, 55.0, 43.0, 41.0, 38.0, 27.0, 18.0, 16.0, 7.0, 13.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0], "bins": [-27.703125, -26.891357421875, -26.07958984375, -25.267822265625, -24.4560546875, -23.644287109375, -22.83251953125, -22.020751953125, -21.208984375, -20.397216796875, -19.58544921875, -18.773681640625, -17.9619140625, -17.150146484375, -16.33837890625, -15.526611328125, -14.71484375, -13.903076171875, -13.09130859375, -12.279541015625, -11.4677734375, -10.656005859375, -9.84423828125, -9.032470703125, -8.220703125, -7.408935546875, -6.59716796875, -5.785400390625, -4.9736328125, -4.161865234375, -3.35009765625, -2.538330078125, -1.7265625, -0.914794921875, -0.10302734375, 0.708740234375, 1.5205078125, 2.332275390625, 3.14404296875, 3.955810546875, 4.767578125, 5.579345703125, 6.39111328125, 7.202880859375, 8.0146484375, 8.826416015625, 9.63818359375, 10.449951171875, 11.26171875, 12.073486328125, 12.88525390625, 13.697021484375, 14.5087890625, 15.320556640625, 16.13232421875, 16.944091796875, 17.755859375, 18.567626953125, 19.37939453125, 20.191162109375, 21.0029296875, 21.814697265625, 22.62646484375, 23.438232421875, 24.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 9.0, 13.0, 9.0, 11.0, 19.0, 14.0, 15.0, 13.0, 30.0, 26.0, 25.0, 28.0, 22.0, 35.0, 43.0, 53.0, 29.0, 38.0, 38.0, 41.0, 26.0, 43.0, 24.0, 32.0, 35.0, 33.0, 22.0, 26.0, 26.0, 25.0, 32.0, 18.0, 19.0, 20.0, 19.0, 12.0, 16.0, 14.0, 10.0, 3.0, 8.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-59.39789962768555, -57.643192291259766, -55.888484954833984, -54.1337776184082, -52.37907028198242, -50.62436294555664, -48.869659423828125, -47.114952087402344, -45.36024475097656, -43.60553741455078, -41.850830078125, -40.09612274169922, -38.34141540527344, -36.586708068847656, -34.832000732421875, -33.077293395996094, -31.322586059570312, -29.56787872314453, -27.81317138671875, -26.05846405029297, -24.303756713867188, -22.549049377441406, -20.794343948364258, -19.039636611938477, -17.284929275512695, -15.530221939086914, -13.775514602661133, -12.020808219909668, -10.266100883483887, -8.511393547058105, -6.756687164306641, -5.001979827880859, -3.2472763061523438, -1.4925692081451416, 0.26213788986206055, 2.0168447494506836, 3.771552085876465, 5.526259422302246, 7.280965805053711, 9.035673141479492, 10.790380477905273, 12.545087814331055, 14.299795150756836, 16.054500579833984, 17.809207916259766, 19.563915252685547, 21.318622589111328, 23.07332992553711, 24.82803726196289, 26.582744598388672, 28.337451934814453, 30.092159271240234, 31.846866607666016, 33.6015739440918, 35.35627746582031, 37.110984802246094, 38.865692138671875, 40.620399475097656, 42.37510681152344, 44.12981414794922, 45.884521484375, 47.63922882080078, 49.39393615722656, 51.148643493652344, 52.903350830078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 7.0, 3.0, 8.0, 5.0, 12.0, 9.0, 9.0, 16.0, 15.0, 22.0, 14.0, 24.0, 24.0, 30.0, 27.0, 35.0, 46.0, 46.0, 34.0, 31.0, 33.0, 41.0, 52.0, 33.0, 43.0, 44.0, 38.0, 25.0, 29.0, 34.0, 32.0, 27.0, 21.0, 17.0, 14.0, 17.0, 21.0, 8.0, 8.0, 12.0, 4.0, 12.0, 4.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.15023422241211, -52.22712326049805, -50.30400848388672, -48.380897521972656, -46.457786560058594, -44.53467559814453, -42.61156463623047, -40.68844985961914, -38.76533889770508, -36.842227935791016, -34.91911315917969, -32.996002197265625, -31.072891235351562, -29.1497802734375, -27.226667404174805, -25.30355453491211, -23.380443572998047, -21.457332611083984, -19.53421974182129, -17.611106872558594, -15.687995910644531, -13.764883995056152, -11.841772079467773, -9.918660163879395, -7.995548248291016, -6.072436332702637, -4.149324417114258, -2.226212501525879, -0.3031005859375, 1.620011329650879, 3.543123245239258, 5.466235160827637, 7.389350891113281, 9.31246280670166, 11.235574722290039, 13.158686637878418, 15.081798553466797, 17.00490951538086, 18.928022384643555, 20.85113525390625, 22.774246215820312, 24.697357177734375, 26.62047004699707, 28.543582916259766, 30.466693878173828, 32.38980484008789, 34.31291961669922, 36.23603057861328, 38.159141540527344, 40.082252502441406, 42.00536346435547, 43.9284782409668, 45.85158920288086, 47.77470016479492, 49.69781494140625, 51.62092590332031, 53.544036865234375, 55.46714782714844, 57.3902587890625, 59.31337356567383, 61.23648452758789, 63.15959548950195, 65.08271026611328, 67.00582122802734, 68.9289321899414]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 13.0, 14.0, 33.0, 43.0, 96.0, 114.0, 161.0, 321.0, 391.0, 664.0, 1039.0, 1594.0, 2375.0, 3608.0, 5380.0, 8190.0, 12297.0, 17823.0, 25515.0, 36011.0, 47812.0, 62428.0, 77262.0, 89817.0, 97215.0, 99835.0, 95552.0, 85812.0, 72442.0, 57470.0, 43955.0, 32337.0, 22960.0, 15866.0, 10802.0, 7350.0, 4857.0, 3199.0, 2036.0, 1370.0, 865.0, 593.0, 372.0, 228.0, 152.0, 105.0, 62.0, 47.0, 28.0, 15.0, 12.0, 4.0, 9.0, 2.0, 0.0, 1.0, 2.0], "bins": [-25.859375, -25.059814453125, -24.26025390625, -23.460693359375, -22.6611328125, -21.861572265625, -21.06201171875, -20.262451171875, -19.462890625, -18.663330078125, -17.86376953125, -17.064208984375, -16.2646484375, -15.465087890625, -14.66552734375, -13.865966796875, -13.06640625, -12.266845703125, -11.46728515625, -10.667724609375, -9.8681640625, -9.068603515625, -8.26904296875, -7.469482421875, -6.669921875, -5.870361328125, -5.07080078125, -4.271240234375, -3.4716796875, -2.672119140625, -1.87255859375, -1.072998046875, -0.2734375, 0.526123046875, 1.32568359375, 2.125244140625, 2.9248046875, 3.724365234375, 4.52392578125, 5.323486328125, 6.123046875, 6.922607421875, 7.72216796875, 8.521728515625, 9.3212890625, 10.120849609375, 10.92041015625, 11.719970703125, 12.51953125, 13.319091796875, 14.11865234375, 14.918212890625, 15.7177734375, 16.517333984375, 17.31689453125, 18.116455078125, 18.916015625, 19.715576171875, 20.51513671875, 21.314697265625, 22.1142578125, 22.913818359375, 23.71337890625, 24.512939453125, 25.3125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 7.0, 5.0, 5.0, 5.0, 12.0, 11.0, 11.0, 16.0, 14.0, 20.0, 19.0, 24.0, 19.0, 34.0, 28.0, 39.0, 44.0, 42.0, 34.0, 29.0, 35.0, 43.0, 54.0, 30.0, 44.0, 43.0, 34.0, 24.0, 34.0, 30.0, 37.0, 26.0, 17.0, 15.0, 16.0, 18.0, 17.0, 9.0, 10.0, 9.0, 5.0, 12.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.53125, -52.58544921875, -50.6396484375, -48.69384765625, -46.748046875, -44.80224609375, -42.8564453125, -40.91064453125, -38.96484375, -37.01904296875, -35.0732421875, -33.12744140625, -31.181640625, -29.23583984375, -27.2900390625, -25.34423828125, -23.3984375, -21.45263671875, -19.5068359375, -17.56103515625, -15.615234375, -13.66943359375, -11.7236328125, -9.77783203125, -7.83203125, -5.88623046875, -3.9404296875, -1.99462890625, -0.048828125, 1.89697265625, 3.8427734375, 5.78857421875, 7.734375, 9.68017578125, 11.6259765625, 13.57177734375, 15.517578125, 17.46337890625, 19.4091796875, 21.35498046875, 23.30078125, 25.24658203125, 27.1923828125, 29.13818359375, 31.083984375, 33.02978515625, 34.9755859375, 36.92138671875, 38.8671875, 40.81298828125, 42.7587890625, 44.70458984375, 46.650390625, 48.59619140625, 50.5419921875, 52.48779296875, 54.43359375, 56.37939453125, 58.3251953125, 60.27099609375, 62.216796875, 64.16259765625, 66.1083984375, 68.05419921875, 70.0]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 14.0, 25.0, 28.0, 59.0, 104.0, 153.0, 255.0, 385.0, 690.0, 1088.0, 1680.0, 2699.0, 4448.0, 7208.0, 11488.0, 18255.0, 30632.0, 290415.0, 589939.0, 35324.0, 20022.0, 12766.0, 7962.0, 4826.0, 3078.0, 1957.0, 1142.0, 705.0, 476.0, 281.0, 173.0, 102.0, 68.0, 34.0, 32.0, 7.0, 10.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-65.5, -63.4599609375, -61.419921875, -59.3798828125, -57.33984375, -55.2998046875, -53.259765625, -51.2197265625, -49.1796875, -47.1396484375, -45.099609375, -43.0595703125, -41.01953125, -38.9794921875, -36.939453125, -34.8994140625, -32.859375, -30.8193359375, -28.779296875, -26.7392578125, -24.69921875, -22.6591796875, -20.619140625, -18.5791015625, -16.5390625, -14.4990234375, -12.458984375, -10.4189453125, -8.37890625, -6.3388671875, -4.298828125, -2.2587890625, -0.21875, 1.8212890625, 3.861328125, 5.9013671875, 7.94140625, 9.9814453125, 12.021484375, 14.0615234375, 16.1015625, 18.1416015625, 20.181640625, 22.2216796875, 24.26171875, 26.3017578125, 28.341796875, 30.3818359375, 32.421875, 34.4619140625, 36.501953125, 38.5419921875, 40.58203125, 42.6220703125, 44.662109375, 46.7021484375, 48.7421875, 50.7822265625, 52.822265625, 54.8623046875, 56.90234375, 58.9423828125, 60.982421875, 63.0224609375, 65.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 8.0, 5.0, 9.0, 8.0, 11.0, 13.0, 26.0, 22.0, 19.0, 23.0, 21.0, 19.0, 33.0, 30.0, 29.0, 25.0, 36.0, 40.0, 27.0, 19.0, 37.0, 43.0, 35.0, 44.0, 39.0, 39.0, 49.0, 33.0, 33.0, 32.0, 26.0, 18.0, 15.0, 29.0, 20.0, 16.0, 18.0, 7.0, 12.0, 7.0, 6.0, 6.0, 3.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.65625, -43.236328125, -41.81640625, -40.396484375, -38.9765625, -37.556640625, -36.13671875, -34.716796875, -33.296875, -31.876953125, -30.45703125, -29.037109375, -27.6171875, -26.197265625, -24.77734375, -23.357421875, -21.9375, -20.517578125, -19.09765625, -17.677734375, -16.2578125, -14.837890625, -13.41796875, -11.998046875, -10.578125, -9.158203125, -7.73828125, -6.318359375, -4.8984375, -3.478515625, -2.05859375, -0.638671875, 0.78125, 2.201171875, 3.62109375, 5.041015625, 6.4609375, 7.880859375, 9.30078125, 10.720703125, 12.140625, 13.560546875, 14.98046875, 16.400390625, 17.8203125, 19.240234375, 20.66015625, 22.080078125, 23.5, 24.919921875, 26.33984375, 27.759765625, 29.1796875, 30.599609375, 32.01953125, 33.439453125, 34.859375, 36.279296875, 37.69921875, 39.119140625, 40.5390625, 41.958984375, 43.37890625, 44.798828125, 46.21875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 11.0, 17.0, 16.0, 20.0, 34.0, 30.0, 55.0, 73.0, 93.0, 128.0, 201.0, 288.0, 414.0, 567.0, 832.0, 1202.0, 1978.0, 2967.0, 4580.0, 7203.0, 12228.0, 21373.0, 49879.0, 712994.0, 161159.0, 28935.0, 15589.0, 9273.0, 5800.0, 3625.0, 2216.0, 1541.0, 1018.0, 695.0, 436.0, 308.0, 208.0, 150.0, 138.0, 78.0, 55.0, 46.0, 27.0, 21.0, 12.0, 11.0, 12.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.15234375, -4.0126953125, -3.873046875, -3.7333984375, -3.59375, -3.4541015625, -3.314453125, -3.1748046875, -3.03515625, -2.8955078125, -2.755859375, -2.6162109375, -2.4765625, -2.3369140625, -2.197265625, -2.0576171875, -1.91796875, -1.7783203125, -1.638671875, -1.4990234375, -1.359375, -1.2197265625, -1.080078125, -0.9404296875, -0.80078125, -0.6611328125, -0.521484375, -0.3818359375, -0.2421875, -0.1025390625, 0.037109375, 0.1767578125, 0.31640625, 0.4560546875, 0.595703125, 0.7353515625, 0.875, 1.0146484375, 1.154296875, 1.2939453125, 1.43359375, 1.5732421875, 1.712890625, 1.8525390625, 1.9921875, 2.1318359375, 2.271484375, 2.4111328125, 2.55078125, 2.6904296875, 2.830078125, 2.9697265625, 3.109375, 3.2490234375, 3.388671875, 3.5283203125, 3.66796875, 3.8076171875, 3.947265625, 4.0869140625, 4.2265625, 4.3662109375, 4.505859375, 4.6455078125, 4.78515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 5.0, 8.0, 13.0, 12.0, 11.0, 15.0, 14.0, 31.0, 29.0, 27.0, 37.0, 40.0, 30.0, 56.0, 51.0, 72.0, 52.0, 56.0, 54.0, 43.0, 42.0, 50.0, 34.0, 33.0, 35.0, 29.0, 22.0, 21.0, 17.0, 14.0, 12.0, 8.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007371902465820312, -0.0007062405347824097, -0.0006752908229827881, -0.0006443411111831665, -0.0006133913993835449, -0.0005824416875839233, -0.0005514919757843018, -0.0005205422639846802, -0.0004895925521850586, -0.000458642840385437, -0.00042769312858581543, -0.00039674341678619385, -0.00036579370498657227, -0.0003348439931869507, -0.0003038942813873291, -0.0002729445695877075, -0.00024199485778808594, -0.00021104514598846436, -0.00018009543418884277, -0.0001491457223892212, -0.00011819601058959961, -8.724629878997803e-05, -5.6296586990356445e-05, -2.5346875190734863e-05, 5.602836608886719e-06, 3.65525484085083e-05, 6.750226020812988e-05, 9.845197200775146e-05, 0.00012940168380737305, 0.00016035139560699463, 0.0001913011074066162, 0.0002222508192062378, 0.0002532005310058594, 0.00028415024280548096, 0.00031509995460510254, 0.0003460496664047241, 0.0003769993782043457, 0.0004079490900039673, 0.00043889880180358887, 0.00046984851360321045, 0.000500798225402832, 0.0005317479372024536, 0.0005626976490020752, 0.0005936473608016968, 0.0006245970726013184, 0.0006555467844009399, 0.0006864964962005615, 0.0007174462080001831, 0.0007483959197998047, 0.0007793456315994263, 0.0008102953433990479, 0.0008412450551986694, 0.000872194766998291, 0.0009031444787979126, 0.0009340941905975342, 0.0009650439023971558, 0.0009959936141967773, 0.001026943325996399, 0.0010578930377960205, 0.001088842749595642, 0.0011197924613952637, 0.0011507421731948853, 0.0011816918849945068, 0.0012126415967941284, 0.00124359130859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 7.0, 11.0, 18.0, 36.0, 47.0, 44.0, 72.0, 129.0, 169.0, 329.0, 462.0, 918.0, 1639.0, 2957.0, 5474.0, 9860.0, 18464.0, 33899.0, 60495.0, 99951.0, 144459.0, 173684.0, 167542.0, 130692.0, 84932.0, 50667.0, 27940.0, 15214.0, 8239.0, 4471.0, 2399.0, 1373.0, 727.0, 415.0, 285.0, 172.0, 115.0, 80.0, 59.0, 30.0, 19.0, 19.0, 6.0, 11.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.1640625, -3.070556640625, -2.97705078125, -2.883544921875, -2.7900390625, -2.696533203125, -2.60302734375, -2.509521484375, -2.416015625, -2.322509765625, -2.22900390625, -2.135498046875, -2.0419921875, -1.948486328125, -1.85498046875, -1.761474609375, -1.66796875, -1.574462890625, -1.48095703125, -1.387451171875, -1.2939453125, -1.200439453125, -1.10693359375, -1.013427734375, -0.919921875, -0.826416015625, -0.73291015625, -0.639404296875, -0.5458984375, -0.452392578125, -0.35888671875, -0.265380859375, -0.171875, -0.078369140625, 0.01513671875, 0.108642578125, 0.2021484375, 0.295654296875, 0.38916015625, 0.482666015625, 0.576171875, 0.669677734375, 0.76318359375, 0.856689453125, 0.9501953125, 1.043701171875, 1.13720703125, 1.230712890625, 1.32421875, 1.417724609375, 1.51123046875, 1.604736328125, 1.6982421875, 1.791748046875, 1.88525390625, 1.978759765625, 2.072265625, 2.165771484375, 2.25927734375, 2.352783203125, 2.4462890625, 2.539794921875, 2.63330078125, 2.726806640625, 2.8203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 11.0, 14.0, 13.0, 13.0, 27.0, 13.0, 30.0, 27.0, 18.0, 29.0, 37.0, 24.0, 39.0, 31.0, 33.0, 37.0, 40.0, 48.0, 44.0, 45.0, 45.0, 44.0, 31.0, 22.0, 43.0, 32.0, 22.0, 28.0, 24.0, 9.0, 16.0, 13.0, 11.0, 14.0, 20.0, 5.0, 4.0, 8.0, 8.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.88916015625, -0.8568801879882812, -0.8246002197265625, -0.7923202514648438, -0.760040283203125, -0.7277603149414062, -0.6954803466796875, -0.6632003784179688, -0.63092041015625, -0.5986404418945312, -0.5663604736328125, -0.5340805053710938, -0.501800537109375, -0.46952056884765625, -0.4372406005859375, -0.40496063232421875, -0.3726806640625, -0.34040069580078125, -0.3081207275390625, -0.27584075927734375, -0.243560791015625, -0.21128082275390625, -0.1790008544921875, -0.14672088623046875, -0.11444091796875, -0.08216094970703125, -0.0498809814453125, -0.01760101318359375, 0.014678955078125, 0.04695892333984375, 0.0792388916015625, 0.11151885986328125, 0.143798828125, 0.17607879638671875, 0.2083587646484375, 0.24063873291015625, 0.272918701171875, 0.30519866943359375, 0.3374786376953125, 0.36975860595703125, 0.40203857421875, 0.43431854248046875, 0.4665985107421875, 0.49887847900390625, 0.531158447265625, 0.5634384155273438, 0.5957183837890625, 0.6279983520507812, 0.6602783203125, 0.6925582885742188, 0.7248382568359375, 0.7571182250976562, 0.789398193359375, 0.8216781616210938, 0.8539581298828125, 0.8862380981445312, 0.91851806640625, 0.9507980346679688, 0.9830780029296875, 1.0153579711914062, 1.047637939453125, 1.0799179077148438, 1.1121978759765625, 1.1444778442382812, 1.1767578125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 3.0, 4.0, 5.0, 14.0, 12.0, 5.0, 14.0, 16.0, 22.0, 16.0, 13.0, 29.0, 25.0, 29.0, 24.0, 32.0, 30.0, 40.0, 45.0, 36.0, 35.0, 31.0, 54.0, 45.0, 37.0, 25.0, 17.0, 34.0, 29.0, 27.0, 34.0, 23.0, 24.0, 23.0, 29.0, 15.0, 18.0, 12.0, 15.0, 10.0, 7.0, 15.0, 7.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-61.922672271728516, -60.123634338378906, -58.32460021972656, -56.52556228637695, -54.726524353027344, -52.927486419677734, -51.128448486328125, -49.32941436767578, -47.53037643432617, -45.73133850097656, -43.93230438232422, -42.13326644897461, -40.334228515625, -38.53519058227539, -36.73615264892578, -34.93711853027344, -33.13808059692383, -31.33904266357422, -29.540006637573242, -27.740970611572266, -25.941932678222656, -24.142894744873047, -22.34385871887207, -20.544822692871094, -18.745784759521484, -16.946746826171875, -15.147710800170898, -13.348673820495605, -11.549636840820312, -9.75059986114502, -7.951562881469727, -6.152525901794434, -4.353485107421875, -2.554448127746582, -0.7554111480712891, 1.043625831604004, 2.842662811279297, 4.64169979095459, 6.440736770629883, 8.239773750305176, 10.038810729980469, 11.837847709655762, 13.636884689331055, 15.435921669006348, 17.23495864868164, 19.03399658203125, 20.833032608032227, 22.632068634033203, 24.431106567382812, 26.230144500732422, 28.0291805267334, 29.828216552734375, 31.627254486083984, 33.426292419433594, 35.22532653808594, 37.02436447143555, 38.823402404785156, 40.622440338134766, 42.421478271484375, 44.22051239013672, 46.01955032348633, 47.81858825683594, 49.61762237548828, 51.41666030883789, 53.2156982421875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 5.0, 6.0, 9.0, 6.0, 12.0, 12.0, 21.0, 16.0, 12.0, 19.0, 24.0, 24.0, 30.0, 31.0, 35.0, 46.0, 41.0, 38.0, 27.0, 30.0, 41.0, 52.0, 36.0, 48.0, 31.0, 41.0, 28.0, 30.0, 39.0, 24.0, 24.0, 21.0, 16.0, 12.0, 23.0, 11.0, 14.0, 6.0, 15.0, 8.0, 7.0, 5.0, 5.0, 7.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.10070037841797, -52.170501708984375, -50.24030303955078, -48.31010818481445, -46.37990951538086, -44.449710845947266, -42.51951599121094, -40.589317321777344, -38.65911865234375, -36.728919982910156, -34.79872131347656, -32.868526458740234, -30.93832778930664, -29.008129119873047, -27.077932357788086, -25.147735595703125, -23.21753692626953, -21.287338256835938, -19.357141494750977, -17.426944732666016, -15.496746063232422, -13.566548347473145, -11.636350631713867, -9.70615291595459, -7.7759552001953125, -5.845757484436035, -3.915559768676758, -1.9853620529174805, -0.055164337158203125, 1.8750333786010742, 3.8052310943603516, 5.735428810119629, 7.665626525878906, 9.595824241638184, 11.526021957397461, 13.456219673156738, 15.386417388916016, 17.31661605834961, 19.24681282043457, 21.17700958251953, 23.107208251953125, 25.03740692138672, 26.96760368347168, 28.89780044555664, 30.827999114990234, 32.75819778442383, 34.688392639160156, 36.61859130859375, 38.548789978027344, 40.47898864746094, 42.40918731689453, 44.33938217163086, 46.26958084106445, 48.19977951049805, 50.129974365234375, 52.06017303466797, 53.99037170410156, 55.920570373535156, 57.85076904296875, 59.78096389770508, 61.71116256713867, 63.641361236572266, 65.5715560913086, 67.50175476074219, 69.43195343017578]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 11.0, 23.0, 32.0, 45.0, 93.0, 154.0, 263.0, 482.0, 836.0, 1606.0, 2889.0, 5478.0, 10367.0, 18643.0, 32824.0, 54837.0, 85412.0, 118716.0, 145552.0, 151630.0, 136410.0, 105598.0, 72402.0, 45511.0, 26568.0, 14945.0, 7973.0, 4194.0, 2243.0, 1265.0, 652.0, 363.0, 209.0, 127.0, 76.0, 51.0, 33.0, 19.0, 10.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0, -67.8330078125, -65.666015625, -63.4990234375, -61.33203125, -59.1650390625, -56.998046875, -54.8310546875, -52.6640625, -50.4970703125, -48.330078125, -46.1630859375, -43.99609375, -41.8291015625, -39.662109375, -37.4951171875, -35.328125, -33.1611328125, -30.994140625, -28.8271484375, -26.66015625, -24.4931640625, -22.326171875, -20.1591796875, -17.9921875, -15.8251953125, -13.658203125, -11.4912109375, -9.32421875, -7.1572265625, -4.990234375, -2.8232421875, -0.65625, 1.5107421875, 3.677734375, 5.8447265625, 8.01171875, 10.1787109375, 12.345703125, 14.5126953125, 16.6796875, 18.8466796875, 21.013671875, 23.1806640625, 25.34765625, 27.5146484375, 29.681640625, 31.8486328125, 34.015625, 36.1826171875, 38.349609375, 40.5166015625, 42.68359375, 44.8505859375, 47.017578125, 49.1845703125, 51.3515625, 53.5185546875, 55.685546875, 57.8525390625, 60.01953125, 62.1865234375, 64.353515625, 66.5205078125, 68.6875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 6.0, 9.0, 5.0, 10.0, 14.0, 19.0, 17.0, 13.0, 22.0, 19.0, 28.0, 26.0, 32.0, 32.0, 47.0, 36.0, 43.0, 28.0, 35.0, 39.0, 44.0, 45.0, 36.0, 42.0, 40.0, 29.0, 34.0, 30.0, 34.0, 24.0, 16.0, 17.0, 12.0, 20.0, 14.0, 12.0, 9.0, 14.0, 8.0, 7.0, 4.0, 7.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.65625, -49.81591796875, -47.9755859375, -46.13525390625, -44.294921875, -42.45458984375, -40.6142578125, -38.77392578125, -36.93359375, -35.09326171875, -33.2529296875, -31.41259765625, -29.572265625, -27.73193359375, -25.8916015625, -24.05126953125, -22.2109375, -20.37060546875, -18.5302734375, -16.68994140625, -14.849609375, -13.00927734375, -11.1689453125, -9.32861328125, -7.48828125, -5.64794921875, -3.8076171875, -1.96728515625, -0.126953125, 1.71337890625, 3.5537109375, 5.39404296875, 7.234375, 9.07470703125, 10.9150390625, 12.75537109375, 14.595703125, 16.43603515625, 18.2763671875, 20.11669921875, 21.95703125, 23.79736328125, 25.6376953125, 27.47802734375, 29.318359375, 31.15869140625, 32.9990234375, 34.83935546875, 36.6796875, 38.52001953125, 40.3603515625, 42.20068359375, 44.041015625, 45.88134765625, 47.7216796875, 49.56201171875, 51.40234375, 53.24267578125, 55.0830078125, 56.92333984375, 58.763671875, 60.60400390625, 62.4443359375, 64.28466796875, 66.125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 5.0, 10.0, 6.0, 10.0, 10.0, 21.0, 43.0, 56.0, 84.0, 132.0, 191.0, 305.0, 509.0, 760.0, 1236.0, 1933.0, 3208.0, 5043.0, 7806.0, 12221.0, 18696.0, 28069.0, 40598.0, 56324.0, 75794.0, 93522.0, 107699.0, 114245.0, 109883.0, 97445.0, 79486.0, 61035.0, 43802.0, 30917.0, 20492.0, 13426.0, 8664.0, 5431.0, 3533.0, 2221.0, 1369.0, 841.0, 512.0, 332.0, 221.0, 141.0, 89.0, 62.0, 47.0, 21.0, 20.0, 13.0, 10.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-49.96875, -48.33642578125, -46.7041015625, -45.07177734375, -43.439453125, -41.80712890625, -40.1748046875, -38.54248046875, -36.91015625, -35.27783203125, -33.6455078125, -32.01318359375, -30.380859375, -28.74853515625, -27.1162109375, -25.48388671875, -23.8515625, -22.21923828125, -20.5869140625, -18.95458984375, -17.322265625, -15.68994140625, -14.0576171875, -12.42529296875, -10.79296875, -9.16064453125, -7.5283203125, -5.89599609375, -4.263671875, -2.63134765625, -0.9990234375, 0.63330078125, 2.265625, 3.89794921875, 5.5302734375, 7.16259765625, 8.794921875, 10.42724609375, 12.0595703125, 13.69189453125, 15.32421875, 16.95654296875, 18.5888671875, 20.22119140625, 21.853515625, 23.48583984375, 25.1181640625, 26.75048828125, 28.3828125, 30.01513671875, 31.6474609375, 33.27978515625, 34.912109375, 36.54443359375, 38.1767578125, 39.80908203125, 41.44140625, 43.07373046875, 44.7060546875, 46.33837890625, 47.970703125, 49.60302734375, 51.2353515625, 52.86767578125, 54.5]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 12.0, 4.0, 14.0, 13.0, 11.0, 21.0, 10.0, 25.0, 18.0, 25.0, 19.0, 25.0, 26.0, 41.0, 34.0, 35.0, 38.0, 36.0, 47.0, 45.0, 59.0, 41.0, 40.0, 43.0, 42.0, 32.0, 35.0, 30.0, 29.0, 17.0, 20.0, 29.0, 10.0, 14.0, 8.0, 8.0, 12.0, 5.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.625, -36.40673828125, -35.1884765625, -33.97021484375, -32.751953125, -31.53369140625, -30.3154296875, -29.09716796875, -27.87890625, -26.66064453125, -25.4423828125, -24.22412109375, -23.005859375, -21.78759765625, -20.5693359375, -19.35107421875, -18.1328125, -16.91455078125, -15.6962890625, -14.47802734375, -13.259765625, -12.04150390625, -10.8232421875, -9.60498046875, -8.38671875, -7.16845703125, -5.9501953125, -4.73193359375, -3.513671875, -2.29541015625, -1.0771484375, 0.14111328125, 1.359375, 2.57763671875, 3.7958984375, 5.01416015625, 6.232421875, 7.45068359375, 8.6689453125, 9.88720703125, 11.10546875, 12.32373046875, 13.5419921875, 14.76025390625, 15.978515625, 17.19677734375, 18.4150390625, 19.63330078125, 20.8515625, 22.06982421875, 23.2880859375, 24.50634765625, 25.724609375, 26.94287109375, 28.1611328125, 29.37939453125, 30.59765625, 31.81591796875, 33.0341796875, 34.25244140625, 35.470703125, 36.68896484375, 37.9072265625, 39.12548828125, 40.34375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 11.0, 13.0, 12.0, 36.0, 27.0, 55.0, 85.0, 150.0, 223.0, 356.0, 598.0, 1078.0, 2152.0, 4187.0, 8555.0, 17692.0, 35574.0, 69833.0, 123960.0, 181024.0, 202795.0, 169482.0, 109806.0, 60399.0, 30620.0, 14842.0, 7153.0, 3582.0, 1843.0, 1006.0, 572.0, 318.0, 193.0, 123.0, 62.0, 48.0, 25.0, 26.0, 13.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.234375, -29.30078125, -28.3671875, -27.43359375, -26.5, -25.56640625, -24.6328125, -23.69921875, -22.765625, -21.83203125, -20.8984375, -19.96484375, -19.03125, -18.09765625, -17.1640625, -16.23046875, -15.296875, -14.36328125, -13.4296875, -12.49609375, -11.5625, -10.62890625, -9.6953125, -8.76171875, -7.828125, -6.89453125, -5.9609375, -5.02734375, -4.09375, -3.16015625, -2.2265625, -1.29296875, -0.359375, 0.57421875, 1.5078125, 2.44140625, 3.375, 4.30859375, 5.2421875, 6.17578125, 7.109375, 8.04296875, 8.9765625, 9.91015625, 10.84375, 11.77734375, 12.7109375, 13.64453125, 14.578125, 15.51171875, 16.4453125, 17.37890625, 18.3125, 19.24609375, 20.1796875, 21.11328125, 22.046875, 22.98046875, 23.9140625, 24.84765625, 25.78125, 26.71484375, 27.6484375, 28.58203125, 29.515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 10.0, 11.0, 8.0, 8.0, 18.0, 25.0, 34.0, 33.0, 54.0, 60.0, 65.0, 72.0, 71.0, 91.0, 69.0, 83.0, 61.0, 49.0, 40.0, 45.0, 33.0, 15.0, 14.0, 14.0, 7.0, 8.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.005054473876953125, -0.00494047999382019, -0.004826486110687256, -0.004712492227554321, -0.004598498344421387, -0.004484504461288452, -0.004370510578155518, -0.004256516695022583, -0.0041425228118896484, -0.004028528928756714, -0.003914535045623779, -0.0038005411624908447, -0.00368654727935791, -0.0035725533962249756, -0.003458559513092041, -0.0033445656299591064, -0.003230571746826172, -0.0031165778636932373, -0.0030025839805603027, -0.002888590097427368, -0.0027745962142944336, -0.002660602331161499, -0.0025466084480285645, -0.00243261456489563, -0.0023186206817626953, -0.0022046267986297607, -0.002090632915496826, -0.0019766390323638916, -0.001862645149230957, -0.0017486512660980225, -0.0016346573829650879, -0.0015206634998321533, -0.0014066696166992188, -0.0012926757335662842, -0.0011786818504333496, -0.001064687967300415, -0.0009506940841674805, -0.0008367002010345459, -0.0007227063179016113, -0.0006087124347686768, -0.0004947185516357422, -0.0003807246685028076, -0.00026673078536987305, -0.00015273690223693848, -3.8743019104003906e-05, 7.525086402893066e-05, 0.00018924474716186523, 0.0003032386302947998, 0.0004172325134277344, 0.0005312263965606689, 0.0006452202796936035, 0.0007592141628265381, 0.0008732080459594727, 0.0009872019290924072, 0.0011011958122253418, 0.0012151896953582764, 0.001329183578491211, 0.0014431774616241455, 0.00155717134475708, 0.0016711652278900146, 0.0017851591110229492, 0.0018991529941558838, 0.0020131468772888184, 0.002127140760421753, 0.0022411346435546875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 6.0, 8.0, 7.0, 11.0, 18.0, 26.0, 46.0, 53.0, 91.0, 156.0, 268.0, 369.0, 628.0, 1035.0, 1678.0, 2683.0, 4770.0, 8837.0, 16130.0, 29619.0, 51987.0, 86848.0, 130224.0, 165309.0, 170468.0, 141135.0, 98507.0, 60199.0, 34386.0, 18875.0, 10412.0, 5687.0, 3243.0, 1931.0, 1108.0, 647.0, 419.0, 254.0, 147.0, 109.0, 95.0, 44.0, 27.0, 22.0, 12.0, 8.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.734375, -24.88037109375, -24.0263671875, -23.17236328125, -22.318359375, -21.46435546875, -20.6103515625, -19.75634765625, -18.90234375, -18.04833984375, -17.1943359375, -16.34033203125, -15.486328125, -14.63232421875, -13.7783203125, -12.92431640625, -12.0703125, -11.21630859375, -10.3623046875, -9.50830078125, -8.654296875, -7.80029296875, -6.9462890625, -6.09228515625, -5.23828125, -4.38427734375, -3.5302734375, -2.67626953125, -1.822265625, -0.96826171875, -0.1142578125, 0.73974609375, 1.59375, 2.44775390625, 3.3017578125, 4.15576171875, 5.009765625, 5.86376953125, 6.7177734375, 7.57177734375, 8.42578125, 9.27978515625, 10.1337890625, 10.98779296875, 11.841796875, 12.69580078125, 13.5498046875, 14.40380859375, 15.2578125, 16.11181640625, 16.9658203125, 17.81982421875, 18.673828125, 19.52783203125, 20.3818359375, 21.23583984375, 22.08984375, 22.94384765625, 23.7978515625, 24.65185546875, 25.505859375, 26.35986328125, 27.2138671875, 28.06787109375, 28.921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 1.0, 6.0, 3.0, 12.0, 17.0, 25.0, 24.0, 29.0, 38.0, 50.0, 65.0, 70.0, 84.0, 68.0, 64.0, 84.0, 55.0, 56.0, 53.0, 42.0, 42.0, 17.0, 26.0, 14.0, 16.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.4609375, -12.9974365234375, -12.533935546875, -12.0704345703125, -11.60693359375, -11.1434326171875, -10.679931640625, -10.2164306640625, -9.7529296875, -9.2894287109375, -8.825927734375, -8.3624267578125, -7.89892578125, -7.4354248046875, -6.971923828125, -6.5084228515625, -6.044921875, -5.5814208984375, -5.117919921875, -4.6544189453125, -4.19091796875, -3.7274169921875, -3.263916015625, -2.8004150390625, -2.3369140625, -1.8734130859375, -1.409912109375, -0.9464111328125, -0.48291015625, -0.0194091796875, 0.444091796875, 0.9075927734375, 1.37109375, 1.8345947265625, 2.298095703125, 2.7615966796875, 3.22509765625, 3.6885986328125, 4.152099609375, 4.6156005859375, 5.0791015625, 5.5426025390625, 6.006103515625, 6.4696044921875, 6.93310546875, 7.3966064453125, 7.860107421875, 8.3236083984375, 8.787109375, 9.2506103515625, 9.714111328125, 10.1776123046875, 10.64111328125, 11.1046142578125, 11.568115234375, 12.0316162109375, 12.4951171875, 12.9586181640625, 13.422119140625, 13.8856201171875, 14.34912109375, 14.8126220703125, 15.276123046875, 15.7396240234375, 16.203125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 9.0, 10.0, 9.0, 10.0, 16.0, 22.0, 18.0, 22.0, 31.0, 27.0, 32.0, 37.0, 37.0, 35.0, 42.0, 47.0, 34.0, 50.0, 45.0, 38.0, 24.0, 40.0, 27.0, 23.0, 27.0, 36.0, 25.0, 33.0, 31.0, 25.0, 21.0, 21.0, 19.0, 10.0, 14.0, 8.0, 7.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-60.84510803222656, -58.98116683959961, -57.11722946166992, -55.25328826904297, -53.389347076416016, -51.52540588378906, -49.661468505859375, -47.79752731323242, -45.93358612060547, -44.069644927978516, -42.20570755004883, -40.341766357421875, -38.47782516479492, -36.61388397216797, -34.74994659423828, -32.88600540161133, -31.02206802368164, -29.15812873840332, -27.294187545776367, -25.430248260498047, -23.566307067871094, -21.702367782592773, -19.838428497314453, -17.9744873046875, -16.11054801940918, -14.246607780456543, -12.382667541503906, -10.518728256225586, -8.65478801727295, -6.7908477783203125, -4.926908493041992, -3.0629682540893555, -1.1990318298339844, 0.6649081707000732, 2.528848171234131, 4.392787933349609, 6.256728172302246, 8.120668411254883, 9.984607696533203, 11.84854793548584, 13.712488174438477, 15.576428413391113, 17.44036865234375, 19.30430793762207, 21.16824722290039, 23.032188415527344, 24.896127700805664, 26.760066986083984, 28.624008178710938, 30.487947463989258, 32.35188674926758, 34.21582794189453, 36.079769134521484, 37.94371032714844, 39.807647705078125, 41.67158889770508, 43.53553009033203, 45.399471282958984, 47.26340866088867, 49.127349853515625, 50.99129104614258, 52.85523223876953, 54.71916961669922, 56.58311080932617, 58.44704818725586]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 4.0, 5.0, 2.0, 9.0, 11.0, 16.0, 13.0, 9.0, 19.0, 18.0, 32.0, 31.0, 25.0, 37.0, 32.0, 25.0, 42.0, 36.0, 36.0, 40.0, 40.0, 36.0, 32.0, 41.0, 33.0, 43.0, 41.0, 30.0, 20.0, 32.0, 35.0, 24.0, 26.0, 16.0, 14.0, 13.0, 14.0, 9.0, 14.0, 10.0, 3.0, 11.0, 8.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-54.64284133911133, -52.721534729003906, -50.800228118896484, -48.87892150878906, -46.95761489868164, -45.03630828857422, -43.1150016784668, -41.193695068359375, -39.27238845825195, -37.35108184814453, -35.42977523803711, -33.50846862792969, -31.587162017822266, -29.665855407714844, -27.744548797607422, -25.8232421875, -23.901935577392578, -21.980628967285156, -20.059322357177734, -18.138015747070312, -16.21670913696289, -14.295402526855469, -12.374095916748047, -10.452789306640625, -8.531482696533203, -6.610176086425781, -4.688869476318359, -2.7675628662109375, -0.8462562561035156, 1.0750503540039062, 2.996356964111328, 4.91766357421875, 6.838966369628906, 8.760272979736328, 10.68157958984375, 12.602886199951172, 14.524192810058594, 16.445499420166016, 18.366806030273438, 20.28811264038086, 22.20941925048828, 24.130725860595703, 26.052032470703125, 27.973339080810547, 29.89464569091797, 31.81595230102539, 33.73725891113281, 35.658565521240234, 37.579872131347656, 39.50117874145508, 41.4224853515625, 43.34379196166992, 45.265098571777344, 47.186405181884766, 49.10771179199219, 51.02901840209961, 52.95032501220703, 54.87163162231445, 56.792938232421875, 58.7142448425293, 60.63555145263672, 62.55685806274414, 64.47816467285156, 66.39947509765625, 68.3207778930664]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 12.0, 17.0, 20.0, 46.0, 59.0, 123.0, 174.0, 298.0, 485.0, 803.0, 1253.0, 2126.0, 3530.0, 5505.0, 9112.0, 14945.0, 24060.0, 38424.0, 60402.0, 92812.0, 140249.0, 203516.0, 280648.0, 364383.0, 438720.0, 476999.0, 470202.0, 420598.0, 343168.0, 260727.0, 185471.0, 126067.0, 83052.0, 54487.0, 34546.0, 21552.0, 13518.0, 8436.0, 5191.0, 3225.0, 2025.0, 1231.0, 734.0, 498.0, 314.0, 202.0, 125.0, 65.0, 45.0, 29.0, 23.0, 12.0, 5.0, 5.0, 1.0, 4.0, 1.0], "bins": [-46.8125, -45.388671875, -43.96484375, -42.541015625, -41.1171875, -39.693359375, -38.26953125, -36.845703125, -35.421875, -33.998046875, -32.57421875, -31.150390625, -29.7265625, -28.302734375, -26.87890625, -25.455078125, -24.03125, -22.607421875, -21.18359375, -19.759765625, -18.3359375, -16.912109375, -15.48828125, -14.064453125, -12.640625, -11.216796875, -9.79296875, -8.369140625, -6.9453125, -5.521484375, -4.09765625, -2.673828125, -1.25, 0.173828125, 1.59765625, 3.021484375, 4.4453125, 5.869140625, 7.29296875, 8.716796875, 10.140625, 11.564453125, 12.98828125, 14.412109375, 15.8359375, 17.259765625, 18.68359375, 20.107421875, 21.53125, 22.955078125, 24.37890625, 25.802734375, 27.2265625, 28.650390625, 30.07421875, 31.498046875, 32.921875, 34.345703125, 35.76953125, 37.193359375, 38.6171875, 40.041015625, 41.46484375, 42.888671875, 44.3125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 5.0, 5.0, 7.0, 9.0, 14.0, 12.0, 15.0, 23.0, 14.0, 28.0, 32.0, 34.0, 40.0, 30.0, 34.0, 36.0, 37.0, 27.0, 43.0, 47.0, 43.0, 36.0, 36.0, 41.0, 43.0, 30.0, 28.0, 32.0, 31.0, 29.0, 25.0, 12.0, 18.0, 22.0, 5.0, 13.0, 14.0, 8.0, 10.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-48.375, -46.65283203125, -44.9306640625, -43.20849609375, -41.486328125, -39.76416015625, -38.0419921875, -36.31982421875, -34.59765625, -32.87548828125, -31.1533203125, -29.43115234375, -27.708984375, -25.98681640625, -24.2646484375, -22.54248046875, -20.8203125, -19.09814453125, -17.3759765625, -15.65380859375, -13.931640625, -12.20947265625, -10.4873046875, -8.76513671875, -7.04296875, -5.32080078125, -3.5986328125, -1.87646484375, -0.154296875, 1.56787109375, 3.2900390625, 5.01220703125, 6.734375, 8.45654296875, 10.1787109375, 11.90087890625, 13.623046875, 15.34521484375, 17.0673828125, 18.78955078125, 20.51171875, 22.23388671875, 23.9560546875, 25.67822265625, 27.400390625, 29.12255859375, 30.8447265625, 32.56689453125, 34.2890625, 36.01123046875, 37.7333984375, 39.45556640625, 41.177734375, 42.89990234375, 44.6220703125, 46.34423828125, 48.06640625, 49.78857421875, 51.5107421875, 53.23291015625, 54.955078125, 56.67724609375, 58.3994140625, 60.12158203125, 61.84375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 12.0, 12.0, 17.0, 30.0, 57.0, 114.0, 155.0, 317.0, 517.0, 909.0, 1703.0, 2894.0, 5337.0, 9258.0, 16180.0, 27868.0, 46970.0, 76536.0, 121801.0, 185460.0, 265494.0, 358204.0, 441560.0, 495081.0, 498400.0, 452484.0, 371805.0, 280442.0, 197543.0, 131098.0, 83177.0, 51024.0, 30400.0, 17688.0, 10230.0, 5962.0, 3311.0, 1824.0, 1051.0, 570.0, 315.0, 221.0, 110.0, 64.0, 32.0, 27.0, 11.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.46875, -49.7578125, -48.046875, -46.3359375, -44.625, -42.9140625, -41.203125, -39.4921875, -37.78125, -36.0703125, -34.359375, -32.6484375, -30.9375, -29.2265625, -27.515625, -25.8046875, -24.09375, -22.3828125, -20.671875, -18.9609375, -17.25, -15.5390625, -13.828125, -12.1171875, -10.40625, -8.6953125, -6.984375, -5.2734375, -3.5625, -1.8515625, -0.140625, 1.5703125, 3.28125, 4.9921875, 6.703125, 8.4140625, 10.125, 11.8359375, 13.546875, 15.2578125, 16.96875, 18.6796875, 20.390625, 22.1015625, 23.8125, 25.5234375, 27.234375, 28.9453125, 30.65625, 32.3671875, 34.078125, 35.7890625, 37.5, 39.2109375, 40.921875, 42.6328125, 44.34375, 46.0546875, 47.765625, 49.4765625, 51.1875, 52.8984375, 54.609375, 56.3203125, 58.03125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 5.0, 16.0, 12.0, 16.0, 24.0, 29.0, 41.0, 39.0, 48.0, 66.0, 74.0, 99.0, 119.0, 120.0, 140.0, 134.0, 185.0, 169.0, 202.0, 190.0, 220.0, 209.0, 187.0, 228.0, 188.0, 189.0, 170.0, 152.0, 130.0, 117.0, 107.0, 102.0, 79.0, 53.0, 38.0, 38.0, 33.0, 27.0, 18.0, 25.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.21875, -24.41552734375, -23.6123046875, -22.80908203125, -22.005859375, -21.20263671875, -20.3994140625, -19.59619140625, -18.79296875, -17.98974609375, -17.1865234375, -16.38330078125, -15.580078125, -14.77685546875, -13.9736328125, -13.17041015625, -12.3671875, -11.56396484375, -10.7607421875, -9.95751953125, -9.154296875, -8.35107421875, -7.5478515625, -6.74462890625, -5.94140625, -5.13818359375, -4.3349609375, -3.53173828125, -2.728515625, -1.92529296875, -1.1220703125, -0.31884765625, 0.484375, 1.28759765625, 2.0908203125, 2.89404296875, 3.697265625, 4.50048828125, 5.3037109375, 6.10693359375, 6.91015625, 7.71337890625, 8.5166015625, 9.31982421875, 10.123046875, 10.92626953125, 11.7294921875, 12.53271484375, 13.3359375, 14.13916015625, 14.9423828125, 15.74560546875, 16.548828125, 17.35205078125, 18.1552734375, 18.95849609375, 19.76171875, 20.56494140625, 21.3681640625, 22.17138671875, 22.974609375, 23.77783203125, 24.5810546875, 25.38427734375, 26.1875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 7.0, 5.0, 10.0, 7.0, 11.0, 8.0, 17.0, 11.0, 7.0, 13.0, 20.0, 12.0, 14.0, 28.0, 27.0, 26.0, 28.0, 32.0, 38.0, 41.0, 44.0, 39.0, 44.0, 33.0, 40.0, 38.0, 23.0, 43.0, 29.0, 28.0, 32.0, 38.0, 33.0, 18.0, 22.0, 15.0, 21.0, 11.0, 14.0, 9.0, 14.0, 13.0, 12.0, 5.0, 6.0, 9.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-52.89725875854492, -51.18734359741211, -49.47743225097656, -47.76751708984375, -46.0576057434082, -44.34769058227539, -42.637779235839844, -40.92786407470703, -39.217952728271484, -37.50803756713867, -35.798126220703125, -34.08821105957031, -32.378299713134766, -30.668384552001953, -28.958473205566406, -27.248558044433594, -25.538644790649414, -23.828731536865234, -22.118818283081055, -20.408905029296875, -18.698991775512695, -16.989078521728516, -15.27916431427002, -13.56925106048584, -11.85933780670166, -10.14942455291748, -8.4395112991333, -6.729597568511963, -5.019684314727783, -3.3097705841064453, -1.5998573303222656, 0.11005592346191406, 1.8199691772460938, 3.5298824310302734, 5.239795684814453, 6.949709415435791, 8.659622192382812, 10.369536399841309, 12.079449653625488, 13.789362907409668, 15.499276161193848, 17.209190368652344, 18.919103622436523, 20.629016876220703, 22.338930130004883, 24.048843383789062, 25.758756637573242, 27.468669891357422, 29.1785831451416, 30.88849639892578, 32.598411560058594, 34.30832290649414, 36.01823806762695, 37.7281494140625, 39.43806457519531, 41.14797592163086, 42.85789108276367, 44.567806243896484, 46.27771759033203, 47.987632751464844, 49.69754409790039, 51.4074592590332, 53.11737060546875, 54.82728576660156, 56.53719711303711]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 11.0, 10.0, 13.0, 13.0, 13.0, 14.0, 12.0, 25.0, 29.0, 22.0, 29.0, 34.0, 42.0, 42.0, 42.0, 38.0, 31.0, 44.0, 46.0, 39.0, 44.0, 33.0, 41.0, 34.0, 30.0, 36.0, 36.0, 27.0, 27.0, 21.0, 17.0, 16.0, 22.0, 12.0, 8.0, 8.0, 12.0, 4.0, 5.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.406978607177734, -54.4423713684082, -52.477760314941406, -50.513153076171875, -48.548545837402344, -46.58393859863281, -44.619327545166016, -42.654720306396484, -40.69010925292969, -38.725502014160156, -36.76089096069336, -34.79628372192383, -32.8316764831543, -30.867067337036133, -28.90245819091797, -26.937850952148438, -24.973243713378906, -23.008634567260742, -21.04402732849121, -19.079418182373047, -17.114810943603516, -15.150201797485352, -13.185592651367188, -11.22098445892334, -9.256376266479492, -7.2917680740356445, -5.327159404754639, -3.362550735473633, -1.3979425430297852, 0.5666656494140625, 2.5312747955322266, 4.495882987976074, 6.460487365722656, 8.425095558166504, 10.389703750610352, 12.354312896728516, 14.318921089172363, 16.28352928161621, 18.248138427734375, 20.212745666503906, 22.17735481262207, 24.141963958740234, 26.106571197509766, 28.07118034362793, 30.035789489746094, 32.000396728515625, 33.965003967285156, 35.92961502075195, 37.894222259521484, 39.858829498291016, 41.82344055175781, 43.788047790527344, 45.752655029296875, 47.717262268066406, 49.6818733215332, 51.646480560302734, 53.61109161376953, 55.57569885253906, 57.54030990600586, 59.50491714477539, 61.46952438354492, 63.43413543701172, 65.39874267578125, 67.36334991455078, 69.32795715332031]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 10.0, 16.0, 21.0, 30.0, 43.0, 86.0, 129.0, 215.0, 375.0, 558.0, 1076.0, 1997.0, 3360.0, 5758.0, 9964.0, 17244.0, 28364.0, 46069.0, 69920.0, 98552.0, 125818.0, 140518.0, 137160.0, 116620.0, 87808.0, 60409.0, 38963.0, 23937.0, 14071.0, 8159.0, 4787.0, 2788.0, 1610.0, 889.0, 478.0, 288.0, 171.0, 112.0, 66.0, 37.0, 29.0, 16.0, 9.0, 7.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.53125, -24.675048828125, -23.81884765625, -22.962646484375, -22.1064453125, -21.250244140625, -20.39404296875, -19.537841796875, -18.681640625, -17.825439453125, -16.96923828125, -16.113037109375, -15.2568359375, -14.400634765625, -13.54443359375, -12.688232421875, -11.83203125, -10.975830078125, -10.11962890625, -9.263427734375, -8.4072265625, -7.551025390625, -6.69482421875, -5.838623046875, -4.982421875, -4.126220703125, -3.27001953125, -2.413818359375, -1.5576171875, -0.701416015625, 0.15478515625, 1.010986328125, 1.8671875, 2.723388671875, 3.57958984375, 4.435791015625, 5.2919921875, 6.148193359375, 7.00439453125, 7.860595703125, 8.716796875, 9.572998046875, 10.42919921875, 11.285400390625, 12.1416015625, 12.997802734375, 13.85400390625, 14.710205078125, 15.56640625, 16.422607421875, 17.27880859375, 18.135009765625, 18.9912109375, 19.847412109375, 20.70361328125, 21.559814453125, 22.416015625, 23.272216796875, 24.12841796875, 24.984619140625, 25.8408203125, 26.697021484375, 27.55322265625, 28.409423828125, 29.265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 11.0, 10.0, 10.0, 15.0, 14.0, 10.0, 14.0, 14.0, 22.0, 31.0, 23.0, 31.0, 34.0, 37.0, 41.0, 45.0, 40.0, 31.0, 42.0, 45.0, 39.0, 41.0, 36.0, 43.0, 33.0, 28.0, 38.0, 33.0, 31.0, 23.0, 23.0, 18.0, 14.0, 21.0, 16.0, 6.0, 8.0, 11.0, 6.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.03125, -55.04541015625, -53.0595703125, -51.07373046875, -49.087890625, -47.10205078125, -45.1162109375, -43.13037109375, -41.14453125, -39.15869140625, -37.1728515625, -35.18701171875, -33.201171875, -31.21533203125, -29.2294921875, -27.24365234375, -25.2578125, -23.27197265625, -21.2861328125, -19.30029296875, -17.314453125, -15.32861328125, -13.3427734375, -11.35693359375, -9.37109375, -7.38525390625, -5.3994140625, -3.41357421875, -1.427734375, 0.55810546875, 2.5439453125, 4.52978515625, 6.515625, 8.50146484375, 10.4873046875, 12.47314453125, 14.458984375, 16.44482421875, 18.4306640625, 20.41650390625, 22.40234375, 24.38818359375, 26.3740234375, 28.35986328125, 30.345703125, 32.33154296875, 34.3173828125, 36.30322265625, 38.2890625, 40.27490234375, 42.2607421875, 44.24658203125, 46.232421875, 48.21826171875, 50.2041015625, 52.18994140625, 54.17578125, 56.16162109375, 58.1474609375, 60.13330078125, 62.119140625, 64.10498046875, 66.0908203125, 68.07666015625, 70.0625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 9.0, 9.0, 12.0, 15.0, 24.0, 35.0, 49.0, 86.0, 116.0, 221.0, 411.0, 717.0, 1363.0, 2507.0, 4492.0, 8247.0, 15361.0, 29134.0, 192290.0, 717800.0, 35699.0, 18448.0, 9742.0, 5211.0, 2848.0, 1671.0, 879.0, 510.0, 245.0, 121.0, 106.0, 67.0, 35.0, 21.0, 15.0, 13.0, 4.0, 3.0, 11.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-82.625, -80.205078125, -77.78515625, -75.365234375, -72.9453125, -70.525390625, -68.10546875, -65.685546875, -63.265625, -60.845703125, -58.42578125, -56.005859375, -53.5859375, -51.166015625, -48.74609375, -46.326171875, -43.90625, -41.486328125, -39.06640625, -36.646484375, -34.2265625, -31.806640625, -29.38671875, -26.966796875, -24.546875, -22.126953125, -19.70703125, -17.287109375, -14.8671875, -12.447265625, -10.02734375, -7.607421875, -5.1875, -2.767578125, -0.34765625, 2.072265625, 4.4921875, 6.912109375, 9.33203125, 11.751953125, 14.171875, 16.591796875, 19.01171875, 21.431640625, 23.8515625, 26.271484375, 28.69140625, 31.111328125, 33.53125, 35.951171875, 38.37109375, 40.791015625, 43.2109375, 45.630859375, 48.05078125, 50.470703125, 52.890625, 55.310546875, 57.73046875, 60.150390625, 62.5703125, 64.990234375, 67.41015625, 69.830078125, 72.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 10.0, 13.0, 17.0, 15.0, 19.0, 24.0, 13.0, 28.0, 34.0, 32.0, 38.0, 36.0, 31.0, 35.0, 41.0, 37.0, 39.0, 23.0, 37.0, 26.0, 30.0, 45.0, 43.0, 28.0, 35.0, 20.0, 39.0, 27.0, 20.0, 21.0, 14.0, 17.0, 13.0, 15.0, 18.0, 4.0, 8.0, 6.0, 10.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-37.46875, -36.17626953125, -34.8837890625, -33.59130859375, -32.298828125, -31.00634765625, -29.7138671875, -28.42138671875, -27.12890625, -25.83642578125, -24.5439453125, -23.25146484375, -21.958984375, -20.66650390625, -19.3740234375, -18.08154296875, -16.7890625, -15.49658203125, -14.2041015625, -12.91162109375, -11.619140625, -10.32666015625, -9.0341796875, -7.74169921875, -6.44921875, -5.15673828125, -3.8642578125, -2.57177734375, -1.279296875, 0.01318359375, 1.3056640625, 2.59814453125, 3.890625, 5.18310546875, 6.4755859375, 7.76806640625, 9.060546875, 10.35302734375, 11.6455078125, 12.93798828125, 14.23046875, 15.52294921875, 16.8154296875, 18.10791015625, 19.400390625, 20.69287109375, 21.9853515625, 23.27783203125, 24.5703125, 25.86279296875, 27.1552734375, 28.44775390625, 29.740234375, 31.03271484375, 32.3251953125, 33.61767578125, 34.91015625, 36.20263671875, 37.4951171875, 38.78759765625, 40.080078125, 41.37255859375, 42.6650390625, 43.95751953125, 45.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 8.0, 22.0, 23.0, 28.0, 36.0, 43.0, 56.0, 92.0, 136.0, 213.0, 332.0, 549.0, 848.0, 1436.0, 2504.0, 4515.0, 8505.0, 16439.0, 35883.0, 672400.0, 244580.0, 28724.0, 13991.0, 7360.0, 4156.0, 2251.0, 1222.0, 782.0, 432.0, 274.0, 199.0, 141.0, 76.0, 79.0, 45.0, 30.0, 32.0, 30.0, 10.0, 14.0, 9.0, 8.0, 3.0, 6.0, 2.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.18359375, -5.02099609375, -4.8583984375, -4.69580078125, -4.533203125, -4.37060546875, -4.2080078125, -4.04541015625, -3.8828125, -3.72021484375, -3.5576171875, -3.39501953125, -3.232421875, -3.06982421875, -2.9072265625, -2.74462890625, -2.58203125, -2.41943359375, -2.2568359375, -2.09423828125, -1.931640625, -1.76904296875, -1.6064453125, -1.44384765625, -1.28125, -1.11865234375, -0.9560546875, -0.79345703125, -0.630859375, -0.46826171875, -0.3056640625, -0.14306640625, 0.01953125, 0.18212890625, 0.3447265625, 0.50732421875, 0.669921875, 0.83251953125, 0.9951171875, 1.15771484375, 1.3203125, 1.48291015625, 1.6455078125, 1.80810546875, 1.970703125, 2.13330078125, 2.2958984375, 2.45849609375, 2.62109375, 2.78369140625, 2.9462890625, 3.10888671875, 3.271484375, 3.43408203125, 3.5966796875, 3.75927734375, 3.921875, 4.08447265625, 4.2470703125, 4.40966796875, 4.572265625, 4.73486328125, 4.8974609375, 5.06005859375, 5.22265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 3.0, 6.0, 3.0, 8.0, 10.0, 9.0, 12.0, 5.0, 18.0, 23.0, 12.0, 25.0, 20.0, 34.0, 29.0, 51.0, 49.0, 44.0, 57.0, 57.0, 52.0, 62.0, 45.0, 51.0, 36.0, 35.0, 32.0, 33.0, 31.0, 25.0, 20.0, 17.0, 13.0, 12.0, 10.0, 8.0, 7.0, 7.0, 7.0, 7.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00061798095703125, -0.0006001219153404236, -0.0005822628736495972, -0.0005644038319587708, -0.0005465447902679443, -0.0005286857485771179, -0.0005108267068862915, -0.0004929676651954651, -0.00047510862350463867, -0.00045724958181381226, -0.00043939054012298584, -0.0004215314984321594, -0.000403672456741333, -0.0003858134150505066, -0.0003679543733596802, -0.00035009533166885376, -0.00033223628997802734, -0.00031437724828720093, -0.0002965182065963745, -0.0002786591649055481, -0.0002608001232147217, -0.00024294108152389526, -0.00022508203983306885, -0.00020722299814224243, -0.00018936395645141602, -0.0001715049147605896, -0.00015364587306976318, -0.00013578683137893677, -0.00011792778968811035, -0.00010006874799728394, -8.220970630645752e-05, -6.43506646156311e-05, -4.649162292480469e-05, -2.863258123397827e-05, -1.0773539543151855e-05, 7.0855021476745605e-06, 2.4944543838500977e-05, 4.280358552932739e-05, 6.066262722015381e-05, 7.852166891098022e-05, 9.638071060180664e-05, 0.00011423975229263306, 0.00013209879398345947, 0.0001499578356742859, 0.0001678168773651123, 0.00018567591905593872, 0.00020353496074676514, 0.00022139400243759155, 0.00023925304412841797, 0.0002571120858192444, 0.0002749711275100708, 0.0002928301692008972, 0.00031068921089172363, 0.00032854825258255005, 0.00034640729427337646, 0.0003642663359642029, 0.0003821253776550293, 0.0003999844193458557, 0.00041784346103668213, 0.00043570250272750854, 0.00045356154441833496, 0.0004714205861091614, 0.0004892796277999878, 0.0005071386694908142, 0.0005249977111816406]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 6.0, 10.0, 14.0, 22.0, 20.0, 36.0, 49.0, 73.0, 120.0, 156.0, 219.0, 280.0, 439.0, 610.0, 949.0, 1560.0, 2572.0, 4545.0, 8854.0, 18010.0, 36725.0, 74127.0, 136651.0, 208399.0, 219956.0, 156264.0, 87894.0, 43924.0, 21741.0, 10681.0, 5577.0, 2995.0, 1724.0, 1093.0, 694.0, 484.0, 300.0, 224.0, 163.0, 111.0, 87.0, 84.0, 38.0, 25.0, 20.0, 6.0, 12.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.525390625, -3.40838623046875, -3.2913818359375, -3.17437744140625, -3.057373046875, -2.94036865234375, -2.8233642578125, -2.70635986328125, -2.58935546875, -2.47235107421875, -2.3553466796875, -2.23834228515625, -2.121337890625, -2.00433349609375, -1.8873291015625, -1.77032470703125, -1.6533203125, -1.53631591796875, -1.4193115234375, -1.30230712890625, -1.185302734375, -1.06829833984375, -0.9512939453125, -0.83428955078125, -0.71728515625, -0.60028076171875, -0.4832763671875, -0.36627197265625, -0.249267578125, -0.13226318359375, -0.0152587890625, 0.10174560546875, 0.21875, 0.33575439453125, 0.4527587890625, 0.56976318359375, 0.686767578125, 0.80377197265625, 0.9207763671875, 1.03778076171875, 1.15478515625, 1.27178955078125, 1.3887939453125, 1.50579833984375, 1.622802734375, 1.73980712890625, 1.8568115234375, 1.97381591796875, 2.0908203125, 2.20782470703125, 2.3248291015625, 2.44183349609375, 2.558837890625, 2.67584228515625, 2.7928466796875, 2.90985107421875, 3.02685546875, 3.14385986328125, 3.2608642578125, 3.37786865234375, 3.494873046875, 3.61187744140625, 3.7288818359375, 3.84588623046875, 3.962890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 8.0, 11.0, 20.0, 18.0, 31.0, 31.0, 62.0, 77.0, 96.0, 113.0, 118.0, 102.0, 80.0, 61.0, 44.0, 28.0, 14.0, 14.0, 8.0, 13.0, 6.0, 4.0, 2.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.4547882080078125, -1.404693603515625, -1.3545989990234375, -1.30450439453125, -1.2544097900390625, -1.204315185546875, -1.1542205810546875, -1.1041259765625, -1.0540313720703125, -1.003936767578125, -0.9538421630859375, -0.90374755859375, -0.8536529541015625, -0.803558349609375, -0.7534637451171875, -0.703369140625, -0.6532745361328125, -0.603179931640625, -0.5530853271484375, -0.50299072265625, -0.4528961181640625, -0.402801513671875, -0.3527069091796875, -0.3026123046875, -0.2525177001953125, -0.202423095703125, -0.1523284912109375, -0.10223388671875, -0.0521392822265625, -0.002044677734375, 0.0480499267578125, 0.09814453125, 0.1482391357421875, 0.198333740234375, 0.2484283447265625, 0.29852294921875, 0.3486175537109375, 0.398712158203125, 0.4488067626953125, 0.4989013671875, 0.5489959716796875, 0.599090576171875, 0.6491851806640625, 0.69927978515625, 0.7493743896484375, 0.799468994140625, 0.8495635986328125, 0.899658203125, 0.9497528076171875, 0.999847412109375, 1.0499420166015625, 1.10003662109375, 1.1501312255859375, 1.200225830078125, 1.2503204345703125, 1.3004150390625, 1.3505096435546875, 1.400604248046875, 1.4506988525390625, 1.50079345703125, 1.5508880615234375, 1.600982666015625, 1.6510772705078125, 1.701171875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 5.0, 10.0, 9.0, 11.0, 10.0, 14.0, 9.0, 14.0, 13.0, 16.0, 20.0, 30.0, 19.0, 21.0, 22.0, 35.0, 42.0, 35.0, 33.0, 39.0, 43.0, 37.0, 40.0, 37.0, 34.0, 31.0, 31.0, 34.0, 42.0, 29.0, 26.0, 28.0, 21.0, 20.0, 17.0, 16.0, 20.0, 5.0, 9.0, 16.0, 10.0, 14.0, 6.0, 1.0, 6.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-51.85308837890625, -50.14957809448242, -48.44607162475586, -46.74256134033203, -45.0390510559082, -43.335540771484375, -41.63203430175781, -39.928524017333984, -38.225013732910156, -36.52150344848633, -34.817996978759766, -33.11448669433594, -31.41097640991211, -29.707468032836914, -28.00395965576172, -26.30044937133789, -24.596942901611328, -22.893434524536133, -21.189924240112305, -19.48641586303711, -17.78290557861328, -16.079397201538086, -14.37588882446289, -12.672379493713379, -10.968870162963867, -9.265360832214355, -7.561851978302002, -5.858343124389648, -4.154833793640137, -2.451324462890625, -0.7478160858154297, 0.955693244934082, 2.6592025756835938, 4.3627119064331055, 6.066220760345459, 7.7697296142578125, 9.473238945007324, 11.176748275756836, 12.880256652832031, 14.583765983581543, 16.287275314331055, 17.99078369140625, 19.694293975830078, 21.397802352905273, 23.10131072998047, 24.804821014404297, 26.508329391479492, 28.211837768554688, 29.915348052978516, 31.61885643005371, 33.322364807128906, 35.025875091552734, 36.72938537597656, 38.432891845703125, 40.13640213012695, 41.83991241455078, 43.543418884277344, 45.24692916870117, 46.950435638427734, 48.65394592285156, 50.35745620727539, 52.06096649169922, 53.76447296142578, 55.46798324584961, 57.17149353027344]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 11.0, 8.0, 11.0, 16.0, 11.0, 14.0, 15.0, 25.0, 23.0, 27.0, 34.0, 32.0, 35.0, 45.0, 32.0, 46.0, 33.0, 45.0, 44.0, 37.0, 42.0, 30.0, 50.0, 30.0, 30.0, 40.0, 27.0, 32.0, 30.0, 19.0, 18.0, 13.0, 16.0, 24.0, 4.0, 14.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.00938415527344, -55.027931213378906, -53.04648208618164, -51.06502914428711, -49.083580017089844, -47.10212707519531, -45.12067413330078, -43.139225006103516, -41.15777587890625, -39.17632293701172, -37.19487380981445, -35.21342086791992, -33.231971740722656, -31.250518798828125, -29.269067764282227, -27.287616729736328, -25.306163787841797, -23.3247127532959, -21.34326171875, -19.36180877685547, -17.380359649658203, -15.398907661437988, -13.417455673217773, -11.436004638671875, -9.454553604125977, -7.473102569580078, -5.4916510581970215, -3.510199546813965, -1.5287485122680664, 0.45270252227783203, 2.434154510498047, 4.415605545043945, 6.397056579589844, 8.378507614135742, 10.35995864868164, 12.341410636901855, 14.322861671447754, 16.30431365966797, 18.285764694213867, 20.267215728759766, 22.248666763305664, 24.230117797851562, 26.21156883239746, 28.19301986694336, 30.17447280883789, 32.155921936035156, 34.13737487792969, 36.11882781982422, 38.100276947021484, 40.081729888916016, 42.06317901611328, 44.04463195800781, 46.02608108520508, 48.00753402709961, 49.988983154296875, 51.970436096191406, 53.95188903808594, 55.93334197998047, 57.914791107177734, 59.896244049072266, 61.87769317626953, 63.85914611816406, 65.8405990600586, 67.82205200195312, 69.80349731445312]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 18.0, 18.0, 43.0, 63.0, 101.0, 184.0, 282.0, 496.0, 893.0, 1534.0, 2670.0, 4636.0, 8102.0, 13836.0, 22784.0, 36187.0, 54462.0, 76886.0, 100217.0, 118705.0, 127268.0, 122384.0, 106039.0, 83518.0, 60636.0, 41409.0, 26437.0, 16125.0, 9627.0, 5593.0, 3118.0, 1877.0, 967.0, 598.0, 350.0, 201.0, 114.0, 67.0, 45.0, 22.0, 12.0, 12.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.96875, -53.17529296875, -51.3818359375, -49.58837890625, -47.794921875, -46.00146484375, -44.2080078125, -42.41455078125, -40.62109375, -38.82763671875, -37.0341796875, -35.24072265625, -33.447265625, -31.65380859375, -29.8603515625, -28.06689453125, -26.2734375, -24.47998046875, -22.6865234375, -20.89306640625, -19.099609375, -17.30615234375, -15.5126953125, -13.71923828125, -11.92578125, -10.13232421875, -8.3388671875, -6.54541015625, -4.751953125, -2.95849609375, -1.1650390625, 0.62841796875, 2.421875, 4.21533203125, 6.0087890625, 7.80224609375, 9.595703125, 11.38916015625, 13.1826171875, 14.97607421875, 16.76953125, 18.56298828125, 20.3564453125, 22.14990234375, 23.943359375, 25.73681640625, 27.5302734375, 29.32373046875, 31.1171875, 32.91064453125, 34.7041015625, 36.49755859375, 38.291015625, 40.08447265625, 41.8779296875, 43.67138671875, 45.46484375, 47.25830078125, 49.0517578125, 50.84521484375, 52.638671875, 54.43212890625, 56.2255859375, 58.01904296875, 59.8125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 10.0, 11.0, 13.0, 14.0, 10.0, 14.0, 12.0, 21.0, 29.0, 30.0, 30.0, 35.0, 35.0, 36.0, 38.0, 47.0, 40.0, 43.0, 45.0, 35.0, 39.0, 35.0, 44.0, 31.0, 29.0, 33.0, 38.0, 31.0, 31.0, 15.0, 16.0, 17.0, 20.0, 17.0, 9.0, 9.0, 10.0, 4.0, 7.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.71875, -52.81591796875, -50.9130859375, -49.01025390625, -47.107421875, -45.20458984375, -43.3017578125, -41.39892578125, -39.49609375, -37.59326171875, -35.6904296875, -33.78759765625, -31.884765625, -29.98193359375, -28.0791015625, -26.17626953125, -24.2734375, -22.37060546875, -20.4677734375, -18.56494140625, -16.662109375, -14.75927734375, -12.8564453125, -10.95361328125, -9.05078125, -7.14794921875, -5.2451171875, -3.34228515625, -1.439453125, 0.46337890625, 2.3662109375, 4.26904296875, 6.171875, 8.07470703125, 9.9775390625, 11.88037109375, 13.783203125, 15.68603515625, 17.5888671875, 19.49169921875, 21.39453125, 23.29736328125, 25.2001953125, 27.10302734375, 29.005859375, 30.90869140625, 32.8115234375, 34.71435546875, 36.6171875, 38.52001953125, 40.4228515625, 42.32568359375, 44.228515625, 46.13134765625, 48.0341796875, 49.93701171875, 51.83984375, 53.74267578125, 55.6455078125, 57.54833984375, 59.451171875, 61.35400390625, 63.2568359375, 65.15966796875, 67.0625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 15.0, 26.0, 26.0, 47.0, 93.0, 142.0, 245.0, 425.0, 748.0, 1379.0, 2651.0, 4791.0, 8485.0, 15129.0, 25978.0, 42115.0, 64208.0, 90517.0, 116813.0, 133375.0, 135467.0, 121817.0, 98133.0, 70803.0, 46488.0, 29235.0, 17300.0, 9924.0, 5457.0, 2992.0, 1692.0, 888.0, 457.0, 279.0, 161.0, 88.0, 59.0, 36.0, 28.0, 12.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-64.0625, -62.18505859375, -60.3076171875, -58.43017578125, -56.552734375, -54.67529296875, -52.7978515625, -50.92041015625, -49.04296875, -47.16552734375, -45.2880859375, -43.41064453125, -41.533203125, -39.65576171875, -37.7783203125, -35.90087890625, -34.0234375, -32.14599609375, -30.2685546875, -28.39111328125, -26.513671875, -24.63623046875, -22.7587890625, -20.88134765625, -19.00390625, -17.12646484375, -15.2490234375, -13.37158203125, -11.494140625, -9.61669921875, -7.7392578125, -5.86181640625, -3.984375, -2.10693359375, -0.2294921875, 1.64794921875, 3.525390625, 5.40283203125, 7.2802734375, 9.15771484375, 11.03515625, 12.91259765625, 14.7900390625, 16.66748046875, 18.544921875, 20.42236328125, 22.2998046875, 24.17724609375, 26.0546875, 27.93212890625, 29.8095703125, 31.68701171875, 33.564453125, 35.44189453125, 37.3193359375, 39.19677734375, 41.07421875, 42.95166015625, 44.8291015625, 46.70654296875, 48.583984375, 50.46142578125, 52.3388671875, 54.21630859375, 56.09375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 9.0, 8.0, 10.0, 21.0, 12.0, 14.0, 34.0, 34.0, 35.0, 31.0, 31.0, 33.0, 39.0, 37.0, 41.0, 43.0, 40.0, 38.0, 46.0, 43.0, 39.0, 38.0, 35.0, 33.0, 26.0, 24.0, 34.0, 33.0, 23.0, 14.0, 17.0, 11.0, 14.0, 5.0, 11.0, 8.0, 9.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -34.2587890625, -32.955078125, -31.6513671875, -30.34765625, -29.0439453125, -27.740234375, -26.4365234375, -25.1328125, -23.8291015625, -22.525390625, -21.2216796875, -19.91796875, -18.6142578125, -17.310546875, -16.0068359375, -14.703125, -13.3994140625, -12.095703125, -10.7919921875, -9.48828125, -8.1845703125, -6.880859375, -5.5771484375, -4.2734375, -2.9697265625, -1.666015625, -0.3623046875, 0.94140625, 2.2451171875, 3.548828125, 4.8525390625, 6.15625, 7.4599609375, 8.763671875, 10.0673828125, 11.37109375, 12.6748046875, 13.978515625, 15.2822265625, 16.5859375, 17.8896484375, 19.193359375, 20.4970703125, 21.80078125, 23.1044921875, 24.408203125, 25.7119140625, 27.015625, 28.3193359375, 29.623046875, 30.9267578125, 32.23046875, 33.5341796875, 34.837890625, 36.1416015625, 37.4453125, 38.7490234375, 40.052734375, 41.3564453125, 42.66015625, 43.9638671875, 45.267578125, 46.5712890625, 47.875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 6.0, 15.0, 18.0, 32.0, 45.0, 113.0, 222.0, 370.0, 724.0, 1563.0, 3602.0, 8526.0, 20222.0, 46512.0, 101883.0, 180054.0, 233613.0, 208294.0, 129957.0, 64116.0, 27944.0, 11632.0, 4889.0, 2116.0, 974.0, 500.0, 254.0, 135.0, 75.0, 53.0, 35.0, 21.0, 8.0, 10.0, 8.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.09375, -39.9091796875, -38.724609375, -37.5400390625, -36.35546875, -35.1708984375, -33.986328125, -32.8017578125, -31.6171875, -30.4326171875, -29.248046875, -28.0634765625, -26.87890625, -25.6943359375, -24.509765625, -23.3251953125, -22.140625, -20.9560546875, -19.771484375, -18.5869140625, -17.40234375, -16.2177734375, -15.033203125, -13.8486328125, -12.6640625, -11.4794921875, -10.294921875, -9.1103515625, -7.92578125, -6.7412109375, -5.556640625, -4.3720703125, -3.1875, -2.0029296875, -0.818359375, 0.3662109375, 1.55078125, 2.7353515625, 3.919921875, 5.1044921875, 6.2890625, 7.4736328125, 8.658203125, 9.8427734375, 11.02734375, 12.2119140625, 13.396484375, 14.5810546875, 15.765625, 16.9501953125, 18.134765625, 19.3193359375, 20.50390625, 21.6884765625, 22.873046875, 24.0576171875, 25.2421875, 26.4267578125, 27.611328125, 28.7958984375, 29.98046875, 31.1650390625, 32.349609375, 33.5341796875, 34.71875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 4.0, 3.0, 2.0, 11.0, 11.0, 13.0, 17.0, 30.0, 24.0, 26.0, 28.0, 24.0, 37.0, 34.0, 41.0, 42.0, 57.0, 44.0, 52.0, 46.0, 46.0, 37.0, 43.0, 41.0, 34.0, 36.0, 27.0, 25.0, 19.0, 21.0, 20.0, 20.0, 16.0, 10.0, 7.0, 9.0, 13.0, 8.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.002246856689453125, -0.0021781325340270996, -0.0021094083786010742, -0.002040684223175049, -0.0019719600677490234, -0.001903235912322998, -0.0018345117568969727, -0.0017657876014709473, -0.0016970634460449219, -0.0016283392906188965, -0.001559615135192871, -0.0014908909797668457, -0.0014221668243408203, -0.001353442668914795, -0.0012847185134887695, -0.0012159943580627441, -0.0011472702026367188, -0.0010785460472106934, -0.001009821891784668, -0.0009410977363586426, -0.0008723735809326172, -0.0008036494255065918, -0.0007349252700805664, -0.000666201114654541, -0.0005974769592285156, -0.0005287528038024902, -0.00046002864837646484, -0.00039130449295043945, -0.00032258033752441406, -0.00025385618209838867, -0.00018513202667236328, -0.00011640787124633789, -4.76837158203125e-05, 2.104043960571289e-05, 8.976459503173828e-05, 0.00015848875045776367, 0.00022721290588378906, 0.00029593706130981445, 0.00036466121673583984, 0.00043338537216186523, 0.0005021095275878906, 0.000570833683013916, 0.0006395578384399414, 0.0007082819938659668, 0.0007770061492919922, 0.0008457303047180176, 0.000914454460144043, 0.0009831786155700684, 0.0010519027709960938, 0.0011206269264221191, 0.0011893510818481445, 0.00125807523727417, 0.0013267993927001953, 0.0013955235481262207, 0.001464247703552246, 0.0015329718589782715, 0.0016016960144042969, 0.0016704201698303223, 0.0017391443252563477, 0.001807868480682373, 0.0018765926361083984, 0.0019453167915344238, 0.0020140409469604492, 0.0020827651023864746, 0.0021514892578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 13.0, 14.0, 28.0, 39.0, 75.0, 90.0, 178.0, 251.0, 463.0, 683.0, 1144.0, 1897.0, 3243.0, 5687.0, 9818.0, 16813.0, 30027.0, 49888.0, 79978.0, 115233.0, 145215.0, 155958.0, 140039.0, 108431.0, 73550.0, 45660.0, 26973.0, 15566.0, 8969.0, 5175.0, 2985.0, 1754.0, 1064.0, 636.0, 366.0, 259.0, 149.0, 86.0, 58.0, 29.0, 19.0, 23.0, 4.0, 11.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.875, -24.0830078125, -23.291015625, -22.4990234375, -21.70703125, -20.9150390625, -20.123046875, -19.3310546875, -18.5390625, -17.7470703125, -16.955078125, -16.1630859375, -15.37109375, -14.5791015625, -13.787109375, -12.9951171875, -12.203125, -11.4111328125, -10.619140625, -9.8271484375, -9.03515625, -8.2431640625, -7.451171875, -6.6591796875, -5.8671875, -5.0751953125, -4.283203125, -3.4912109375, -2.69921875, -1.9072265625, -1.115234375, -0.3232421875, 0.46875, 1.2607421875, 2.052734375, 2.8447265625, 3.63671875, 4.4287109375, 5.220703125, 6.0126953125, 6.8046875, 7.5966796875, 8.388671875, 9.1806640625, 9.97265625, 10.7646484375, 11.556640625, 12.3486328125, 13.140625, 13.9326171875, 14.724609375, 15.5166015625, 16.30859375, 17.1005859375, 17.892578125, 18.6845703125, 19.4765625, 20.2685546875, 21.060546875, 21.8525390625, 22.64453125, 23.4365234375, 24.228515625, 25.0205078125, 25.8125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 5.0, 6.0, 6.0, 13.0, 21.0, 21.0, 40.0, 29.0, 42.0, 58.0, 55.0, 67.0, 85.0, 72.0, 69.0, 66.0, 70.0, 54.0, 56.0, 39.0, 26.0, 27.0, 18.0, 20.0, 10.0, 8.0, 7.0, 3.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.4757080078125, -11.037353515625, -10.5989990234375, -10.16064453125, -9.7222900390625, -9.283935546875, -8.8455810546875, -8.4072265625, -7.9688720703125, -7.530517578125, -7.0921630859375, -6.65380859375, -6.2154541015625, -5.777099609375, -5.3387451171875, -4.900390625, -4.4620361328125, -4.023681640625, -3.5853271484375, -3.14697265625, -2.7086181640625, -2.270263671875, -1.8319091796875, -1.3935546875, -0.9552001953125, -0.516845703125, -0.0784912109375, 0.35986328125, 0.7982177734375, 1.236572265625, 1.6749267578125, 2.11328125, 2.5516357421875, 2.989990234375, 3.4283447265625, 3.86669921875, 4.3050537109375, 4.743408203125, 5.1817626953125, 5.6201171875, 6.0584716796875, 6.496826171875, 6.9351806640625, 7.37353515625, 7.8118896484375, 8.250244140625, 8.6885986328125, 9.126953125, 9.5653076171875, 10.003662109375, 10.4420166015625, 10.88037109375, 11.3187255859375, 11.757080078125, 12.1954345703125, 12.6337890625, 13.0721435546875, 13.510498046875, 13.9488525390625, 14.38720703125, 14.8255615234375, 15.263916015625, 15.7022705078125, 16.140625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 7.0, 11.0, 7.0, 9.0, 14.0, 13.0, 20.0, 15.0, 18.0, 27.0, 42.0, 33.0, 30.0, 33.0, 45.0, 55.0, 30.0, 37.0, 46.0, 40.0, 45.0, 36.0, 42.0, 36.0, 36.0, 21.0, 28.0, 25.0, 28.0, 18.0, 29.0, 18.0, 10.0, 16.0, 12.0, 11.0, 6.0, 9.0, 4.0, 10.0, 2.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.68506622314453, -49.852203369140625, -48.01934051513672, -46.18647384643555, -44.35361099243164, -42.520748138427734, -40.68788528442383, -38.855018615722656, -37.02215576171875, -35.189292907714844, -33.35643005371094, -31.5235652923584, -29.69070053100586, -27.857837677001953, -26.024974822998047, -24.192110061645508, -22.3592472076416, -20.526384353637695, -18.693519592285156, -16.86065673828125, -15.027791976928711, -13.194929122924805, -11.362065315246582, -9.52920150756836, -7.696337699890137, -5.863473892211914, -4.030610084533691, -2.197746753692627, -0.3648829460144043, 1.4679803848266602, 3.300844192504883, 5.1337080001831055, 6.966571807861328, 8.79943561553955, 10.632299423217773, 12.46516227722168, 14.298027038574219, 16.130889892578125, 17.96375274658203, 19.79661750793457, 21.62948226928711, 23.462345123291016, 25.295209884643555, 27.12807273864746, 28.9609375, 30.793800354003906, 32.62666320800781, 34.45952606201172, 36.292388916015625, 38.12525177001953, 39.95811462402344, 41.79098129272461, 43.623844146728516, 45.45670700073242, 47.28956985473633, 49.1224365234375, 50.955299377441406, 52.78816223144531, 54.62102508544922, 56.45389175415039, 58.2867546081543, 60.1196174621582, 61.95248031616211, 63.78534698486328, 65.61820983886719]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 10.0, 9.0, 12.0, 10.0, 16.0, 13.0, 15.0, 12.0, 25.0, 18.0, 22.0, 27.0, 30.0, 36.0, 31.0, 30.0, 38.0, 45.0, 37.0, 35.0, 32.0, 30.0, 37.0, 48.0, 43.0, 36.0, 26.0, 22.0, 24.0, 22.0, 29.0, 24.0, 20.0, 14.0, 18.0, 20.0, 16.0, 9.0, 12.0, 9.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-57.952789306640625, -56.12928009033203, -54.30577087402344, -52.482261657714844, -50.65875244140625, -48.835243225097656, -47.01173400878906, -45.188228607177734, -43.36471939086914, -41.54121017456055, -39.71770095825195, -37.89419174194336, -36.070682525634766, -34.24717712402344, -32.423667907714844, -30.60015869140625, -28.776647567749023, -26.95313835144043, -25.129629135131836, -23.306121826171875, -21.48261260986328, -19.659103393554688, -17.835594177246094, -16.0120849609375, -14.188576698303223, -12.365067481994629, -10.541559219360352, -8.718050003051758, -6.894541263580322, -5.071032524108887, -3.247523307800293, -1.4240150451660156, 0.3994941711425781, 2.2230029106140137, 4.046511650085449, 5.870020866394043, 7.6935296058654785, 9.517038345336914, 11.340547561645508, 13.164055824279785, 14.987565040588379, 16.811073303222656, 18.63458251953125, 20.458091735839844, 22.281600952148438, 24.10511016845703, 25.928619384765625, 27.752126693725586, 29.57563591003418, 31.399145126342773, 33.222652435302734, 35.04616165161133, 36.86967086791992, 38.693180084228516, 40.51668930053711, 42.3401985168457, 44.1637077331543, 45.98721694946289, 47.810726165771484, 49.63423538208008, 51.45774459838867, 53.28125, 55.104759216308594, 56.92826843261719, 58.75177764892578]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 6.0, 9.0, 7.0, 12.0, 16.0, 41.0, 56.0, 114.0, 171.0, 276.0, 518.0, 845.0, 1430.0, 2432.0, 3982.0, 6618.0, 11230.0, 18183.0, 29285.0, 47799.0, 75373.0, 115975.0, 171795.0, 244658.0, 327657.0, 406329.0, 464337.0, 480116.0, 448525.0, 383491.0, 300464.0, 221609.0, 154049.0, 102335.0, 66236.0, 41896.0, 26034.0, 16115.0, 9533.0, 6024.0, 3466.0, 2147.0, 1237.0, 791.0, 462.0, 261.0, 158.0, 80.0, 50.0, 26.0, 9.0, 9.0, 7.0, 7.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0], "bins": [-46.3125, -44.83544921875, -43.3583984375, -41.88134765625, -40.404296875, -38.92724609375, -37.4501953125, -35.97314453125, -34.49609375, -33.01904296875, -31.5419921875, -30.06494140625, -28.587890625, -27.11083984375, -25.6337890625, -24.15673828125, -22.6796875, -21.20263671875, -19.7255859375, -18.24853515625, -16.771484375, -15.29443359375, -13.8173828125, -12.34033203125, -10.86328125, -9.38623046875, -7.9091796875, -6.43212890625, -4.955078125, -3.47802734375, -2.0009765625, -0.52392578125, 0.953125, 2.43017578125, 3.9072265625, 5.38427734375, 6.861328125, 8.33837890625, 9.8154296875, 11.29248046875, 12.76953125, 14.24658203125, 15.7236328125, 17.20068359375, 18.677734375, 20.15478515625, 21.6318359375, 23.10888671875, 24.5859375, 26.06298828125, 27.5400390625, 29.01708984375, 30.494140625, 31.97119140625, 33.4482421875, 34.92529296875, 36.40234375, 37.87939453125, 39.3564453125, 40.83349609375, 42.310546875, 43.78759765625, 45.2646484375, 46.74169921875, 48.21875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 8.0, 9.0, 11.0, 14.0, 13.0, 15.0, 9.0, 20.0, 20.0, 20.0, 18.0, 32.0, 31.0, 24.0, 35.0, 37.0, 36.0, 44.0, 36.0, 38.0, 25.0, 36.0, 35.0, 52.0, 37.0, 32.0, 37.0, 23.0, 21.0, 23.0, 25.0, 22.0, 19.0, 16.0, 19.0, 17.0, 20.0, 8.0, 12.0, 10.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-48.96875, -47.3779296875, -45.787109375, -44.1962890625, -42.60546875, -41.0146484375, -39.423828125, -37.8330078125, -36.2421875, -34.6513671875, -33.060546875, -31.4697265625, -29.87890625, -28.2880859375, -26.697265625, -25.1064453125, -23.515625, -21.9248046875, -20.333984375, -18.7431640625, -17.15234375, -15.5615234375, -13.970703125, -12.3798828125, -10.7890625, -9.1982421875, -7.607421875, -6.0166015625, -4.42578125, -2.8349609375, -1.244140625, 0.3466796875, 1.9375, 3.5283203125, 5.119140625, 6.7099609375, 8.30078125, 9.8916015625, 11.482421875, 13.0732421875, 14.6640625, 16.2548828125, 17.845703125, 19.4365234375, 21.02734375, 22.6181640625, 24.208984375, 25.7998046875, 27.390625, 28.9814453125, 30.572265625, 32.1630859375, 33.75390625, 35.3447265625, 36.935546875, 38.5263671875, 40.1171875, 41.7080078125, 43.298828125, 44.8896484375, 46.48046875, 48.0712890625, 49.662109375, 51.2529296875, 52.84375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 6.0, 5.0, 12.0, 18.0, 41.0, 39.0, 75.0, 123.0, 193.0, 360.0, 598.0, 1028.0, 1830.0, 2987.0, 5234.0, 8709.0, 14719.0, 24372.0, 39141.0, 62090.0, 95903.0, 142267.0, 203593.0, 273915.0, 347688.0, 412171.0, 447502.0, 448860.0, 413315.0, 352027.0, 278462.0, 206765.0, 145842.0, 98444.0, 64030.0, 40405.0, 24981.0, 14831.0, 8919.0, 5273.0, 3100.0, 1875.0, 1003.0, 621.0, 403.0, 215.0, 113.0, 81.0, 44.0, 21.0, 23.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-52.25, -50.66796875, -49.0859375, -47.50390625, -45.921875, -44.33984375, -42.7578125, -41.17578125, -39.59375, -38.01171875, -36.4296875, -34.84765625, -33.265625, -31.68359375, -30.1015625, -28.51953125, -26.9375, -25.35546875, -23.7734375, -22.19140625, -20.609375, -19.02734375, -17.4453125, -15.86328125, -14.28125, -12.69921875, -11.1171875, -9.53515625, -7.953125, -6.37109375, -4.7890625, -3.20703125, -1.625, -0.04296875, 1.5390625, 3.12109375, 4.703125, 6.28515625, 7.8671875, 9.44921875, 11.03125, 12.61328125, 14.1953125, 15.77734375, 17.359375, 18.94140625, 20.5234375, 22.10546875, 23.6875, 25.26953125, 26.8515625, 28.43359375, 30.015625, 31.59765625, 33.1796875, 34.76171875, 36.34375, 37.92578125, 39.5078125, 41.08984375, 42.671875, 44.25390625, 45.8359375, 47.41796875, 49.0]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 5.0, 5.0, 12.0, 19.0, 15.0, 17.0, 23.0, 32.0, 36.0, 40.0, 61.0, 70.0, 92.0, 87.0, 102.0, 132.0, 132.0, 143.0, 167.0, 183.0, 187.0, 176.0, 192.0, 185.0, 160.0, 207.0, 170.0, 165.0, 148.0, 154.0, 135.0, 117.0, 119.0, 86.0, 84.0, 73.0, 80.0, 61.0, 38.0, 38.0, 31.0, 17.0, 11.0, 13.0, 11.0, 7.0, 11.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-21.90625, -21.189697265625, -20.47314453125, -19.756591796875, -19.0400390625, -18.323486328125, -17.60693359375, -16.890380859375, -16.173828125, -15.457275390625, -14.74072265625, -14.024169921875, -13.3076171875, -12.591064453125, -11.87451171875, -11.157958984375, -10.44140625, -9.724853515625, -9.00830078125, -8.291748046875, -7.5751953125, -6.858642578125, -6.14208984375, -5.425537109375, -4.708984375, -3.992431640625, -3.27587890625, -2.559326171875, -1.8427734375, -1.126220703125, -0.40966796875, 0.306884765625, 1.0234375, 1.739990234375, 2.45654296875, 3.173095703125, 3.8896484375, 4.606201171875, 5.32275390625, 6.039306640625, 6.755859375, 7.472412109375, 8.18896484375, 8.905517578125, 9.6220703125, 10.338623046875, 11.05517578125, 11.771728515625, 12.48828125, 13.204833984375, 13.92138671875, 14.637939453125, 15.3544921875, 16.071044921875, 16.78759765625, 17.504150390625, 18.220703125, 18.937255859375, 19.65380859375, 20.370361328125, 21.0869140625, 21.803466796875, 22.52001953125, 23.236572265625, 23.953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 7.0, 7.0, 13.0, 10.0, 18.0, 17.0, 9.0, 15.0, 25.0, 28.0, 32.0, 36.0, 36.0, 41.0, 38.0, 43.0, 42.0, 45.0, 46.0, 54.0, 49.0, 43.0, 26.0, 32.0, 42.0, 29.0, 30.0, 16.0, 25.0, 22.0, 21.0, 18.0, 13.0, 11.0, 19.0, 8.0, 5.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.52864074707031, -57.64255905151367, -55.75647735595703, -53.870399475097656, -51.984317779541016, -50.098236083984375, -48.212154388427734, -46.326072692871094, -44.43999099731445, -42.55390930175781, -40.66782760620117, -38.78174591064453, -36.895668029785156, -35.009586334228516, -33.123504638671875, -31.237422943115234, -29.351343154907227, -27.465261459350586, -25.579181671142578, -23.693099975585938, -21.807018280029297, -19.920936584472656, -18.03485679626465, -16.148775100708008, -14.262694358825684, -12.37661361694336, -10.490531921386719, -8.604451179504395, -6.718369960784912, -4.83228874206543, -2.9462080001831055, -1.0601263046264648, 0.8259544372558594, 2.712035655975342, 4.598116874694824, 6.484197616577148, 8.370279312133789, 10.256360054016113, 12.142440795898438, 14.028522491455078, 15.914603233337402, 17.800683975219727, 19.686765670776367, 21.572845458984375, 23.458927154541016, 25.345008850097656, 27.231090545654297, 29.117172241210938, 31.003252029418945, 32.88933181762695, 34.775413513183594, 36.661495208740234, 38.547576904296875, 40.433658599853516, 42.319740295410156, 44.20581817626953, 46.09189987182617, 47.97798156738281, 49.86406326293945, 51.750144958496094, 53.63622283935547, 55.52230453491211, 57.40838623046875, 59.29446792602539, 61.18054962158203]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 6.0, 10.0, 12.0, 21.0, 17.0, 21.0, 18.0, 21.0, 26.0, 34.0, 35.0, 25.0, 49.0, 34.0, 36.0, 36.0, 48.0, 48.0, 48.0, 23.0, 33.0, 30.0, 29.0, 40.0, 31.0, 30.0, 37.0, 20.0, 21.0, 26.0, 17.0, 22.0, 14.0, 10.0, 9.0, 12.0, 7.0, 4.0, 2.0, 11.0, 4.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-64.69147491455078, -62.7783203125, -60.86516571044922, -58.95201110839844, -57.038856506347656, -55.125701904296875, -53.21254348754883, -51.29938888549805, -49.386234283447266, -47.473079681396484, -45.5599250793457, -43.64677047729492, -41.733612060546875, -39.820457458496094, -37.90730285644531, -35.99414825439453, -34.08099365234375, -32.16783905029297, -30.254684448242188, -28.341527938842773, -26.428373336791992, -24.51521873474121, -22.602062225341797, -20.688907623291016, -18.775753021240234, -16.862598419189453, -14.949442863464355, -13.036287307739258, -11.123132705688477, -9.209978103637695, -7.296822547912598, -5.3836669921875, -3.4705162048339844, -1.557361125946045, 0.35579395294189453, 2.268949031829834, 4.182104110717773, 6.095258712768555, 8.008414268493652, 9.92156982421875, 11.834724426269531, 13.747879028320312, 15.66103458404541, 17.574190139770508, 19.48734474182129, 21.40049934387207, 23.313655853271484, 25.226810455322266, 27.139965057373047, 29.053119659423828, 30.96627426147461, 32.87942886352539, 34.79258728027344, 36.70574188232422, 38.618896484375, 40.53205108642578, 42.44520568847656, 44.358360290527344, 46.271514892578125, 48.184669494628906, 50.09782409667969, 52.01097869873047, 53.924137115478516, 55.8372917175293, 57.75044631958008]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 9.0, 10.0, 15.0, 21.0, 42.0, 52.0, 110.0, 204.0, 287.0, 446.0, 667.0, 1074.0, 1732.0, 2695.0, 4164.0, 6549.0, 9802.0, 14721.0, 21784.0, 31119.0, 43144.0, 56914.0, 72665.0, 87571.0, 98149.0, 103846.0, 101154.0, 92112.0, 77995.0, 62614.0, 47788.0, 34640.0, 24810.0, 17211.0, 11566.0, 7461.0, 4902.0, 3037.0, 2011.0, 1298.0, 807.0, 497.0, 305.0, 206.0, 139.0, 88.0, 50.0, 31.0, 23.0, 7.0, 8.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-18.328125, -17.74951171875, -17.1708984375, -16.59228515625, -16.013671875, -15.43505859375, -14.8564453125, -14.27783203125, -13.69921875, -13.12060546875, -12.5419921875, -11.96337890625, -11.384765625, -10.80615234375, -10.2275390625, -9.64892578125, -9.0703125, -8.49169921875, -7.9130859375, -7.33447265625, -6.755859375, -6.17724609375, -5.5986328125, -5.02001953125, -4.44140625, -3.86279296875, -3.2841796875, -2.70556640625, -2.126953125, -1.54833984375, -0.9697265625, -0.39111328125, 0.1875, 0.76611328125, 1.3447265625, 1.92333984375, 2.501953125, 3.08056640625, 3.6591796875, 4.23779296875, 4.81640625, 5.39501953125, 5.9736328125, 6.55224609375, 7.130859375, 7.70947265625, 8.2880859375, 8.86669921875, 9.4453125, 10.02392578125, 10.6025390625, 11.18115234375, 11.759765625, 12.33837890625, 12.9169921875, 13.49560546875, 14.07421875, 14.65283203125, 15.2314453125, 15.81005859375, 16.388671875, 16.96728515625, 17.5458984375, 18.12451171875, 18.703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 8.0, 13.0, 18.0, 19.0, 21.0, 20.0, 19.0, 22.0, 35.0, 33.0, 27.0, 52.0, 30.0, 36.0, 40.0, 38.0, 54.0, 44.0, 29.0, 26.0, 36.0, 30.0, 37.0, 34.0, 24.0, 40.0, 23.0, 21.0, 24.0, 20.0, 16.0, 21.0, 9.0, 9.0, 14.0, 3.0, 7.0, 3.0, 4.0, 11.0, 0.0, 1.0, 4.0, 1.0, 4.0, 0.0, 2.0], "bins": [-65.375, -63.4619140625, -61.548828125, -59.6357421875, -57.72265625, -55.8095703125, -53.896484375, -51.9833984375, -50.0703125, -48.1572265625, -46.244140625, -44.3310546875, -42.41796875, -40.5048828125, -38.591796875, -36.6787109375, -34.765625, -32.8525390625, -30.939453125, -29.0263671875, -27.11328125, -25.2001953125, -23.287109375, -21.3740234375, -19.4609375, -17.5478515625, -15.634765625, -13.7216796875, -11.80859375, -9.8955078125, -7.982421875, -6.0693359375, -4.15625, -2.2431640625, -0.330078125, 1.5830078125, 3.49609375, 5.4091796875, 7.322265625, 9.2353515625, 11.1484375, 13.0615234375, 14.974609375, 16.8876953125, 18.80078125, 20.7138671875, 22.626953125, 24.5400390625, 26.453125, 28.3662109375, 30.279296875, 32.1923828125, 34.10546875, 36.0185546875, 37.931640625, 39.8447265625, 41.7578125, 43.6708984375, 45.583984375, 47.4970703125, 49.41015625, 51.3232421875, 53.236328125, 55.1494140625, 57.0625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 13.0, 13.0, 15.0, 29.0, 20.0, 47.0, 68.0, 115.0, 166.0, 271.0, 439.0, 714.0, 1163.0, 1796.0, 3071.0, 5055.0, 8535.0, 14536.0, 24678.0, 65859.0, 822944.0, 44245.0, 22326.0, 12982.0, 7681.0, 4560.0, 2755.0, 1676.0, 1004.0, 679.0, 361.0, 249.0, 153.0, 108.0, 62.0, 43.0, 32.0, 29.0, 17.0, 13.0, 10.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.75, -62.75146484375, -60.7529296875, -58.75439453125, -56.755859375, -54.75732421875, -52.7587890625, -50.76025390625, -48.76171875, -46.76318359375, -44.7646484375, -42.76611328125, -40.767578125, -38.76904296875, -36.7705078125, -34.77197265625, -32.7734375, -30.77490234375, -28.7763671875, -26.77783203125, -24.779296875, -22.78076171875, -20.7822265625, -18.78369140625, -16.78515625, -14.78662109375, -12.7880859375, -10.78955078125, -8.791015625, -6.79248046875, -4.7939453125, -2.79541015625, -0.796875, 1.20166015625, 3.2001953125, 5.19873046875, 7.197265625, 9.19580078125, 11.1943359375, 13.19287109375, 15.19140625, 17.18994140625, 19.1884765625, 21.18701171875, 23.185546875, 25.18408203125, 27.1826171875, 29.18115234375, 31.1796875, 33.17822265625, 35.1767578125, 37.17529296875, 39.173828125, 41.17236328125, 43.1708984375, 45.16943359375, 47.16796875, 49.16650390625, 51.1650390625, 53.16357421875, 55.162109375, 57.16064453125, 59.1591796875, 61.15771484375, 63.15625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [8.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 7.0, 3.0, 5.0, 12.0, 12.0, 16.0, 20.0, 20.0, 15.0, 15.0, 16.0, 33.0, 22.0, 32.0, 33.0, 28.0, 31.0, 42.0, 46.0, 42.0, 39.0, 36.0, 44.0, 46.0, 29.0, 36.0, 34.0, 31.0, 35.0, 24.0, 36.0, 11.0, 23.0, 16.0, 16.0, 15.0, 14.0, 11.0, 13.0, 8.0, 4.0, 10.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-36.5, -35.20703125, -33.9140625, -32.62109375, -31.328125, -30.03515625, -28.7421875, -27.44921875, -26.15625, -24.86328125, -23.5703125, -22.27734375, -20.984375, -19.69140625, -18.3984375, -17.10546875, -15.8125, -14.51953125, -13.2265625, -11.93359375, -10.640625, -9.34765625, -8.0546875, -6.76171875, -5.46875, -4.17578125, -2.8828125, -1.58984375, -0.296875, 0.99609375, 2.2890625, 3.58203125, 4.875, 6.16796875, 7.4609375, 8.75390625, 10.046875, 11.33984375, 12.6328125, 13.92578125, 15.21875, 16.51171875, 17.8046875, 19.09765625, 20.390625, 21.68359375, 22.9765625, 24.26953125, 25.5625, 26.85546875, 28.1484375, 29.44140625, 30.734375, 32.02734375, 33.3203125, 34.61328125, 35.90625, 37.19921875, 38.4921875, 39.78515625, 41.078125, 42.37109375, 43.6640625, 44.95703125, 46.25]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 6.0, 5.0, 6.0, 13.0, 16.0, 20.0, 20.0, 28.0, 30.0, 54.0, 55.0, 85.0, 135.0, 197.0, 307.0, 415.0, 587.0, 875.0, 1283.0, 1981.0, 3019.0, 4365.0, 6915.0, 10843.0, 18394.0, 34143.0, 428441.0, 451171.0, 35013.0, 18489.0, 11139.0, 6921.0, 4500.0, 2956.0, 1949.0, 1310.0, 900.0, 582.0, 412.0, 292.0, 216.0, 153.0, 93.0, 56.0, 37.0, 31.0, 28.0, 22.0, 21.0, 10.0, 6.0, 6.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.021484375, -2.924041748046875, -2.82659912109375, -2.729156494140625, -2.6317138671875, -2.534271240234375, -2.43682861328125, -2.339385986328125, -2.241943359375, -2.144500732421875, -2.04705810546875, -1.949615478515625, -1.8521728515625, -1.754730224609375, -1.65728759765625, -1.559844970703125, -1.46240234375, -1.364959716796875, -1.26751708984375, -1.170074462890625, -1.0726318359375, -0.975189208984375, -0.87774658203125, -0.780303955078125, -0.682861328125, -0.585418701171875, -0.48797607421875, -0.390533447265625, -0.2930908203125, -0.195648193359375, -0.09820556640625, -0.000762939453125, 0.0966796875, 0.194122314453125, 0.29156494140625, 0.389007568359375, 0.4864501953125, 0.583892822265625, 0.68133544921875, 0.778778076171875, 0.876220703125, 0.973663330078125, 1.07110595703125, 1.168548583984375, 1.2659912109375, 1.363433837890625, 1.46087646484375, 1.558319091796875, 1.65576171875, 1.753204345703125, 1.85064697265625, 1.948089599609375, 2.0455322265625, 2.142974853515625, 2.24041748046875, 2.337860107421875, 2.435302734375, 2.532745361328125, 2.63018798828125, 2.727630615234375, 2.8250732421875, 2.922515869140625, 3.01995849609375, 3.117401123046875, 3.21484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 5.0, 3.0, 10.0, 8.0, 11.0, 16.0, 13.0, 20.0, 38.0, 41.0, 43.0, 49.0, 49.0, 70.0, 67.0, 55.0, 72.0, 68.0, 66.0, 60.0, 49.0, 34.0, 32.0, 21.0, 20.0, 19.0, 14.0, 6.0, 7.0, 8.0, 2.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0006780624389648438, -0.0006585270166397095, -0.0006389915943145752, -0.0006194561719894409, -0.0005999207496643066, -0.0005803853273391724, -0.0005608499050140381, -0.0005413144826889038, -0.0005217790603637695, -0.0005022436380386353, -0.000482708215713501, -0.0004631727933883667, -0.0004436373710632324, -0.00042410194873809814, -0.00040456652641296387, -0.0003850311040878296, -0.0003654956817626953, -0.00034596025943756104, -0.00032642483711242676, -0.0003068894147872925, -0.0002873539924621582, -0.0002678185701370239, -0.00024828314781188965, -0.00022874772548675537, -0.0002092123031616211, -0.00018967688083648682, -0.00017014145851135254, -0.00015060603618621826, -0.00013107061386108398, -0.00011153519153594971, -9.199976921081543e-05, -7.246434688568115e-05, -5.2928924560546875e-05, -3.33935022354126e-05, -1.385807991027832e-05, 5.677342414855957e-06, 2.5212764739990234e-05, 4.474818706512451e-05, 6.428360939025879e-05, 8.381903171539307e-05, 0.00010335445404052734, 0.00012288987636566162, 0.0001424252986907959, 0.00016196072101593018, 0.00018149614334106445, 0.00020103156566619873, 0.000220566987991333, 0.00024010241031646729, 0.00025963783264160156, 0.00027917325496673584, 0.0002987086772918701, 0.0003182440996170044, 0.00033777952194213867, 0.00035731494426727295, 0.0003768503665924072, 0.0003963857889175415, 0.0004159212112426758, 0.00043545663356781006, 0.00045499205589294434, 0.0004745274782180786, 0.0004940629005432129, 0.0005135983228683472, 0.0005331337451934814, 0.0005526691675186157, 0.00057220458984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 9.0, 17.0, 23.0, 42.0, 58.0, 122.0, 160.0, 317.0, 476.0, 899.0, 1422.0, 2460.0, 4068.0, 7191.0, 12502.0, 21338.0, 36166.0, 58505.0, 87191.0, 118613.0, 141771.0, 146817.0, 130243.0, 100603.0, 69246.0, 44349.0, 26678.0, 15494.0, 8971.0, 5285.0, 3039.0, 1759.0, 1077.0, 636.0, 409.0, 240.0, 131.0, 81.0, 54.0, 38.0, 14.0, 18.0, 11.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.57421875, -2.491729736328125, -2.40924072265625, -2.326751708984375, -2.2442626953125, -2.161773681640625, -2.07928466796875, -1.996795654296875, -1.914306640625, -1.831817626953125, -1.74932861328125, -1.666839599609375, -1.5843505859375, -1.501861572265625, -1.41937255859375, -1.336883544921875, -1.25439453125, -1.171905517578125, -1.08941650390625, -1.006927490234375, -0.9244384765625, -0.841949462890625, -0.75946044921875, -0.676971435546875, -0.594482421875, -0.511993408203125, -0.42950439453125, -0.347015380859375, -0.2645263671875, -0.182037353515625, -0.09954833984375, -0.017059326171875, 0.0654296875, 0.147918701171875, 0.23040771484375, 0.312896728515625, 0.3953857421875, 0.477874755859375, 0.56036376953125, 0.642852783203125, 0.725341796875, 0.807830810546875, 0.89031982421875, 0.972808837890625, 1.0552978515625, 1.137786865234375, 1.22027587890625, 1.302764892578125, 1.38525390625, 1.467742919921875, 1.55023193359375, 1.632720947265625, 1.7152099609375, 1.797698974609375, 1.88018798828125, 1.962677001953125, 2.045166015625, 2.127655029296875, 2.21014404296875, 2.292633056640625, 2.3751220703125, 2.457611083984375, 2.54010009765625, 2.622589111328125, 2.705078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 4.0, 7.0, 15.0, 14.0, 18.0, 19.0, 34.0, 45.0, 40.0, 63.0, 56.0, 77.0, 63.0, 70.0, 67.0, 58.0, 58.0, 62.0, 46.0, 32.0, 30.0, 30.0, 14.0, 14.0, 11.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3828125, -1.342437744140625, -1.30206298828125, -1.261688232421875, -1.2213134765625, -1.180938720703125, -1.14056396484375, -1.100189208984375, -1.059814453125, -1.019439697265625, -0.97906494140625, -0.938690185546875, -0.8983154296875, -0.857940673828125, -0.81756591796875, -0.777191162109375, -0.73681640625, -0.696441650390625, -0.65606689453125, -0.615692138671875, -0.5753173828125, -0.534942626953125, -0.49456787109375, -0.454193115234375, -0.413818359375, -0.373443603515625, -0.33306884765625, -0.292694091796875, -0.2523193359375, -0.211944580078125, -0.17156982421875, -0.131195068359375, -0.0908203125, -0.050445556640625, -0.01007080078125, 0.030303955078125, 0.0706787109375, 0.111053466796875, 0.15142822265625, 0.191802978515625, 0.232177734375, 0.272552490234375, 0.31292724609375, 0.353302001953125, 0.3936767578125, 0.434051513671875, 0.47442626953125, 0.514801025390625, 0.55517578125, 0.595550537109375, 0.63592529296875, 0.676300048828125, 0.7166748046875, 0.757049560546875, 0.79742431640625, 0.837799072265625, 0.878173828125, 0.918548583984375, 0.95892333984375, 0.999298095703125, 1.0396728515625, 1.080047607421875, 1.12042236328125, 1.160797119140625, 1.201171875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 6.0, 9.0, 6.0, 6.0, 8.0, 14.0, 14.0, 19.0, 26.0, 13.0, 29.0, 21.0, 42.0, 37.0, 29.0, 40.0, 49.0, 32.0, 48.0, 41.0, 48.0, 54.0, 37.0, 40.0, 32.0, 25.0, 36.0, 33.0, 31.0, 16.0, 21.0, 19.0, 20.0, 19.0, 14.0, 17.0, 11.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.30906295776367, -57.45502471923828, -55.600990295410156, -53.746952056884766, -51.89291763305664, -50.03887939453125, -48.184844970703125, -46.330806732177734, -44.476768493652344, -42.62273025512695, -40.76869583129883, -38.91465759277344, -37.06062316894531, -35.20658493041992, -33.35254669189453, -31.498512268066406, -29.64447593688965, -27.79043960571289, -25.936403274536133, -24.082366943359375, -22.228328704833984, -20.374292373657227, -18.52025604248047, -16.666217803955078, -14.812182426452637, -12.958146095275879, -11.104108810424805, -9.250072479248047, -7.396035671234131, -5.541998863220215, -3.687962532043457, -1.8339252471923828, 0.020111083984375, 1.8741477727890015, 3.728184461593628, 5.582221031188965, 7.436257839202881, 9.290294647216797, 11.144330978393555, 12.998368263244629, 14.852404594421387, 16.70644187927246, 18.56047821044922, 20.414514541625977, 22.268550872802734, 24.122589111328125, 25.97662353515625, 27.83066177368164, 29.6846981048584, 31.538734436035156, 33.39277267456055, 35.24680709838867, 37.10084533691406, 38.95487976074219, 40.80891799926758, 42.66295623779297, 44.516990661621094, 46.371028900146484, 48.22506332397461, 50.0791015625, 51.933135986328125, 53.787174224853516, 55.641212463378906, 57.49524688720703, 59.34928512573242]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 9.0, 5.0, 8.0, 14.0, 14.0, 19.0, 19.0, 22.0, 21.0, 22.0, 33.0, 30.0, 33.0, 40.0, 38.0, 34.0, 40.0, 42.0, 52.0, 44.0, 35.0, 23.0, 37.0, 28.0, 37.0, 35.0, 25.0, 37.0, 25.0, 21.0, 25.0, 25.0, 11.0, 23.0, 7.0, 12.0, 12.0, 6.0, 8.0, 1.0, 7.0, 7.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-66.13524627685547, -64.21019744873047, -62.28514099121094, -60.36009216308594, -58.43503952026367, -56.509986877441406, -54.584938049316406, -52.65988540649414, -50.734832763671875, -48.80978012084961, -46.884727478027344, -44.959678649902344, -43.03462600708008, -41.10957336425781, -39.18452453613281, -37.25947189331055, -35.33441925048828, -33.409366607666016, -31.484315872192383, -29.55926513671875, -27.634212493896484, -25.70915985107422, -23.784109115600586, -21.859058380126953, -19.934005737304688, -18.008953094482422, -16.08390235900879, -14.15885066986084, -12.23379898071289, -10.308747291564941, -8.383695602416992, -6.458643913269043, -4.533588409423828, -2.608536720275879, -0.6834850311279297, 1.2415666580200195, 3.1666183471679688, 5.091670036315918, 7.016721725463867, 8.941773414611816, 10.866825103759766, 12.791876792907715, 14.716928482055664, 16.641979217529297, 18.567031860351562, 20.492084503173828, 22.41713523864746, 24.342185974121094, 26.26723861694336, 28.192291259765625, 30.117341995239258, 32.04239273071289, 33.967445373535156, 35.89249801635742, 37.81755065917969, 39.74259948730469, 41.66765213012695, 43.59270477294922, 45.51775360107422, 47.442806243896484, 49.36785888671875, 51.292911529541016, 53.21796417236328, 55.14301300048828, 57.06806564331055]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 12.0, 15.0, 16.0, 33.0, 49.0, 95.0, 162.0, 254.0, 468.0, 770.0, 1227.0, 2063.0, 3467.0, 5427.0, 8808.0, 13491.0, 20254.0, 29931.0, 41901.0, 56631.0, 72347.0, 87351.0, 98721.0, 104176.0, 102123.0, 94705.0, 80175.0, 65328.0, 50269.0, 36078.0, 25508.0, 17168.0, 11135.0, 7174.0, 4477.0, 2629.0, 1563.0, 1021.0, 609.0, 347.0, 220.0, 126.0, 85.0, 47.0, 39.0, 18.0, 19.0, 7.0, 7.0, 6.0, 3.0, 3.0], "bins": [-51.625, -50.18212890625, -48.7392578125, -47.29638671875, -45.853515625, -44.41064453125, -42.9677734375, -41.52490234375, -40.08203125, -38.63916015625, -37.1962890625, -35.75341796875, -34.310546875, -32.86767578125, -31.4248046875, -29.98193359375, -28.5390625, -27.09619140625, -25.6533203125, -24.21044921875, -22.767578125, -21.32470703125, -19.8818359375, -18.43896484375, -16.99609375, -15.55322265625, -14.1103515625, -12.66748046875, -11.224609375, -9.78173828125, -8.3388671875, -6.89599609375, -5.453125, -4.01025390625, -2.5673828125, -1.12451171875, 0.318359375, 1.76123046875, 3.2041015625, 4.64697265625, 6.08984375, 7.53271484375, 8.9755859375, 10.41845703125, 11.861328125, 13.30419921875, 14.7470703125, 16.18994140625, 17.6328125, 19.07568359375, 20.5185546875, 21.96142578125, 23.404296875, 24.84716796875, 26.2900390625, 27.73291015625, 29.17578125, 30.61865234375, 32.0615234375, 33.50439453125, 34.947265625, 36.39013671875, 37.8330078125, 39.27587890625, 40.71875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 7.0, 10.0, 5.0, 8.0, 13.0, 17.0, 18.0, 15.0, 23.0, 26.0, 20.0, 31.0, 31.0, 33.0, 46.0, 33.0, 41.0, 35.0, 38.0, 54.0, 48.0, 32.0, 29.0, 34.0, 27.0, 43.0, 31.0, 24.0, 36.0, 25.0, 24.0, 23.0, 21.0, 15.0, 17.0, 8.0, 13.0, 11.0, 7.0, 6.0, 2.0, 9.0, 5.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-63.90625, -62.03857421875, -60.1708984375, -58.30322265625, -56.435546875, -54.56787109375, -52.7001953125, -50.83251953125, -48.96484375, -47.09716796875, -45.2294921875, -43.36181640625, -41.494140625, -39.62646484375, -37.7587890625, -35.89111328125, -34.0234375, -32.15576171875, -30.2880859375, -28.42041015625, -26.552734375, -24.68505859375, -22.8173828125, -20.94970703125, -19.08203125, -17.21435546875, -15.3466796875, -13.47900390625, -11.611328125, -9.74365234375, -7.8759765625, -6.00830078125, -4.140625, -2.27294921875, -0.4052734375, 1.46240234375, 3.330078125, 5.19775390625, 7.0654296875, 8.93310546875, 10.80078125, 12.66845703125, 14.5361328125, 16.40380859375, 18.271484375, 20.13916015625, 22.0068359375, 23.87451171875, 25.7421875, 27.60986328125, 29.4775390625, 31.34521484375, 33.212890625, 35.08056640625, 36.9482421875, 38.81591796875, 40.68359375, 42.55126953125, 44.4189453125, 46.28662109375, 48.154296875, 50.02197265625, 51.8896484375, 53.75732421875, 55.625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 14.0, 19.0, 28.0, 42.0, 71.0, 109.0, 225.0, 400.0, 653.0, 1157.0, 2127.0, 3751.0, 6469.0, 11028.0, 18452.0, 29698.0, 45634.0, 66206.0, 88613.0, 109342.0, 122416.0, 123803.0, 113711.0, 95141.0, 72251.0, 51625.0, 33926.0, 21354.0, 12700.0, 7534.0, 4322.0, 2441.0, 1436.0, 809.0, 460.0, 244.0, 118.0, 93.0, 50.0, 30.0, 21.0, 11.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-59.71875, -57.9697265625, -56.220703125, -54.4716796875, -52.72265625, -50.9736328125, -49.224609375, -47.4755859375, -45.7265625, -43.9775390625, -42.228515625, -40.4794921875, -38.73046875, -36.9814453125, -35.232421875, -33.4833984375, -31.734375, -29.9853515625, -28.236328125, -26.4873046875, -24.73828125, -22.9892578125, -21.240234375, -19.4912109375, -17.7421875, -15.9931640625, -14.244140625, -12.4951171875, -10.74609375, -8.9970703125, -7.248046875, -5.4990234375, -3.75, -2.0009765625, -0.251953125, 1.4970703125, 3.24609375, 4.9951171875, 6.744140625, 8.4931640625, 10.2421875, 11.9912109375, 13.740234375, 15.4892578125, 17.23828125, 18.9873046875, 20.736328125, 22.4853515625, 24.234375, 25.9833984375, 27.732421875, 29.4814453125, 31.23046875, 32.9794921875, 34.728515625, 36.4775390625, 38.2265625, 39.9755859375, 41.724609375, 43.4736328125, 45.22265625, 46.9716796875, 48.720703125, 50.4697265625, 52.21875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 1.0, 7.0, 5.0, 9.0, 8.0, 18.0, 8.0, 13.0, 13.0, 18.0, 21.0, 25.0, 43.0, 45.0, 32.0, 42.0, 42.0, 44.0, 32.0, 45.0, 43.0, 48.0, 40.0, 36.0, 51.0, 46.0, 42.0, 32.0, 20.0, 28.0, 21.0, 20.0, 22.0, 12.0, 15.0, 12.0, 9.0, 5.0, 9.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.4375, -34.1611328125, -32.884765625, -31.6083984375, -30.33203125, -29.0556640625, -27.779296875, -26.5029296875, -25.2265625, -23.9501953125, -22.673828125, -21.3974609375, -20.12109375, -18.8447265625, -17.568359375, -16.2919921875, -15.015625, -13.7392578125, -12.462890625, -11.1865234375, -9.91015625, -8.6337890625, -7.357421875, -6.0810546875, -4.8046875, -3.5283203125, -2.251953125, -0.9755859375, 0.30078125, 1.5771484375, 2.853515625, 4.1298828125, 5.40625, 6.6826171875, 7.958984375, 9.2353515625, 10.51171875, 11.7880859375, 13.064453125, 14.3408203125, 15.6171875, 16.8935546875, 18.169921875, 19.4462890625, 20.72265625, 21.9990234375, 23.275390625, 24.5517578125, 25.828125, 27.1044921875, 28.380859375, 29.6572265625, 30.93359375, 32.2099609375, 33.486328125, 34.7626953125, 36.0390625, 37.3154296875, 38.591796875, 39.8681640625, 41.14453125, 42.4208984375, 43.697265625, 44.9736328125, 46.25]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 11.0, 26.0, 34.0, 57.0, 58.0, 121.0, 203.0, 293.0, 503.0, 857.0, 1322.0, 2229.0, 3670.0, 6008.0, 9759.0, 15776.0, 25028.0, 38276.0, 56786.0, 79037.0, 101597.0, 119689.0, 125760.0, 119399.0, 101764.0, 79075.0, 56686.0, 38493.0, 24879.0, 15709.0, 9812.0, 5992.0, 3702.0, 2404.0, 1351.0, 852.0, 538.0, 310.0, 189.0, 108.0, 81.0, 39.0, 25.0, 18.0, 9.0, 10.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.265625, -20.630859375, -19.99609375, -19.361328125, -18.7265625, -18.091796875, -17.45703125, -16.822265625, -16.1875, -15.552734375, -14.91796875, -14.283203125, -13.6484375, -13.013671875, -12.37890625, -11.744140625, -11.109375, -10.474609375, -9.83984375, -9.205078125, -8.5703125, -7.935546875, -7.30078125, -6.666015625, -6.03125, -5.396484375, -4.76171875, -4.126953125, -3.4921875, -2.857421875, -2.22265625, -1.587890625, -0.953125, -0.318359375, 0.31640625, 0.951171875, 1.5859375, 2.220703125, 2.85546875, 3.490234375, 4.125, 4.759765625, 5.39453125, 6.029296875, 6.6640625, 7.298828125, 7.93359375, 8.568359375, 9.203125, 9.837890625, 10.47265625, 11.107421875, 11.7421875, 12.376953125, 13.01171875, 13.646484375, 14.28125, 14.916015625, 15.55078125, 16.185546875, 16.8203125, 17.455078125, 18.08984375, 18.724609375, 19.359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 0.0, 9.0, 6.0, 11.0, 9.0, 19.0, 26.0, 30.0, 28.0, 29.0, 40.0, 29.0, 35.0, 44.0, 47.0, 39.0, 58.0, 50.0, 52.0, 53.0, 52.0, 48.0, 54.0, 35.0, 30.0, 28.0, 21.0, 13.0, 14.0, 19.0, 13.0, 15.0, 8.0, 13.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027179718017578125, -0.0026380717754364014, -0.0025581717491149902, -0.002478271722793579, -0.002398371696472168, -0.002318471670150757, -0.0022385716438293457, -0.0021586716175079346, -0.0020787715911865234, -0.0019988715648651123, -0.0019189715385437012, -0.00183907151222229, -0.001759171485900879, -0.0016792714595794678, -0.0015993714332580566, -0.0015194714069366455, -0.0014395713806152344, -0.0013596713542938232, -0.0012797713279724121, -0.001199871301651001, -0.0011199712753295898, -0.0010400712490081787, -0.0009601712226867676, -0.0008802711963653564, -0.0008003711700439453, -0.0007204711437225342, -0.000640571117401123, -0.0005606710910797119, -0.0004807710647583008, -0.00040087103843688965, -0.0003209710121154785, -0.00024107098579406738, -0.00016117095947265625, -8.127093315124512e-05, -1.3709068298339844e-06, 7.852911949157715e-05, 0.00015842914581298828, 0.00023832917213439941, 0.00031822919845581055, 0.0003981292247772217, 0.0004780292510986328, 0.0005579292774200439, 0.0006378293037414551, 0.0007177293300628662, 0.0007976293563842773, 0.0008775293827056885, 0.0009574294090270996, 0.0010373294353485107, 0.0011172294616699219, 0.001197129487991333, 0.0012770295143127441, 0.0013569295406341553, 0.0014368295669555664, 0.0015167295932769775, 0.0015966296195983887, 0.0016765296459197998, 0.001756429672241211, 0.001836329698562622, 0.0019162297248840332, 0.0019961297512054443, 0.0020760297775268555, 0.0021559298038482666, 0.0022358298301696777, 0.002315729856491089, 0.0023956298828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 6.0, 10.0, 9.0, 15.0, 24.0, 29.0, 54.0, 79.0, 110.0, 181.0, 239.0, 386.0, 592.0, 894.0, 1309.0, 2182.0, 3423.0, 5398.0, 8586.0, 13496.0, 20716.0, 30839.0, 45531.0, 62592.0, 82705.0, 101267.0, 113885.0, 116311.0, 108279.0, 92450.0, 73503.0, 53948.0, 37497.0, 25511.0, 16645.0, 10920.0, 6888.0, 4310.0, 2761.0, 1780.0, 1084.0, 688.0, 512.0, 318.0, 188.0, 141.0, 74.0, 67.0, 42.0, 27.0, 30.0, 9.0, 7.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.25, -18.61376953125, -17.9775390625, -17.34130859375, -16.705078125, -16.06884765625, -15.4326171875, -14.79638671875, -14.16015625, -13.52392578125, -12.8876953125, -12.25146484375, -11.615234375, -10.97900390625, -10.3427734375, -9.70654296875, -9.0703125, -8.43408203125, -7.7978515625, -7.16162109375, -6.525390625, -5.88916015625, -5.2529296875, -4.61669921875, -3.98046875, -3.34423828125, -2.7080078125, -2.07177734375, -1.435546875, -0.79931640625, -0.1630859375, 0.47314453125, 1.109375, 1.74560546875, 2.3818359375, 3.01806640625, 3.654296875, 4.29052734375, 4.9267578125, 5.56298828125, 6.19921875, 6.83544921875, 7.4716796875, 8.10791015625, 8.744140625, 9.38037109375, 10.0166015625, 10.65283203125, 11.2890625, 11.92529296875, 12.5615234375, 13.19775390625, 13.833984375, 14.47021484375, 15.1064453125, 15.74267578125, 16.37890625, 17.01513671875, 17.6513671875, 18.28759765625, 18.923828125, 19.56005859375, 20.1962890625, 20.83251953125, 21.46875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 10.0, 7.0, 9.0, 12.0, 12.0, 18.0, 14.0, 26.0, 34.0, 28.0, 29.0, 44.0, 43.0, 53.0, 32.0, 40.0, 53.0, 39.0, 45.0, 45.0, 55.0, 37.0, 46.0, 47.0, 37.0, 33.0, 26.0, 25.0, 18.0, 15.0, 10.0, 9.0, 13.0, 14.0, 9.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.8359375, -10.5401611328125, -10.244384765625, -9.9486083984375, -9.65283203125, -9.3570556640625, -9.061279296875, -8.7655029296875, -8.4697265625, -8.1739501953125, -7.878173828125, -7.5823974609375, -7.28662109375, -6.9908447265625, -6.695068359375, -6.3992919921875, -6.103515625, -5.8077392578125, -5.511962890625, -5.2161865234375, -4.92041015625, -4.6246337890625, -4.328857421875, -4.0330810546875, -3.7373046875, -3.4415283203125, -3.145751953125, -2.8499755859375, -2.55419921875, -2.2584228515625, -1.962646484375, -1.6668701171875, -1.37109375, -1.0753173828125, -0.779541015625, -0.4837646484375, -0.18798828125, 0.1077880859375, 0.403564453125, 0.6993408203125, 0.9951171875, 1.2908935546875, 1.586669921875, 1.8824462890625, 2.17822265625, 2.4739990234375, 2.769775390625, 3.0655517578125, 3.361328125, 3.6571044921875, 3.952880859375, 4.2486572265625, 4.54443359375, 4.8402099609375, 5.135986328125, 5.4317626953125, 5.7275390625, 6.0233154296875, 6.319091796875, 6.6148681640625, 6.91064453125, 7.2064208984375, 7.502197265625, 7.7979736328125, 8.09375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 3.0, 9.0, 6.0, 7.0, 10.0, 12.0, 16.0, 17.0, 13.0, 21.0, 14.0, 20.0, 28.0, 29.0, 40.0, 26.0, 30.0, 35.0, 33.0, 45.0, 32.0, 48.0, 36.0, 41.0, 30.0, 36.0, 37.0, 25.0, 40.0, 22.0, 34.0, 32.0, 30.0, 13.0, 15.0, 16.0, 20.0, 12.0, 19.0, 12.0, 5.0, 3.0, 4.0, 2.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-52.6223258972168, -50.923892974853516, -49.2254638671875, -47.52703094482422, -45.82859802246094, -44.130165100097656, -42.431732177734375, -40.73330307006836, -39.03487014770508, -37.3364372253418, -35.63800811767578, -33.9395751953125, -32.24114227294922, -30.542709350585938, -28.84427833557129, -27.14584732055664, -25.44741439819336, -23.748981475830078, -22.05055046081543, -20.35211944580078, -18.6536865234375, -16.95525360107422, -15.25682258605957, -13.558390617370605, -11.85995864868164, -10.161526679992676, -8.463094711303711, -6.764662742614746, -5.066230773925781, -3.3677988052368164, -1.6693668365478516, 0.02906513214111328, 1.7274932861328125, 3.4259252548217773, 5.124357223510742, 6.822789192199707, 8.521221160888672, 10.219653129577637, 11.918085098266602, 13.616517066955566, 15.314949035644531, 17.013381958007812, 18.71181297302246, 20.41024398803711, 22.10867691040039, 23.807109832763672, 25.50554084777832, 27.20397186279297, 28.90240478515625, 30.60083770751953, 32.29927062988281, 33.99769973754883, 35.69613265991211, 37.39456558227539, 39.092994689941406, 40.79142761230469, 42.48986053466797, 44.18829345703125, 45.88672637939453, 47.58515548706055, 49.28358840942383, 50.98202133178711, 52.680450439453125, 54.378883361816406, 56.07731628417969]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 6.0, 9.0, 1.0, 6.0, 6.0, 16.0, 18.0, 15.0, 20.0, 17.0, 16.0, 24.0, 32.0, 28.0, 34.0, 28.0, 34.0, 38.0, 33.0, 36.0, 35.0, 32.0, 43.0, 48.0, 46.0, 39.0, 21.0, 17.0, 29.0, 32.0, 23.0, 27.0, 24.0, 20.0, 22.0, 17.0, 18.0, 11.0, 17.0, 10.0, 9.0, 11.0, 8.0, 10.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0], "bins": [-60.79109191894531, -58.962013244628906, -57.132938385009766, -55.303863525390625, -53.47478485107422, -51.64570617675781, -49.81663131713867, -47.98755645751953, -46.158477783203125, -44.32939910888672, -42.50032424926758, -40.67124938964844, -38.84217071533203, -37.013092041015625, -35.184017181396484, -33.354942321777344, -31.525863647460938, -29.696786880493164, -27.86771011352539, -26.038633346557617, -24.209556579589844, -22.38047981262207, -20.551403045654297, -18.722326278686523, -16.89324951171875, -15.064172744750977, -13.235095977783203, -11.40601921081543, -9.576942443847656, -7.747865676879883, -5.918788909912109, -4.089712142944336, -2.2606353759765625, -0.43155860900878906, 1.3975181579589844, 3.226594924926758, 5.055671691894531, 6.884748458862305, 8.713825225830078, 10.542901992797852, 12.371978759765625, 14.201055526733398, 16.030132293701172, 17.859209060668945, 19.68828582763672, 21.517362594604492, 23.346439361572266, 25.17551612854004, 27.004592895507812, 28.833669662475586, 30.66274642944336, 32.4918212890625, 34.320899963378906, 36.14997863769531, 37.97905349731445, 39.808128356933594, 41.63720703125, 43.466285705566406, 45.29536056518555, 47.12443542480469, 48.953514099121094, 50.7825927734375, 52.61166763305664, 54.44074249267578, 56.26982116699219]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 11.0, 15.0, 16.0, 43.0, 53.0, 110.0, 202.0, 302.0, 560.0, 948.0, 1499.0, 2658.0, 4424.0, 7812.0, 12695.0, 21313.0, 34675.0, 56118.0, 87907.0, 135690.0, 197674.0, 274988.0, 359450.0, 433133.0, 476629.0, 474078.0, 429743.0, 355592.0, 271669.0, 193760.0, 132617.0, 86380.0, 54948.0, 34199.0, 20833.0, 12862.0, 7606.0, 4562.0, 2650.0, 1510.0, 927.0, 585.0, 333.0, 217.0, 109.0, 72.0, 44.0, 24.0, 16.0, 12.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-50.0, -48.48388671875, -46.9677734375, -45.45166015625, -43.935546875, -42.41943359375, -40.9033203125, -39.38720703125, -37.87109375, -36.35498046875, -34.8388671875, -33.32275390625, -31.806640625, -30.29052734375, -28.7744140625, -27.25830078125, -25.7421875, -24.22607421875, -22.7099609375, -21.19384765625, -19.677734375, -18.16162109375, -16.6455078125, -15.12939453125, -13.61328125, -12.09716796875, -10.5810546875, -9.06494140625, -7.548828125, -6.03271484375, -4.5166015625, -3.00048828125, -1.484375, 0.03173828125, 1.5478515625, 3.06396484375, 4.580078125, 6.09619140625, 7.6123046875, 9.12841796875, 10.64453125, 12.16064453125, 13.6767578125, 15.19287109375, 16.708984375, 18.22509765625, 19.7412109375, 21.25732421875, 22.7734375, 24.28955078125, 25.8056640625, 27.32177734375, 28.837890625, 30.35400390625, 31.8701171875, 33.38623046875, 34.90234375, 36.41845703125, 37.9345703125, 39.45068359375, 40.966796875, 42.48291015625, 43.9990234375, 45.51513671875, 47.03125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 8.0, 3.0, 7.0, 14.0, 17.0, 18.0, 17.0, 14.0, 10.0, 35.0, 27.0, 28.0, 37.0, 26.0, 33.0, 32.0, 33.0, 33.0, 42.0, 36.0, 41.0, 40.0, 53.0, 33.0, 26.0, 16.0, 27.0, 34.0, 20.0, 30.0, 23.0, 27.0, 16.0, 16.0, 19.0, 14.0, 16.0, 16.0, 10.0, 9.0, 6.0, 7.0, 10.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0], "bins": [-53.53125, -51.93359375, -50.3359375, -48.73828125, -47.140625, -45.54296875, -43.9453125, -42.34765625, -40.75, -39.15234375, -37.5546875, -35.95703125, -34.359375, -32.76171875, -31.1640625, -29.56640625, -27.96875, -26.37109375, -24.7734375, -23.17578125, -21.578125, -19.98046875, -18.3828125, -16.78515625, -15.1875, -13.58984375, -11.9921875, -10.39453125, -8.796875, -7.19921875, -5.6015625, -4.00390625, -2.40625, -0.80859375, 0.7890625, 2.38671875, 3.984375, 5.58203125, 7.1796875, 8.77734375, 10.375, 11.97265625, 13.5703125, 15.16796875, 16.765625, 18.36328125, 19.9609375, 21.55859375, 23.15625, 24.75390625, 26.3515625, 27.94921875, 29.546875, 31.14453125, 32.7421875, 34.33984375, 35.9375, 37.53515625, 39.1328125, 40.73046875, 42.328125, 43.92578125, 45.5234375, 47.12109375, 48.71875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 8.0, 9.0, 15.0, 21.0, 45.0, 64.0, 87.0, 155.0, 255.0, 443.0, 727.0, 1218.0, 1868.0, 3018.0, 4789.0, 7671.0, 11638.0, 18312.0, 27826.0, 41486.0, 60697.0, 87082.0, 121527.0, 162519.0, 212577.0, 264046.0, 314088.0, 353107.0, 376755.0, 377906.0, 358145.0, 319335.0, 270766.0, 219291.0, 169721.0, 125538.0, 91449.0, 63584.0, 44140.0, 29060.0, 19277.0, 12505.0, 8014.0, 5046.0, 3227.0, 1969.0, 1299.0, 731.0, 498.0, 303.0, 169.0, 109.0, 77.0, 36.0, 24.0, 11.0, 7.0, 5.0, 2.0, 3.0], "bins": [-44.625, -43.275390625, -41.92578125, -40.576171875, -39.2265625, -37.876953125, -36.52734375, -35.177734375, -33.828125, -32.478515625, -31.12890625, -29.779296875, -28.4296875, -27.080078125, -25.73046875, -24.380859375, -23.03125, -21.681640625, -20.33203125, -18.982421875, -17.6328125, -16.283203125, -14.93359375, -13.583984375, -12.234375, -10.884765625, -9.53515625, -8.185546875, -6.8359375, -5.486328125, -4.13671875, -2.787109375, -1.4375, -0.087890625, 1.26171875, 2.611328125, 3.9609375, 5.310546875, 6.66015625, 8.009765625, 9.359375, 10.708984375, 12.05859375, 13.408203125, 14.7578125, 16.107421875, 17.45703125, 18.806640625, 20.15625, 21.505859375, 22.85546875, 24.205078125, 25.5546875, 26.904296875, 28.25390625, 29.603515625, 30.953125, 32.302734375, 33.65234375, 35.001953125, 36.3515625, 37.701171875, 39.05078125, 40.400390625, 41.75]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 13.0, 8.0, 11.0, 17.0, 19.0, 19.0, 20.0, 41.0, 33.0, 59.0, 67.0, 73.0, 93.0, 110.0, 115.0, 123.0, 132.0, 176.0, 167.0, 175.0, 197.0, 202.0, 216.0, 192.0, 212.0, 189.0, 175.0, 157.0, 159.0, 147.0, 127.0, 110.0, 94.0, 99.0, 60.0, 63.0, 36.0, 43.0, 35.0, 24.0, 17.0, 8.0, 14.0, 9.0, 5.0, 5.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.546875, -22.754638671875, -21.96240234375, -21.170166015625, -20.3779296875, -19.585693359375, -18.79345703125, -18.001220703125, -17.208984375, -16.416748046875, -15.62451171875, -14.832275390625, -14.0400390625, -13.247802734375, -12.45556640625, -11.663330078125, -10.87109375, -10.078857421875, -9.28662109375, -8.494384765625, -7.7021484375, -6.909912109375, -6.11767578125, -5.325439453125, -4.533203125, -3.740966796875, -2.94873046875, -2.156494140625, -1.3642578125, -0.572021484375, 0.22021484375, 1.012451171875, 1.8046875, 2.596923828125, 3.38916015625, 4.181396484375, 4.9736328125, 5.765869140625, 6.55810546875, 7.350341796875, 8.142578125, 8.934814453125, 9.72705078125, 10.519287109375, 11.3115234375, 12.103759765625, 12.89599609375, 13.688232421875, 14.48046875, 15.272705078125, 16.06494140625, 16.857177734375, 17.6494140625, 18.441650390625, 19.23388671875, 20.026123046875, 20.818359375, 21.610595703125, 22.40283203125, 23.195068359375, 23.9873046875, 24.779541015625, 25.57177734375, 26.364013671875, 27.15625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 9.0, 8.0, 17.0, 17.0, 17.0, 17.0, 22.0, 17.0, 25.0, 25.0, 27.0, 30.0, 36.0, 35.0, 40.0, 36.0, 50.0, 42.0, 37.0, 39.0, 47.0, 40.0, 33.0, 37.0, 40.0, 31.0, 28.0, 24.0, 21.0, 19.0, 20.0, 15.0, 13.0, 12.0, 11.0, 16.0, 4.0, 6.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-55.089813232421875, -53.33258819580078, -51.57536697387695, -49.818145751953125, -48.06092071533203, -46.30369567871094, -44.54647445678711, -42.78925323486328, -41.03202819824219, -39.274803161621094, -37.517581939697266, -35.76036071777344, -34.003135681152344, -32.24591064453125, -30.488689422607422, -28.73146629333496, -26.9742431640625, -25.21702003479004, -23.459796905517578, -21.702573776245117, -19.945350646972656, -18.188127517700195, -16.430904388427734, -14.673681259155273, -12.916458129882812, -11.159235000610352, -9.40201187133789, -7.64478874206543, -5.887565612792969, -4.130342483520508, -2.373119354248047, -0.6158962249755859, 1.1413230895996094, 2.8985462188720703, 4.655769348144531, 6.412992477416992, 8.170215606689453, 9.927438735961914, 11.684661865234375, 13.441884994506836, 15.199108123779297, 16.956331253051758, 18.71355438232422, 20.47077751159668, 22.22800064086914, 23.9852237701416, 25.742446899414062, 27.499670028686523, 29.256893157958984, 31.014116287231445, 32.771339416503906, 34.528564453125, 36.28578567504883, 38.043006896972656, 39.80023193359375, 41.557456970214844, 43.31467819213867, 45.0718994140625, 46.829124450683594, 48.58634948730469, 50.343570709228516, 52.100791931152344, 53.85801696777344, 55.61524200439453, 57.37246322631836]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 12.0, 9.0, 17.0, 8.0, 20.0, 15.0, 20.0, 19.0, 18.0, 27.0, 38.0, 43.0, 33.0, 37.0, 54.0, 56.0, 48.0, 42.0, 54.0, 45.0, 50.0, 34.0, 28.0, 30.0, 40.0, 34.0, 20.0, 20.0, 24.0, 16.0, 24.0, 9.0, 18.0, 6.0, 7.0, 3.0, 6.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.63072204589844, -65.49087524414062, -63.35102844238281, -61.211181640625, -59.07133483886719, -56.931488037109375, -54.79164123535156, -52.65179443359375, -50.51194763183594, -48.372100830078125, -46.23225402832031, -44.0924072265625, -41.95256042480469, -39.812713623046875, -37.67286682128906, -35.53302001953125, -33.39317321777344, -31.253326416015625, -29.113479614257812, -26.9736328125, -24.833786010742188, -22.693939208984375, -20.554092407226562, -18.41424560546875, -16.274398803710938, -14.134552001953125, -11.994705200195312, -9.8548583984375, -7.7150115966796875, -5.575164794921875, -3.4353179931640625, -1.29547119140625, 0.8443679809570312, 2.9842147827148438, 5.124061584472656, 7.263908386230469, 9.403755187988281, 11.543601989746094, 13.683448791503906, 15.823295593261719, 17.96314239501953, 20.102989196777344, 22.242835998535156, 24.38268280029297, 26.52252960205078, 28.662376403808594, 30.802223205566406, 32.94207000732422, 35.08191680908203, 37.221763610839844, 39.361610412597656, 41.50145721435547, 43.64130401611328, 45.781150817871094, 47.920997619628906, 50.06084442138672, 52.20069122314453, 54.340538024902344, 56.480384826660156, 58.62023162841797, 60.76007843017578, 62.899925231933594, 65.0397720336914, 67.17961883544922, 69.31946563720703]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 8.0, 12.0, 25.0, 26.0, 62.0, 91.0, 138.0, 260.0, 396.0, 603.0, 914.0, 1605.0, 2527.0, 4223.0, 6642.0, 10523.0, 16486.0, 24841.0, 37094.0, 52564.0, 70562.0, 89126.0, 105253.0, 114155.0, 112891.0, 102152.0, 84774.0, 66581.0, 48129.0, 33654.0, 22522.0, 14510.0, 9563.0, 5936.0, 3661.0, 2251.0, 1482.0, 885.0, 568.0, 317.0, 194.0, 133.0, 80.0, 50.0, 38.0, 18.0, 9.0, 10.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-17.265625, -16.740478515625, -16.21533203125, -15.690185546875, -15.1650390625, -14.639892578125, -14.11474609375, -13.589599609375, -13.064453125, -12.539306640625, -12.01416015625, -11.489013671875, -10.9638671875, -10.438720703125, -9.91357421875, -9.388427734375, -8.86328125, -8.338134765625, -7.81298828125, -7.287841796875, -6.7626953125, -6.237548828125, -5.71240234375, -5.187255859375, -4.662109375, -4.136962890625, -3.61181640625, -3.086669921875, -2.5615234375, -2.036376953125, -1.51123046875, -0.986083984375, -0.4609375, 0.064208984375, 0.58935546875, 1.114501953125, 1.6396484375, 2.164794921875, 2.68994140625, 3.215087890625, 3.740234375, 4.265380859375, 4.79052734375, 5.315673828125, 5.8408203125, 6.365966796875, 6.89111328125, 7.416259765625, 7.94140625, 8.466552734375, 8.99169921875, 9.516845703125, 10.0419921875, 10.567138671875, 11.09228515625, 11.617431640625, 12.142578125, 12.667724609375, 13.19287109375, 13.718017578125, 14.2431640625, 14.768310546875, 15.29345703125, 15.818603515625, 16.34375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 3.0, 11.0, 12.0, 14.0, 10.0, 19.0, 16.0, 21.0, 17.0, 20.0, 27.0, 41.0, 39.0, 36.0, 37.0, 55.0, 50.0, 53.0, 40.0, 52.0, 53.0, 43.0, 35.0, 28.0, 28.0, 43.0, 31.0, 20.0, 21.0, 21.0, 17.0, 25.0, 10.0, 16.0, 8.0, 6.0, 1.0, 8.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.375, -65.232421875, -63.08984375, -60.947265625, -58.8046875, -56.662109375, -54.51953125, -52.376953125, -50.234375, -48.091796875, -45.94921875, -43.806640625, -41.6640625, -39.521484375, -37.37890625, -35.236328125, -33.09375, -30.951171875, -28.80859375, -26.666015625, -24.5234375, -22.380859375, -20.23828125, -18.095703125, -15.953125, -13.810546875, -11.66796875, -9.525390625, -7.3828125, -5.240234375, -3.09765625, -0.955078125, 1.1875, 3.330078125, 5.47265625, 7.615234375, 9.7578125, 11.900390625, 14.04296875, 16.185546875, 18.328125, 20.470703125, 22.61328125, 24.755859375, 26.8984375, 29.041015625, 31.18359375, 33.326171875, 35.46875, 37.611328125, 39.75390625, 41.896484375, 44.0390625, 46.181640625, 48.32421875, 50.466796875, 52.609375, 54.751953125, 56.89453125, 59.037109375, 61.1796875, 63.322265625, 65.46484375, 67.607421875, 69.75]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 8.0, 19.0, 28.0, 42.0, 59.0, 101.0, 124.0, 210.0, 380.0, 701.0, 1161.0, 1983.0, 3774.0, 6799.0, 12682.0, 24370.0, 64058.0, 846814.0, 41624.0, 19884.0, 10689.0, 5795.0, 3108.0, 1713.0, 987.0, 581.0, 323.0, 197.0, 124.0, 83.0, 51.0, 20.0, 14.0, 13.0, 3.0, 10.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-68.375, -66.26171875, -64.1484375, -62.03515625, -59.921875, -57.80859375, -55.6953125, -53.58203125, -51.46875, -49.35546875, -47.2421875, -45.12890625, -43.015625, -40.90234375, -38.7890625, -36.67578125, -34.5625, -32.44921875, -30.3359375, -28.22265625, -26.109375, -23.99609375, -21.8828125, -19.76953125, -17.65625, -15.54296875, -13.4296875, -11.31640625, -9.203125, -7.08984375, -4.9765625, -2.86328125, -0.75, 1.36328125, 3.4765625, 5.58984375, 7.703125, 9.81640625, 11.9296875, 14.04296875, 16.15625, 18.26953125, 20.3828125, 22.49609375, 24.609375, 26.72265625, 28.8359375, 30.94921875, 33.0625, 35.17578125, 37.2890625, 39.40234375, 41.515625, 43.62890625, 45.7421875, 47.85546875, 49.96875, 52.08203125, 54.1953125, 56.30859375, 58.421875, 60.53515625, 62.6484375, 64.76171875, 66.875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 7.0, 12.0, 12.0, 15.0, 9.0, 14.0, 5.0, 19.0, 21.0, 22.0, 26.0, 42.0, 27.0, 27.0, 37.0, 34.0, 41.0, 35.0, 43.0, 42.0, 48.0, 37.0, 42.0, 31.0, 38.0, 22.0, 22.0, 29.0, 34.0, 32.0, 29.0, 21.0, 20.0, 10.0, 11.0, 14.0, 22.0, 6.0, 12.0, 8.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.90625, -39.634765625, -38.36328125, -37.091796875, -35.8203125, -34.548828125, -33.27734375, -32.005859375, -30.734375, -29.462890625, -28.19140625, -26.919921875, -25.6484375, -24.376953125, -23.10546875, -21.833984375, -20.5625, -19.291015625, -18.01953125, -16.748046875, -15.4765625, -14.205078125, -12.93359375, -11.662109375, -10.390625, -9.119140625, -7.84765625, -6.576171875, -5.3046875, -4.033203125, -2.76171875, -1.490234375, -0.21875, 1.052734375, 2.32421875, 3.595703125, 4.8671875, 6.138671875, 7.41015625, 8.681640625, 9.953125, 11.224609375, 12.49609375, 13.767578125, 15.0390625, 16.310546875, 17.58203125, 18.853515625, 20.125, 21.396484375, 22.66796875, 23.939453125, 25.2109375, 26.482421875, 27.75390625, 29.025390625, 30.296875, 31.568359375, 32.83984375, 34.111328125, 35.3828125, 36.654296875, 37.92578125, 39.197265625, 40.46875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 2.0, 13.0, 4.0, 8.0, 12.0, 25.0, 21.0, 44.0, 62.0, 109.0, 173.0, 270.0, 430.0, 665.0, 1062.0, 1890.0, 3042.0, 5166.0, 9334.0, 17119.0, 35667.0, 691283.0, 219865.0, 28840.0, 14297.0, 7822.0, 4469.0, 2664.0, 1589.0, 966.0, 588.0, 362.0, 223.0, 151.0, 115.0, 71.0, 46.0, 28.0, 21.0, 9.0, 6.0, 11.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.046875, -3.923736572265625, -3.80059814453125, -3.677459716796875, -3.5543212890625, -3.431182861328125, -3.30804443359375, -3.184906005859375, -3.061767578125, -2.938629150390625, -2.81549072265625, -2.692352294921875, -2.5692138671875, -2.446075439453125, -2.32293701171875, -2.199798583984375, -2.07666015625, -1.953521728515625, -1.83038330078125, -1.707244873046875, -1.5841064453125, -1.460968017578125, -1.33782958984375, -1.214691162109375, -1.091552734375, -0.968414306640625, -0.84527587890625, -0.722137451171875, -0.5989990234375, -0.475860595703125, -0.35272216796875, -0.229583740234375, -0.1064453125, 0.016693115234375, 0.13983154296875, 0.262969970703125, 0.3861083984375, 0.509246826171875, 0.63238525390625, 0.755523681640625, 0.878662109375, 1.001800537109375, 1.12493896484375, 1.248077392578125, 1.3712158203125, 1.494354248046875, 1.61749267578125, 1.740631103515625, 1.86376953125, 1.986907958984375, 2.11004638671875, 2.233184814453125, 2.3563232421875, 2.479461669921875, 2.60260009765625, 2.725738525390625, 2.848876953125, 2.972015380859375, 3.09515380859375, 3.218292236328125, 3.3414306640625, 3.464569091796875, 3.58770751953125, 3.710845947265625, 3.833984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 6.0, 15.0, 24.0, 19.0, 22.0, 20.0, 31.0, 41.0, 53.0, 45.0, 64.0, 62.0, 55.0, 69.0, 69.0, 62.0, 52.0, 51.0, 46.0, 38.0, 34.0, 22.0, 13.0, 11.0, 11.0, 15.0, 6.0, 3.0, 3.0, 2.0, 8.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032973289489746094, -0.0003195516765117645, -0.0003093704581260681, -0.0002991892397403717, -0.0002890080213546753, -0.0002788268029689789, -0.00026864558458328247, -0.00025846436619758606, -0.00024828314781188965, -0.00023810192942619324, -0.00022792071104049683, -0.00021773949265480042, -0.000207558274269104, -0.0001973770558834076, -0.00018719583749771118, -0.00017701461911201477, -0.00016683340072631836, -0.00015665218234062195, -0.00014647096395492554, -0.00013628974556922913, -0.00012610852718353271, -0.0001159273087978363, -0.00010574609041213989, -9.556487202644348e-05, -8.538365364074707e-05, -7.520243525505066e-05, -6.502121686935425e-05, -5.483999848365784e-05, -4.4658780097961426e-05, -3.4477561712265015e-05, -2.4296343326568604e-05, -1.4115124940872192e-05, -3.933906555175781e-06, 6.24731183052063e-06, 1.642853021621704e-05, 2.6609748601913452e-05, 3.679096698760986e-05, 4.6972185373306274e-05, 5.7153403759002686e-05, 6.73346221446991e-05, 7.751584053039551e-05, 8.769705891609192e-05, 9.787827730178833e-05, 0.00010805949568748474, 0.00011824071407318115, 0.00012842193245887756, 0.00013860315084457397, 0.00014878436923027039, 0.0001589655876159668, 0.0001691468060016632, 0.00017932802438735962, 0.00018950924277305603, 0.00019969046115875244, 0.00020987167954444885, 0.00022005289793014526, 0.00023023411631584167, 0.00024041533470153809, 0.0002505965530872345, 0.0002607777714729309, 0.0002709589898586273, 0.00028114020824432373, 0.00029132142663002014, 0.00030150264501571655, 0.00031168386340141296, 0.0003218650817871094]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 15.0, 20.0, 22.0, 48.0, 83.0, 96.0, 142.0, 225.0, 328.0, 539.0, 804.0, 1305.0, 1914.0, 2805.0, 4298.0, 6560.0, 9772.0, 14553.0, 21426.0, 30320.0, 42355.0, 56279.0, 72241.0, 87534.0, 99925.0, 104887.0, 102726.0, 92544.0, 77478.0, 61433.0, 46939.0, 34226.0, 24359.0, 16709.0, 11382.0, 7474.0, 5017.0, 3372.0, 2109.0, 1528.0, 947.0, 672.0, 386.0, 258.0, 174.0, 112.0, 86.0, 37.0, 37.0, 14.0, 14.0, 12.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.19140625, -2.122222900390625, -2.05303955078125, -1.983856201171875, -1.9146728515625, -1.845489501953125, -1.77630615234375, -1.707122802734375, -1.637939453125, -1.568756103515625, -1.49957275390625, -1.430389404296875, -1.3612060546875, -1.292022705078125, -1.22283935546875, -1.153656005859375, -1.08447265625, -1.015289306640625, -0.94610595703125, -0.876922607421875, -0.8077392578125, -0.738555908203125, -0.66937255859375, -0.600189208984375, -0.531005859375, -0.461822509765625, -0.39263916015625, -0.323455810546875, -0.2542724609375, -0.185089111328125, -0.11590576171875, -0.046722412109375, 0.0224609375, 0.091644287109375, 0.16082763671875, 0.230010986328125, 0.2991943359375, 0.368377685546875, 0.43756103515625, 0.506744384765625, 0.575927734375, 0.645111083984375, 0.71429443359375, 0.783477783203125, 0.8526611328125, 0.921844482421875, 0.99102783203125, 1.060211181640625, 1.12939453125, 1.198577880859375, 1.26776123046875, 1.336944580078125, 1.4061279296875, 1.475311279296875, 1.54449462890625, 1.613677978515625, 1.682861328125, 1.752044677734375, 1.82122802734375, 1.890411376953125, 1.9595947265625, 2.028778076171875, 2.09796142578125, 2.167144775390625, 2.236328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 4.0, 13.0, 17.0, 19.0, 13.0, 22.0, 20.0, 17.0, 30.0, 29.0, 26.0, 40.0, 32.0, 39.0, 28.0, 31.0, 30.0, 40.0, 35.0, 43.0, 31.0, 38.0, 34.0, 40.0, 27.0, 28.0, 32.0, 28.0, 24.0, 34.0, 33.0, 23.0, 20.0, 18.0, 18.0, 7.0, 9.0, 8.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0146484375, -0.9815673828125, -0.948486328125, -0.9154052734375, -0.88232421875, -0.8492431640625, -0.816162109375, -0.7830810546875, -0.75, -0.7169189453125, -0.683837890625, -0.6507568359375, -0.61767578125, -0.5845947265625, -0.551513671875, -0.5184326171875, -0.4853515625, -0.4522705078125, -0.419189453125, -0.3861083984375, -0.35302734375, -0.3199462890625, -0.286865234375, -0.2537841796875, -0.220703125, -0.1876220703125, -0.154541015625, -0.1214599609375, -0.08837890625, -0.0552978515625, -0.022216796875, 0.0108642578125, 0.0439453125, 0.0770263671875, 0.110107421875, 0.1431884765625, 0.17626953125, 0.2093505859375, 0.242431640625, 0.2755126953125, 0.30859375, 0.3416748046875, 0.374755859375, 0.4078369140625, 0.44091796875, 0.4739990234375, 0.507080078125, 0.5401611328125, 0.5732421875, 0.6063232421875, 0.639404296875, 0.6724853515625, 0.70556640625, 0.7386474609375, 0.771728515625, 0.8048095703125, 0.837890625, 0.8709716796875, 0.904052734375, 0.9371337890625, 0.97021484375, 1.0032958984375, 1.036376953125, 1.0694580078125, 1.1025390625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 3.0, 12.0, 10.0, 4.0, 19.0, 14.0, 19.0, 26.0, 18.0, 22.0, 22.0, 31.0, 33.0, 40.0, 27.0, 58.0, 29.0, 48.0, 49.0, 39.0, 30.0, 42.0, 43.0, 41.0, 36.0, 37.0, 37.0, 33.0, 18.0, 21.0, 21.0, 15.0, 24.0, 13.0, 15.0, 13.0, 6.0, 6.0, 4.0, 9.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-55.38033676147461, -53.55709457397461, -51.73385238647461, -49.91061019897461, -48.08736801147461, -46.26412582397461, -44.440887451171875, -42.617645263671875, -40.794403076171875, -38.971160888671875, -37.147918701171875, -35.324676513671875, -33.501434326171875, -31.678192138671875, -29.854951858520508, -28.031709671020508, -26.208465576171875, -24.385223388671875, -22.561981201171875, -20.738739013671875, -18.915496826171875, -17.092254638671875, -15.269014358520508, -13.445772171020508, -11.622529983520508, -9.799287796020508, -7.976046085357666, -6.152804374694824, -4.329562187194824, -2.506319999694824, -0.6830787658691406, 1.1401634216308594, 2.9634056091308594, 4.786647796630859, 6.609889507293701, 8.433131217956543, 10.256373405456543, 12.079615592956543, 13.902856826782227, 15.726099014282227, 17.549341201782227, 19.372583389282227, 21.195825576782227, 23.019065856933594, 24.842308044433594, 26.665550231933594, 28.488792419433594, 30.312034606933594, 32.135276794433594, 33.958518981933594, 35.781761169433594, 37.605003356933594, 39.428245544433594, 41.251487731933594, 43.074729919433594, 44.897972106933594, 46.721214294433594, 48.544456481933594, 50.367698669433594, 52.190940856933594, 54.014183044433594, 55.837425231933594, 57.660667419433594, 59.483909606933594, 61.30714797973633]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 7.0, 10.0, 9.0, 12.0, 14.0, 18.0, 15.0, 22.0, 21.0, 19.0, 26.0, 34.0, 48.0, 34.0, 50.0, 49.0, 50.0, 53.0, 45.0, 57.0, 53.0, 32.0, 40.0, 24.0, 36.0, 36.0, 33.0, 13.0, 21.0, 27.0, 21.0, 18.0, 12.0, 14.0, 5.0, 4.0, 5.0, 5.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.64140319824219, -66.4472427368164, -64.25308227539062, -62.058921813964844, -59.86476135253906, -57.67060089111328, -55.4764404296875, -53.28227996826172, -51.08811950683594, -48.893959045410156, -46.699798583984375, -44.505638122558594, -42.31147766113281, -40.11731719970703, -37.92315673828125, -35.72899627685547, -33.53483581542969, -31.340675354003906, -29.146514892578125, -26.952354431152344, -24.758193969726562, -22.56403350830078, -20.369873046875, -18.17571258544922, -15.981552124023438, -13.787391662597656, -11.593231201171875, -9.399070739746094, -7.2049102783203125, -5.010749816894531, -2.81658935546875, -0.6224288940429688, 1.5717391967773438, 3.765899658203125, 5.960060119628906, 8.154220581054688, 10.348381042480469, 12.54254150390625, 14.736701965332031, 16.930862426757812, 19.125022888183594, 21.319183349609375, 23.513343811035156, 25.707504272460938, 27.90166473388672, 30.0958251953125, 32.28998565673828, 34.48414611816406, 36.678306579589844, 38.872467041015625, 41.066627502441406, 43.26078796386719, 45.45494842529297, 47.64910888671875, 49.84326934814453, 52.03742980957031, 54.231590270996094, 56.425750732421875, 58.619911193847656, 60.81407165527344, 63.00823211669922, 65.202392578125, 67.39655303955078, 69.59071350097656, 71.78487396240234]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 8.0, 13.0, 24.0, 25.0, 29.0, 46.0, 90.0, 129.0, 212.0, 346.0, 580.0, 894.0, 1339.0, 2063.0, 3184.0, 4697.0, 7297.0, 10661.0, 15494.0, 21968.0, 30123.0, 40381.0, 51593.0, 63610.0, 75477.0, 84733.0, 90799.0, 91530.0, 88087.0, 79538.0, 68016.0, 56747.0, 44721.0, 34137.0, 24851.0, 17738.0, 12511.0, 8646.0, 5731.0, 3692.0, 2449.0, 1595.0, 1008.0, 651.0, 409.0, 247.0, 160.0, 125.0, 63.0, 37.0, 18.0, 11.0, 9.0, 7.0, 4.0, 3.0, 3.0, 2.0], "bins": [-42.40625, -41.12890625, -39.8515625, -38.57421875, -37.296875, -36.01953125, -34.7421875, -33.46484375, -32.1875, -30.91015625, -29.6328125, -28.35546875, -27.078125, -25.80078125, -24.5234375, -23.24609375, -21.96875, -20.69140625, -19.4140625, -18.13671875, -16.859375, -15.58203125, -14.3046875, -13.02734375, -11.75, -10.47265625, -9.1953125, -7.91796875, -6.640625, -5.36328125, -4.0859375, -2.80859375, -1.53125, -0.25390625, 1.0234375, 2.30078125, 3.578125, 4.85546875, 6.1328125, 7.41015625, 8.6875, 9.96484375, 11.2421875, 12.51953125, 13.796875, 15.07421875, 16.3515625, 17.62890625, 18.90625, 20.18359375, 21.4609375, 22.73828125, 24.015625, 25.29296875, 26.5703125, 27.84765625, 29.125, 30.40234375, 31.6796875, 32.95703125, 34.234375, 35.51171875, 36.7890625, 38.06640625, 39.34375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 14.0, 9.0, 12.0, 11.0, 21.0, 8.0, 23.0, 23.0, 20.0, 23.0, 34.0, 44.0, 41.0, 44.0, 52.0, 48.0, 54.0, 48.0, 54.0, 47.0, 40.0, 38.0, 26.0, 37.0, 37.0, 31.0, 15.0, 23.0, 24.0, 20.0, 21.0, 10.0, 14.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.4375, -64.322265625, -62.20703125, -60.091796875, -57.9765625, -55.861328125, -53.74609375, -51.630859375, -49.515625, -47.400390625, -45.28515625, -43.169921875, -41.0546875, -38.939453125, -36.82421875, -34.708984375, -32.59375, -30.478515625, -28.36328125, -26.248046875, -24.1328125, -22.017578125, -19.90234375, -17.787109375, -15.671875, -13.556640625, -11.44140625, -9.326171875, -7.2109375, -5.095703125, -2.98046875, -0.865234375, 1.25, 3.365234375, 5.48046875, 7.595703125, 9.7109375, 11.826171875, 13.94140625, 16.056640625, 18.171875, 20.287109375, 22.40234375, 24.517578125, 26.6328125, 28.748046875, 30.86328125, 32.978515625, 35.09375, 37.208984375, 39.32421875, 41.439453125, 43.5546875, 45.669921875, 47.78515625, 49.900390625, 52.015625, 54.130859375, 56.24609375, 58.361328125, 60.4765625, 62.591796875, 64.70703125, 66.822265625, 68.9375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 17.0, 21.0, 29.0, 53.0, 77.0, 118.0, 225.0, 288.0, 487.0, 761.0, 1279.0, 1951.0, 3001.0, 4818.0, 7415.0, 11288.0, 16811.0, 24220.0, 34115.0, 46992.0, 61471.0, 76301.0, 88742.0, 98193.0, 100575.0, 97178.0, 87484.0, 74515.0, 59920.0, 46068.0, 33728.0, 23543.0, 16018.0, 10990.0, 7156.0, 4562.0, 3006.0, 1872.0, 1176.0, 814.0, 470.0, 318.0, 178.0, 99.0, 78.0, 49.0, 34.0, 22.0, 9.0, 9.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-43.53125, -42.1474609375, -40.763671875, -39.3798828125, -37.99609375, -36.6123046875, -35.228515625, -33.8447265625, -32.4609375, -31.0771484375, -29.693359375, -28.3095703125, -26.92578125, -25.5419921875, -24.158203125, -22.7744140625, -21.390625, -20.0068359375, -18.623046875, -17.2392578125, -15.85546875, -14.4716796875, -13.087890625, -11.7041015625, -10.3203125, -8.9365234375, -7.552734375, -6.1689453125, -4.78515625, -3.4013671875, -2.017578125, -0.6337890625, 0.75, 2.1337890625, 3.517578125, 4.9013671875, 6.28515625, 7.6689453125, 9.052734375, 10.4365234375, 11.8203125, 13.2041015625, 14.587890625, 15.9716796875, 17.35546875, 18.7392578125, 20.123046875, 21.5068359375, 22.890625, 24.2744140625, 25.658203125, 27.0419921875, 28.42578125, 29.8095703125, 31.193359375, 32.5771484375, 33.9609375, 35.3447265625, 36.728515625, 38.1123046875, 39.49609375, 40.8798828125, 42.263671875, 43.6474609375, 45.03125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 6.0, 5.0, 6.0, 12.0, 19.0, 14.0, 23.0, 25.0, 38.0, 35.0, 36.0, 49.0, 45.0, 55.0, 59.0, 54.0, 54.0, 52.0, 45.0, 49.0, 44.0, 34.0, 40.0, 45.0, 39.0, 22.0, 18.0, 14.0, 16.0, 9.0, 11.0, 5.0, 4.0, 2.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.71875, -50.111328125, -48.50390625, -46.896484375, -45.2890625, -43.681640625, -42.07421875, -40.466796875, -38.859375, -37.251953125, -35.64453125, -34.037109375, -32.4296875, -30.822265625, -29.21484375, -27.607421875, -26.0, -24.392578125, -22.78515625, -21.177734375, -19.5703125, -17.962890625, -16.35546875, -14.748046875, -13.140625, -11.533203125, -9.92578125, -8.318359375, -6.7109375, -5.103515625, -3.49609375, -1.888671875, -0.28125, 1.326171875, 2.93359375, 4.541015625, 6.1484375, 7.755859375, 9.36328125, 10.970703125, 12.578125, 14.185546875, 15.79296875, 17.400390625, 19.0078125, 20.615234375, 22.22265625, 23.830078125, 25.4375, 27.044921875, 28.65234375, 30.259765625, 31.8671875, 33.474609375, 35.08203125, 36.689453125, 38.296875, 39.904296875, 41.51171875, 43.119140625, 44.7265625, 46.333984375, 47.94140625, 49.548828125, 51.15625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 8.0, 14.0, 22.0, 38.0, 58.0, 85.0, 132.0, 235.0, 315.0, 513.0, 913.0, 1517.0, 2534.0, 4281.0, 6962.0, 11518.0, 18253.0, 28655.0, 43167.0, 62105.0, 83495.0, 103356.0, 118686.0, 122406.0, 113826.0, 96462.0, 74870.0, 53835.0, 36811.0, 24170.0, 15287.0, 9507.0, 5800.0, 3416.0, 2143.0, 1209.0, 730.0, 462.0, 278.0, 179.0, 109.0, 67.0, 41.0, 28.0, 21.0, 13.0, 9.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.15869140625, -18.5048828125, -17.85107421875, -17.197265625, -16.54345703125, -15.8896484375, -15.23583984375, -14.58203125, -13.92822265625, -13.2744140625, -12.62060546875, -11.966796875, -11.31298828125, -10.6591796875, -10.00537109375, -9.3515625, -8.69775390625, -8.0439453125, -7.39013671875, -6.736328125, -6.08251953125, -5.4287109375, -4.77490234375, -4.12109375, -3.46728515625, -2.8134765625, -2.15966796875, -1.505859375, -0.85205078125, -0.1982421875, 0.45556640625, 1.109375, 1.76318359375, 2.4169921875, 3.07080078125, 3.724609375, 4.37841796875, 5.0322265625, 5.68603515625, 6.33984375, 6.99365234375, 7.6474609375, 8.30126953125, 8.955078125, 9.60888671875, 10.2626953125, 10.91650390625, 11.5703125, 12.22412109375, 12.8779296875, 13.53173828125, 14.185546875, 14.83935546875, 15.4931640625, 16.14697265625, 16.80078125, 17.45458984375, 18.1083984375, 18.76220703125, 19.416015625, 20.06982421875, 20.7236328125, 21.37744140625, 22.03125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 10.0, 5.0, 15.0, 14.0, 11.0, 18.0, 24.0, 28.0, 26.0, 32.0, 33.0, 38.0, 45.0, 46.0, 48.0, 53.0, 48.0, 47.0, 47.0, 39.0, 43.0, 50.0, 37.0, 36.0, 20.0, 31.0, 23.0, 22.0, 20.0, 9.0, 11.0, 10.0, 8.0, 5.0, 6.0, 8.0, 6.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.002513885498046875, -0.002439558506011963, -0.0023652315139770508, -0.0022909045219421387, -0.0022165775299072266, -0.0021422505378723145, -0.0020679235458374023, -0.0019935965538024902, -0.0019192695617675781, -0.001844942569732666, -0.001770615577697754, -0.0016962885856628418, -0.0016219615936279297, -0.0015476346015930176, -0.0014733076095581055, -0.0013989806175231934, -0.0013246536254882812, -0.0012503266334533691, -0.001175999641418457, -0.001101672649383545, -0.0010273456573486328, -0.0009530186653137207, -0.0008786916732788086, -0.0008043646812438965, -0.0007300376892089844, -0.0006557106971740723, -0.0005813837051391602, -0.000507056713104248, -0.00043272972106933594, -0.00035840272903442383, -0.0002840757369995117, -0.0002097487449645996, -0.0001354217529296875, -6.109476089477539e-05, 1.3232231140136719e-05, 8.755922317504883e-05, 0.00016188621520996094, 0.00023621320724487305, 0.00031054019927978516, 0.00038486719131469727, 0.0004591941833496094, 0.0005335211753845215, 0.0006078481674194336, 0.0006821751594543457, 0.0007565021514892578, 0.0008308291435241699, 0.000905156135559082, 0.0009794831275939941, 0.0010538101196289062, 0.0011281371116638184, 0.0012024641036987305, 0.0012767910957336426, 0.0013511180877685547, 0.0014254450798034668, 0.001499772071838379, 0.001574099063873291, 0.0016484260559082031, 0.0017227530479431152, 0.0017970800399780273, 0.0018714070320129395, 0.0019457340240478516, 0.0020200610160827637, 0.0020943880081176758, 0.002168715000152588, 0.0022430419921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 10.0, 12.0, 30.0, 42.0, 66.0, 78.0, 140.0, 184.0, 326.0, 497.0, 731.0, 1142.0, 1761.0, 2695.0, 4207.0, 6469.0, 9805.0, 14688.0, 21966.0, 32010.0, 44478.0, 60519.0, 77594.0, 93598.0, 104777.0, 108160.0, 103839.0, 91634.0, 74998.0, 58021.0, 42679.0, 30336.0, 20854.0, 14099.0, 8991.0, 5948.0, 3856.0, 2576.0, 1673.0, 1083.0, 725.0, 426.0, 284.0, 183.0, 115.0, 88.0, 61.0, 28.0, 24.0, 11.0, 15.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-19.265625, -18.652587890625, -18.03955078125, -17.426513671875, -16.8134765625, -16.200439453125, -15.58740234375, -14.974365234375, -14.361328125, -13.748291015625, -13.13525390625, -12.522216796875, -11.9091796875, -11.296142578125, -10.68310546875, -10.070068359375, -9.45703125, -8.843994140625, -8.23095703125, -7.617919921875, -7.0048828125, -6.391845703125, -5.77880859375, -5.165771484375, -4.552734375, -3.939697265625, -3.32666015625, -2.713623046875, -2.1005859375, -1.487548828125, -0.87451171875, -0.261474609375, 0.3515625, 0.964599609375, 1.57763671875, 2.190673828125, 2.8037109375, 3.416748046875, 4.02978515625, 4.642822265625, 5.255859375, 5.868896484375, 6.48193359375, 7.094970703125, 7.7080078125, 8.321044921875, 8.93408203125, 9.547119140625, 10.16015625, 10.773193359375, 11.38623046875, 11.999267578125, 12.6123046875, 13.225341796875, 13.83837890625, 14.451416015625, 15.064453125, 15.677490234375, 16.29052734375, 16.903564453125, 17.5166015625, 18.129638671875, 18.74267578125, 19.355712890625, 19.96875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 2.0, 14.0, 12.0, 4.0, 17.0, 28.0, 26.0, 20.0, 24.0, 37.0, 47.0, 45.0, 42.0, 53.0, 50.0, 54.0, 48.0, 43.0, 54.0, 45.0, 38.0, 41.0, 42.0, 29.0, 27.0, 25.0, 24.0, 19.0, 21.0, 11.0, 9.0, 12.0, 5.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-10.4375, -10.1297607421875, -9.822021484375, -9.5142822265625, -9.20654296875, -8.8988037109375, -8.591064453125, -8.2833251953125, -7.9755859375, -7.6678466796875, -7.360107421875, -7.0523681640625, -6.74462890625, -6.4368896484375, -6.129150390625, -5.8214111328125, -5.513671875, -5.2059326171875, -4.898193359375, -4.5904541015625, -4.28271484375, -3.9749755859375, -3.667236328125, -3.3594970703125, -3.0517578125, -2.7440185546875, -2.436279296875, -2.1285400390625, -1.82080078125, -1.5130615234375, -1.205322265625, -0.8975830078125, -0.58984375, -0.2821044921875, 0.025634765625, 0.3333740234375, 0.64111328125, 0.9488525390625, 1.256591796875, 1.5643310546875, 1.8720703125, 2.1798095703125, 2.487548828125, 2.7952880859375, 3.10302734375, 3.4107666015625, 3.718505859375, 4.0262451171875, 4.333984375, 4.6417236328125, 4.949462890625, 5.2572021484375, 5.56494140625, 5.8726806640625, 6.180419921875, 6.4881591796875, 6.7958984375, 7.1036376953125, 7.411376953125, 7.7191162109375, 8.02685546875, 8.3345947265625, 8.642333984375, 8.9500732421875, 9.2578125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 7.0, 5.0, 5.0, 6.0, 6.0, 7.0, 11.0, 13.0, 18.0, 10.0, 22.0, 17.0, 22.0, 24.0, 24.0, 26.0, 24.0, 32.0, 29.0, 33.0, 30.0, 34.0, 45.0, 39.0, 37.0, 33.0, 41.0, 29.0, 41.0, 35.0, 30.0, 32.0, 28.0, 22.0, 19.0, 14.0, 25.0, 15.0, 18.0, 13.0, 16.0, 11.0, 20.0, 8.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.57626724243164, -46.00093078613281, -44.425594329833984, -42.850257873535156, -41.274925231933594, -39.699588775634766, -38.12425231933594, -36.54891586303711, -34.97357940673828, -33.39824295043945, -31.822908401489258, -30.24757194519043, -28.6722354888916, -27.096900939941406, -25.521564483642578, -23.94622802734375, -22.370893478393555, -20.795557022094727, -19.22022247314453, -17.644886016845703, -16.069549560546875, -14.494214057922363, -12.918878555297852, -11.343542098999023, -9.768206596374512, -8.19287109375, -6.617534637451172, -5.04219913482666, -3.4668631553649902, -1.8915271759033203, -0.3161916732788086, 1.2591447830200195, 2.8344802856445312, 4.409816265106201, 5.985152244567871, 7.560487747192383, 9.135824203491211, 10.711159706115723, 12.286495208740234, 13.861831665039062, 15.437167167663574, 17.012502670288086, 18.587839126586914, 20.16317367553711, 21.738510131835938, 23.313846588134766, 24.889183044433594, 26.464519500732422, 28.039854049682617, 29.615190505981445, 31.19052505493164, 32.76586151123047, 34.3411979675293, 35.916534423828125, 37.49186706542969, 39.06720733642578, 40.642539978027344, 42.21787643432617, 43.793212890625, 45.36854553222656, 46.94388198852539, 48.51921844482422, 50.09455490112305, 51.669891357421875, 53.2452278137207]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 4.0, 10.0, 14.0, 10.0, 18.0, 14.0, 16.0, 34.0, 18.0, 31.0, 32.0, 37.0, 30.0, 41.0, 38.0, 44.0, 37.0, 34.0, 56.0, 47.0, 50.0, 33.0, 41.0, 41.0, 37.0, 37.0, 24.0, 25.0, 20.0, 18.0, 15.0, 16.0, 9.0, 11.0, 8.0, 9.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.180599212646484, -61.082515716552734, -58.984432220458984, -56.8863525390625, -54.78826904296875, -52.690185546875, -50.59210205078125, -48.4940185546875, -46.39593505859375, -44.2978515625, -42.19976806640625, -40.1016845703125, -38.003604888916016, -35.905521392822266, -33.807437896728516, -31.709354400634766, -29.61127471923828, -27.51319122314453, -25.415109634399414, -23.317026138305664, -21.218944549560547, -19.120861053466797, -17.022777557373047, -14.924695014953613, -12.82661247253418, -10.728529930114746, -8.630447387695312, -6.5323638916015625, -4.434281349182129, -2.3361988067626953, -0.2381153106689453, 1.8599672317504883, 3.9580459594726562, 6.05612850189209, 8.154211044311523, 10.252294540405273, 12.350377082824707, 14.44845962524414, 16.54654312133789, 18.64462661743164, 20.742708206176758, 22.840791702270508, 24.938873291015625, 27.036956787109375, 29.135040283203125, 31.233121871948242, 33.331207275390625, 35.42928695678711, 37.52737045288086, 39.62545394897461, 41.72353744506836, 43.821617126464844, 45.919700622558594, 48.017784118652344, 50.115867614746094, 52.213951110839844, 54.312034606933594, 56.410118103027344, 58.508201599121094, 60.606285095214844, 62.70436477661133, 64.80244445800781, 66.90052795410156, 68.99861145019531, 71.09669494628906]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 13.0, 21.0, 38.0, 60.0, 101.0, 162.0, 283.0, 471.0, 759.0, 1238.0, 2002.0, 3271.0, 5274.0, 8580.0, 13781.0, 21449.0, 33350.0, 50604.0, 75652.0, 111510.0, 158367.0, 216735.0, 281654.0, 346194.0, 398288.0, 424198.0, 419881.0, 385390.0, 328748.0, 263344.0, 199960.0, 144467.0, 101911.0, 68613.0, 45374.0, 30139.0, 19355.0, 12284.0, 7931.0, 4881.0, 3061.0, 1855.0, 1169.0, 733.0, 429.0, 265.0, 168.0, 96.0, 67.0, 42.0, 28.0, 12.0, 11.0, 8.0, 5.0, 3.0, 0.0, 3.0], "bins": [-43.1875, -41.83251953125, -40.4775390625, -39.12255859375, -37.767578125, -36.41259765625, -35.0576171875, -33.70263671875, -32.34765625, -30.99267578125, -29.6376953125, -28.28271484375, -26.927734375, -25.57275390625, -24.2177734375, -22.86279296875, -21.5078125, -20.15283203125, -18.7978515625, -17.44287109375, -16.087890625, -14.73291015625, -13.3779296875, -12.02294921875, -10.66796875, -9.31298828125, -7.9580078125, -6.60302734375, -5.248046875, -3.89306640625, -2.5380859375, -1.18310546875, 0.171875, 1.52685546875, 2.8818359375, 4.23681640625, 5.591796875, 6.94677734375, 8.3017578125, 9.65673828125, 11.01171875, 12.36669921875, 13.7216796875, 15.07666015625, 16.431640625, 17.78662109375, 19.1416015625, 20.49658203125, 21.8515625, 23.20654296875, 24.5615234375, 25.91650390625, 27.271484375, 28.62646484375, 29.9814453125, 31.33642578125, 32.69140625, 34.04638671875, 35.4013671875, 36.75634765625, 38.111328125, 39.46630859375, 40.8212890625, 42.17626953125, 43.53125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 11.0, 6.0, 6.0, 11.0, 13.0, 11.0, 18.0, 13.0, 22.0, 30.0, 25.0, 35.0, 29.0, 30.0, 31.0, 47.0, 38.0, 38.0, 31.0, 45.0, 52.0, 45.0, 48.0, 40.0, 43.0, 33.0, 37.0, 33.0, 27.0, 21.0, 18.0, 19.0, 19.0, 13.0, 11.0, 6.0, 9.0, 8.0, 5.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-56.0, -54.1796875, -52.359375, -50.5390625, -48.71875, -46.8984375, -45.078125, -43.2578125, -41.4375, -39.6171875, -37.796875, -35.9765625, -34.15625, -32.3359375, -30.515625, -28.6953125, -26.875, -25.0546875, -23.234375, -21.4140625, -19.59375, -17.7734375, -15.953125, -14.1328125, -12.3125, -10.4921875, -8.671875, -6.8515625, -5.03125, -3.2109375, -1.390625, 0.4296875, 2.25, 4.0703125, 5.890625, 7.7109375, 9.53125, 11.3515625, 13.171875, 14.9921875, 16.8125, 18.6328125, 20.453125, 22.2734375, 24.09375, 25.9140625, 27.734375, 29.5546875, 31.375, 33.1953125, 35.015625, 36.8359375, 38.65625, 40.4765625, 42.296875, 44.1171875, 45.9375, 47.7578125, 49.578125, 51.3984375, 53.21875, 55.0390625, 56.859375, 58.6796875, 60.5]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 12.0, 27.0, 33.0, 53.0, 102.0, 169.0, 323.0, 490.0, 890.0, 1513.0, 2478.0, 4184.0, 6783.0, 11356.0, 18283.0, 28719.0, 44732.0, 66945.0, 97496.0, 139459.0, 190665.0, 248387.0, 307323.0, 359410.0, 395469.0, 406839.0, 390484.0, 354055.0, 297747.0, 238975.0, 181915.0, 132655.0, 92836.0, 62686.0, 41319.0, 26673.0, 16537.0, 10394.0, 6355.0, 3792.0, 2358.0, 1380.0, 840.0, 486.0, 270.0, 167.0, 79.0, 71.0, 32.0, 18.0, 10.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.9375, -42.4931640625, -41.048828125, -39.6044921875, -38.16015625, -36.7158203125, -35.271484375, -33.8271484375, -32.3828125, -30.9384765625, -29.494140625, -28.0498046875, -26.60546875, -25.1611328125, -23.716796875, -22.2724609375, -20.828125, -19.3837890625, -17.939453125, -16.4951171875, -15.05078125, -13.6064453125, -12.162109375, -10.7177734375, -9.2734375, -7.8291015625, -6.384765625, -4.9404296875, -3.49609375, -2.0517578125, -0.607421875, 0.8369140625, 2.28125, 3.7255859375, 5.169921875, 6.6142578125, 8.05859375, 9.5029296875, 10.947265625, 12.3916015625, 13.8359375, 15.2802734375, 16.724609375, 18.1689453125, 19.61328125, 21.0576171875, 22.501953125, 23.9462890625, 25.390625, 26.8349609375, 28.279296875, 29.7236328125, 31.16796875, 32.6123046875, 34.056640625, 35.5009765625, 36.9453125, 38.3896484375, 39.833984375, 41.2783203125, 42.72265625, 44.1669921875, 45.611328125, 47.0556640625, 48.5]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 2.0, 6.0, 14.0, 20.0, 18.0, 35.0, 29.0, 54.0, 55.0, 95.0, 90.0, 120.0, 142.0, 150.0, 163.0, 201.0, 207.0, 246.0, 215.0, 253.0, 220.0, 253.0, 204.0, 203.0, 176.0, 169.0, 151.0, 109.0, 111.0, 89.0, 66.0, 58.0, 38.0, 36.0, 22.0, 11.0, 11.0, 9.0, 9.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.890625, -28.948974609375, -28.00732421875, -27.065673828125, -26.1240234375, -25.182373046875, -24.24072265625, -23.299072265625, -22.357421875, -21.415771484375, -20.47412109375, -19.532470703125, -18.5908203125, -17.649169921875, -16.70751953125, -15.765869140625, -14.82421875, -13.882568359375, -12.94091796875, -11.999267578125, -11.0576171875, -10.115966796875, -9.17431640625, -8.232666015625, -7.291015625, -6.349365234375, -5.40771484375, -4.466064453125, -3.5244140625, -2.582763671875, -1.64111328125, -0.699462890625, 0.2421875, 1.183837890625, 2.12548828125, 3.067138671875, 4.0087890625, 4.950439453125, 5.89208984375, 6.833740234375, 7.775390625, 8.717041015625, 9.65869140625, 10.600341796875, 11.5419921875, 12.483642578125, 13.42529296875, 14.366943359375, 15.30859375, 16.250244140625, 17.19189453125, 18.133544921875, 19.0751953125, 20.016845703125, 20.95849609375, 21.900146484375, 22.841796875, 23.783447265625, 24.72509765625, 25.666748046875, 26.6083984375, 27.550048828125, 28.49169921875, 29.433349609375, 30.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 6.0, 8.0, 7.0, 7.0, 16.0, 9.0, 12.0, 23.0, 21.0, 26.0, 23.0, 24.0, 30.0, 44.0, 38.0, 42.0, 41.0, 38.0, 41.0, 36.0, 45.0, 33.0, 36.0, 40.0, 41.0, 28.0, 27.0, 29.0, 24.0, 33.0, 28.0, 16.0, 10.0, 15.0, 21.0, 15.0, 14.0, 9.0, 5.0, 7.0, 6.0, 3.0, 8.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.45366668701172, -50.6524772644043, -48.85129165649414, -47.05010223388672, -45.2489128112793, -43.447723388671875, -41.64653778076172, -39.8453483581543, -38.044158935546875, -36.24296951293945, -34.4417839050293, -32.640594482421875, -30.839405059814453, -29.038217544555664, -27.237030029296875, -25.435840606689453, -23.634653091430664, -21.833465576171875, -20.032276153564453, -18.231088638305664, -16.429899215698242, -14.628711700439453, -12.827523231506348, -11.026334762573242, -9.225146293640137, -7.423957824707031, -5.622769355773926, -3.8215813636779785, -2.020392894744873, -0.21920490264892578, 1.5819835662841797, 3.383172035217285, 5.184360504150391, 6.985548973083496, 8.786737442016602, 10.58792495727539, 12.389114379882812, 14.190301895141602, 15.991490364074707, 17.792678833007812, 19.593868255615234, 21.395055770874023, 23.196245193481445, 24.997432708740234, 26.798622131347656, 28.599809646606445, 30.400997161865234, 32.202186584472656, 34.00337219238281, 35.804561614990234, 37.60574722290039, 39.40693664550781, 41.208126068115234, 43.009315490722656, 44.81050109863281, 46.611690521240234, 48.412879943847656, 50.21406936645508, 52.015254974365234, 53.816444396972656, 55.61763381958008, 57.4188232421875, 59.220008850097656, 61.02119827270508, 62.8223876953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 9.0, 7.0, 11.0, 12.0, 12.0, 19.0, 18.0, 19.0, 16.0, 23.0, 33.0, 36.0, 30.0, 36.0, 27.0, 40.0, 47.0, 36.0, 43.0, 28.0, 33.0, 48.0, 46.0, 33.0, 38.0, 43.0, 28.0, 31.0, 31.0, 23.0, 26.0, 15.0, 13.0, 13.0, 13.0, 9.0, 11.0, 8.0, 5.0, 9.0, 1.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-59.35512924194336, -57.40300750732422, -55.45088195800781, -53.49876022338867, -51.54663848876953, -49.594512939453125, -47.642391204833984, -45.690269470214844, -43.73814392089844, -41.7860221862793, -39.83389663696289, -37.88177490234375, -35.92965316772461, -33.97753143310547, -32.02540588378906, -30.073284149169922, -28.12116241455078, -26.169038772583008, -24.216917037963867, -22.264793395996094, -20.312671661376953, -18.36054801940918, -16.408424377441406, -14.45630168914795, -12.504179000854492, -10.552056312561035, -8.599933624267578, -6.647809982299805, -4.695687294006348, -2.7435646057128906, -0.7914409637451172, 1.1606817245483398, 3.1128082275390625, 5.0649309158325195, 7.017054080963135, 8.96917724609375, 10.921299934387207, 12.873422622680664, 14.825546264648438, 16.777667999267578, 18.72979164123535, 20.681915283203125, 22.634037017822266, 24.58616065979004, 26.538284301757812, 28.490406036376953, 30.442529678344727, 32.3946533203125, 34.34677505493164, 36.29889678955078, 38.25102233886719, 40.20314407348633, 42.15526580810547, 44.107391357421875, 46.059513092041016, 48.011634826660156, 49.96376037597656, 51.9158821105957, 53.86800765991211, 55.82012939453125, 57.77225112915039, 59.72437286376953, 61.67649841308594, 63.62862014770508, 65.58074188232422]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 3.0, 14.0, 17.0, 34.0, 60.0, 80.0, 124.0, 213.0, 316.0, 551.0, 890.0, 1403.0, 2415.0, 3822.0, 6190.0, 10068.0, 15631.0, 24099.0, 36110.0, 52881.0, 73214.0, 95966.0, 115330.0, 124420.0, 119704.0, 103653.0, 81756.0, 59845.0, 41990.0, 28283.0, 18457.0, 11608.0, 7405.0, 4586.0, 2902.0, 1713.0, 1056.0, 696.0, 404.0, 228.0, 166.0, 79.0, 68.0, 36.0, 27.0, 20.0, 7.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.15625, -13.70947265625, -13.2626953125, -12.81591796875, -12.369140625, -11.92236328125, -11.4755859375, -11.02880859375, -10.58203125, -10.13525390625, -9.6884765625, -9.24169921875, -8.794921875, -8.34814453125, -7.9013671875, -7.45458984375, -7.0078125, -6.56103515625, -6.1142578125, -5.66748046875, -5.220703125, -4.77392578125, -4.3271484375, -3.88037109375, -3.43359375, -2.98681640625, -2.5400390625, -2.09326171875, -1.646484375, -1.19970703125, -0.7529296875, -0.30615234375, 0.140625, 0.58740234375, 1.0341796875, 1.48095703125, 1.927734375, 2.37451171875, 2.8212890625, 3.26806640625, 3.71484375, 4.16162109375, 4.6083984375, 5.05517578125, 5.501953125, 5.94873046875, 6.3955078125, 6.84228515625, 7.2890625, 7.73583984375, 8.1826171875, 8.62939453125, 9.076171875, 9.52294921875, 9.9697265625, 10.41650390625, 10.86328125, 11.31005859375, 11.7568359375, 12.20361328125, 12.650390625, 13.09716796875, 13.5439453125, 13.99072265625, 14.4375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 8.0, 8.0, 11.0, 10.0, 13.0, 18.0, 19.0, 20.0, 17.0, 18.0, 39.0, 35.0, 30.0, 35.0, 28.0, 39.0, 47.0, 40.0, 38.0, 29.0, 35.0, 48.0, 45.0, 39.0, 31.0, 44.0, 30.0, 31.0, 29.0, 26.0, 22.0, 18.0, 12.0, 14.0, 11.0, 10.0, 11.0, 8.0, 3.0, 9.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-59.65625, -57.69384765625, -55.7314453125, -53.76904296875, -51.806640625, -49.84423828125, -47.8818359375, -45.91943359375, -43.95703125, -41.99462890625, -40.0322265625, -38.06982421875, -36.107421875, -34.14501953125, -32.1826171875, -30.22021484375, -28.2578125, -26.29541015625, -24.3330078125, -22.37060546875, -20.408203125, -18.44580078125, -16.4833984375, -14.52099609375, -12.55859375, -10.59619140625, -8.6337890625, -6.67138671875, -4.708984375, -2.74658203125, -0.7841796875, 1.17822265625, 3.140625, 5.10302734375, 7.0654296875, 9.02783203125, 10.990234375, 12.95263671875, 14.9150390625, 16.87744140625, 18.83984375, 20.80224609375, 22.7646484375, 24.72705078125, 26.689453125, 28.65185546875, 30.6142578125, 32.57666015625, 34.5390625, 36.50146484375, 38.4638671875, 40.42626953125, 42.388671875, 44.35107421875, 46.3134765625, 48.27587890625, 50.23828125, 52.20068359375, 54.1630859375, 56.12548828125, 58.087890625, 60.05029296875, 62.0126953125, 63.97509765625, 65.9375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 4.0, 5.0, 4.0, 3.0, 11.0, 7.0, 14.0, 24.0, 20.0, 39.0, 59.0, 87.0, 108.0, 163.0, 240.0, 439.0, 639.0, 1174.0, 1999.0, 3646.0, 6865.0, 13202.0, 26368.0, 129229.0, 792977.0, 35183.0, 16627.0, 8642.0, 4587.0, 2511.0, 1422.0, 845.0, 502.0, 306.0, 185.0, 131.0, 81.0, 50.0, 46.0, 31.0, 27.0, 16.0, 7.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-60.625, -58.7412109375, -56.857421875, -54.9736328125, -53.08984375, -51.2060546875, -49.322265625, -47.4384765625, -45.5546875, -43.6708984375, -41.787109375, -39.9033203125, -38.01953125, -36.1357421875, -34.251953125, -32.3681640625, -30.484375, -28.6005859375, -26.716796875, -24.8330078125, -22.94921875, -21.0654296875, -19.181640625, -17.2978515625, -15.4140625, -13.5302734375, -11.646484375, -9.7626953125, -7.87890625, -5.9951171875, -4.111328125, -2.2275390625, -0.34375, 1.5400390625, 3.423828125, 5.3076171875, 7.19140625, 9.0751953125, 10.958984375, 12.8427734375, 14.7265625, 16.6103515625, 18.494140625, 20.3779296875, 22.26171875, 24.1455078125, 26.029296875, 27.9130859375, 29.796875, 31.6806640625, 33.564453125, 35.4482421875, 37.33203125, 39.2158203125, 41.099609375, 42.9833984375, 44.8671875, 46.7509765625, 48.634765625, 50.5185546875, 52.40234375, 54.2861328125, 56.169921875, 58.0537109375, 59.9375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 9.0, 6.0, 12.0, 8.0, 12.0, 10.0, 9.0, 14.0, 21.0, 21.0, 30.0, 26.0, 38.0, 43.0, 35.0, 37.0, 32.0, 52.0, 44.0, 42.0, 45.0, 40.0, 45.0, 48.0, 34.0, 34.0, 31.0, 35.0, 18.0, 28.0, 18.0, 20.0, 15.0, 15.0, 17.0, 9.0, 11.0, 5.0, 6.0, 6.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.25, -42.8720703125, -41.494140625, -40.1162109375, -38.73828125, -37.3603515625, -35.982421875, -34.6044921875, -33.2265625, -31.8486328125, -30.470703125, -29.0927734375, -27.71484375, -26.3369140625, -24.958984375, -23.5810546875, -22.203125, -20.8251953125, -19.447265625, -18.0693359375, -16.69140625, -15.3134765625, -13.935546875, -12.5576171875, -11.1796875, -9.8017578125, -8.423828125, -7.0458984375, -5.66796875, -4.2900390625, -2.912109375, -1.5341796875, -0.15625, 1.2216796875, 2.599609375, 3.9775390625, 5.35546875, 6.7333984375, 8.111328125, 9.4892578125, 10.8671875, 12.2451171875, 13.623046875, 15.0009765625, 16.37890625, 17.7568359375, 19.134765625, 20.5126953125, 21.890625, 23.2685546875, 24.646484375, 26.0244140625, 27.40234375, 28.7802734375, 30.158203125, 31.5361328125, 32.9140625, 34.2919921875, 35.669921875, 37.0478515625, 38.42578125, 39.8037109375, 41.181640625, 42.5595703125, 43.9375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 7.0, 2.0, 16.0, 13.0, 19.0, 28.0, 33.0, 48.0, 77.0, 89.0, 155.0, 211.0, 281.0, 489.0, 751.0, 1220.0, 2022.0, 3565.0, 5928.0, 10030.0, 18880.0, 38460.0, 779718.0, 126165.0, 26697.0, 14171.0, 7758.0, 4594.0, 2651.0, 1598.0, 953.0, 608.0, 423.0, 267.0, 174.0, 132.0, 93.0, 66.0, 36.0, 34.0, 25.0, 17.0, 16.0, 11.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.078125, -2.981231689453125, -2.88433837890625, -2.787445068359375, -2.6905517578125, -2.593658447265625, -2.49676513671875, -2.399871826171875, -2.302978515625, -2.206085205078125, -2.10919189453125, -2.012298583984375, -1.9154052734375, -1.818511962890625, -1.72161865234375, -1.624725341796875, -1.52783203125, -1.430938720703125, -1.33404541015625, -1.237152099609375, -1.1402587890625, -1.043365478515625, -0.94647216796875, -0.849578857421875, -0.752685546875, -0.655792236328125, -0.55889892578125, -0.462005615234375, -0.3651123046875, -0.268218994140625, -0.17132568359375, -0.074432373046875, 0.0224609375, 0.119354248046875, 0.21624755859375, 0.313140869140625, 0.4100341796875, 0.506927490234375, 0.60382080078125, 0.700714111328125, 0.797607421875, 0.894500732421875, 0.99139404296875, 1.088287353515625, 1.1851806640625, 1.282073974609375, 1.37896728515625, 1.475860595703125, 1.57275390625, 1.669647216796875, 1.76654052734375, 1.863433837890625, 1.9603271484375, 2.057220458984375, 2.15411376953125, 2.251007080078125, 2.347900390625, 2.444793701171875, 2.54168701171875, 2.638580322265625, 2.7354736328125, 2.832366943359375, 2.92926025390625, 3.026153564453125, 3.123046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 5.0, 6.0, 11.0, 13.0, 12.0, 15.0, 21.0, 24.0, 40.0, 51.0, 60.0, 60.0, 76.0, 69.0, 48.0, 80.0, 82.0, 57.0, 52.0, 42.0, 32.0, 31.0, 22.0, 10.0, 19.0, 10.0, 10.0, 9.0, 6.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001575946807861328, -0.0001520290970802307, -0.0001464635133743286, -0.00014089792966842651, -0.00013533234596252441, -0.00012976676225662231, -0.00012420117855072021, -0.00011863559484481812, -0.00011307001113891602, -0.00010750442743301392, -0.00010193884372711182, -9.637326002120972e-05, -9.080767631530762e-05, -8.524209260940552e-05, -7.967650890350342e-05, -7.411092519760132e-05, -6.854534149169922e-05, -6.297975778579712e-05, -5.741417407989502e-05, -5.184859037399292e-05, -4.628300666809082e-05, -4.071742296218872e-05, -3.515183925628662e-05, -2.958625555038452e-05, -2.4020671844482422e-05, -1.8455088138580322e-05, -1.2889504432678223e-05, -7.323920726776123e-06, -1.7583370208740234e-06, 3.807246685028076e-06, 9.372830390930176e-06, 1.4938414096832275e-05, 2.0503997802734375e-05, 2.6069581508636475e-05, 3.1635165214538574e-05, 3.7200748920440674e-05, 4.2766332626342773e-05, 4.833191633224487e-05, 5.389750003814697e-05, 5.946308374404907e-05, 6.502866744995117e-05, 7.059425115585327e-05, 7.615983486175537e-05, 8.172541856765747e-05, 8.729100227355957e-05, 9.285658597946167e-05, 9.842216968536377e-05, 0.00010398775339126587, 0.00010955333709716797, 0.00011511892080307007, 0.00012068450450897217, 0.00012625008821487427, 0.00013181567192077637, 0.00013738125562667847, 0.00014294683933258057, 0.00014851242303848267, 0.00015407800674438477, 0.00015964359045028687, 0.00016520917415618896, 0.00017077475786209106, 0.00017634034156799316, 0.00018190592527389526, 0.00018747150897979736, 0.00019303709268569946, 0.00019860267639160156]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 8.0, 8.0, 18.0, 17.0, 34.0, 59.0, 85.0, 115.0, 218.0, 352.0, 536.0, 769.0, 1219.0, 1936.0, 3008.0, 4623.0, 7230.0, 11011.0, 16365.0, 23813.0, 34252.0, 48244.0, 64622.0, 82775.0, 100291.0, 112705.0, 113801.0, 103428.0, 86222.0, 67624.0, 50612.0, 36157.0, 25641.0, 17367.0, 11588.0, 7730.0, 5008.0, 3168.0, 2147.0, 1326.0, 848.0, 578.0, 381.0, 224.0, 153.0, 82.0, 58.0, 41.0, 30.0, 14.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.025390625, -1.95574951171875, -1.8861083984375, -1.81646728515625, -1.746826171875, -1.67718505859375, -1.6075439453125, -1.53790283203125, -1.46826171875, -1.39862060546875, -1.3289794921875, -1.25933837890625, -1.189697265625, -1.12005615234375, -1.0504150390625, -0.98077392578125, -0.9111328125, -0.84149169921875, -0.7718505859375, -0.70220947265625, -0.632568359375, -0.56292724609375, -0.4932861328125, -0.42364501953125, -0.35400390625, -0.28436279296875, -0.2147216796875, -0.14508056640625, -0.075439453125, -0.00579833984375, 0.0638427734375, 0.13348388671875, 0.203125, 0.27276611328125, 0.3424072265625, 0.41204833984375, 0.481689453125, 0.55133056640625, 0.6209716796875, 0.69061279296875, 0.76025390625, 0.82989501953125, 0.8995361328125, 0.96917724609375, 1.038818359375, 1.10845947265625, 1.1781005859375, 1.24774169921875, 1.3173828125, 1.38702392578125, 1.4566650390625, 1.52630615234375, 1.595947265625, 1.66558837890625, 1.7352294921875, 1.80487060546875, 1.87451171875, 1.94415283203125, 2.0137939453125, 2.08343505859375, 2.153076171875, 2.22271728515625, 2.2923583984375, 2.36199951171875, 2.431640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 9.0, 9.0, 14.0, 17.0, 19.0, 10.0, 21.0, 29.0, 28.0, 32.0, 40.0, 35.0, 52.0, 36.0, 37.0, 52.0, 46.0, 50.0, 45.0, 42.0, 42.0, 43.0, 53.0, 38.0, 30.0, 22.0, 18.0, 20.0, 27.0, 13.0, 19.0, 10.0, 5.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.103515625, -1.070770263671875, -1.03802490234375, -1.005279541015625, -0.9725341796875, -0.939788818359375, -0.90704345703125, -0.874298095703125, -0.841552734375, -0.808807373046875, -0.77606201171875, -0.743316650390625, -0.7105712890625, -0.677825927734375, -0.64508056640625, -0.612335205078125, -0.57958984375, -0.546844482421875, -0.51409912109375, -0.481353759765625, -0.4486083984375, -0.415863037109375, -0.38311767578125, -0.350372314453125, -0.317626953125, -0.284881591796875, -0.25213623046875, -0.219390869140625, -0.1866455078125, -0.153900146484375, -0.12115478515625, -0.088409423828125, -0.0556640625, -0.022918701171875, 0.00982666015625, 0.042572021484375, 0.0753173828125, 0.108062744140625, 0.14080810546875, 0.173553466796875, 0.206298828125, 0.239044189453125, 0.27178955078125, 0.304534912109375, 0.3372802734375, 0.370025634765625, 0.40277099609375, 0.435516357421875, 0.46826171875, 0.501007080078125, 0.53375244140625, 0.566497802734375, 0.5992431640625, 0.631988525390625, 0.66473388671875, 0.697479248046875, 0.730224609375, 0.762969970703125, 0.79571533203125, 0.828460693359375, 0.8612060546875, 0.893951416015625, 0.92669677734375, 0.959442138671875, 0.9921875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 8.0, 4.0, 10.0, 4.0, 9.0, 11.0, 9.0, 13.0, 21.0, 16.0, 15.0, 19.0, 27.0, 26.0, 34.0, 36.0, 38.0, 41.0, 47.0, 31.0, 36.0, 53.0, 29.0, 40.0, 39.0, 42.0, 30.0, 29.0, 28.0, 30.0, 35.0, 26.0, 27.0, 17.0, 8.0, 19.0, 17.0, 19.0, 10.0, 10.0, 5.0, 10.0, 3.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.127662658691406, -53.357574462890625, -51.587486267089844, -49.81739807128906, -48.047306060791016, -46.277217864990234, -44.50712966918945, -42.73704147338867, -40.966949462890625, -39.196861267089844, -37.42677307128906, -35.65668487548828, -33.886592864990234, -32.11650466918945, -30.346416473388672, -28.57632827758789, -26.80624008178711, -25.036151885986328, -23.266061782836914, -21.495973587036133, -19.72588348388672, -17.955795288085938, -16.185707092285156, -14.415617942810059, -12.645528793334961, -10.875439643859863, -9.105350494384766, -7.335262298583984, -5.565173149108887, -3.795083999633789, -2.024995803833008, -0.25490665435791016, 1.5151824951171875, 3.285271406173706, 5.055360317230225, 6.825448989868164, 8.595538139343262, 10.36562728881836, 12.13571548461914, 13.905804634094238, 15.675893783569336, 17.445981979370117, 19.21607208251953, 20.986160278320312, 22.756248474121094, 24.526338577270508, 26.29642677307129, 28.066516876220703, 29.836605072021484, 31.606693267822266, 33.37678146362305, 35.146873474121094, 36.916961669921875, 38.687049865722656, 40.45713806152344, 42.22722625732422, 43.997314453125, 45.76740264892578, 47.53749084472656, 49.307579040527344, 51.07767105102539, 52.84775924682617, 54.61784744262695, 56.387935638427734, 58.15802764892578]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 9.0, 7.0, 11.0, 9.0, 14.0, 17.0, 20.0, 18.0, 20.0, 19.0, 32.0, 40.0, 28.0, 36.0, 26.0, 42.0, 48.0, 38.0, 40.0, 28.0, 37.0, 41.0, 46.0, 41.0, 33.0, 41.0, 34.0, 33.0, 27.0, 27.0, 20.0, 17.0, 13.0, 11.0, 15.0, 11.0, 12.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-60.02375793457031, -58.05263900756836, -56.08151626586914, -54.11039733886719, -52.13927459716797, -50.168155670166016, -48.19703674316406, -46.225914001464844, -44.25479507446289, -42.28367614746094, -40.31255340576172, -38.341434478759766, -36.37031555175781, -34.399192810058594, -32.42807388305664, -30.456953048706055, -28.48583221435547, -26.514711380004883, -24.543590545654297, -22.572471618652344, -20.601350784301758, -18.630229949951172, -16.65911102294922, -14.687990188598633, -12.716869354248047, -10.745748519897461, -8.774628639221191, -6.803508281707764, -4.832387924194336, -2.86126708984375, -0.8901472091674805, 1.080972671508789, 3.052093505859375, 5.023213863372803, 6.9943342208862305, 8.9654541015625, 10.936574935913086, 12.907695770263672, 14.878815650939941, 16.84993553161621, 18.821056365966797, 20.792177200317383, 22.76329803466797, 24.734416961669922, 26.705537796020508, 28.676658630371094, 30.647777557373047, 32.618896484375, 34.59001922607422, 36.56113815307617, 38.53226089477539, 40.503379821777344, 42.47450256347656, 44.445621490478516, 46.41674041748047, 48.38786315917969, 50.35898208618164, 52.330101013183594, 54.30122375488281, 56.272342681884766, 58.24346160888672, 60.21458435058594, 62.18570327758789, 64.15682220458984, 66.12794494628906]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 6.0, 9.0, 14.0, 16.0, 36.0, 59.0, 95.0, 172.0, 276.0, 516.0, 975.0, 1753.0, 3279.0, 6053.0, 10554.0, 18216.0, 29788.0, 45599.0, 65871.0, 87032.0, 107752.0, 120799.0, 122597.0, 114046.0, 96165.0, 74650.0, 53696.0, 35700.0, 22391.0, 13522.0, 7697.0, 4174.0, 2269.0, 1205.0, 677.0, 364.0, 196.0, 119.0, 76.0, 49.0, 25.0, 22.0, 15.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.28125, -50.60595703125, -48.9306640625, -47.25537109375, -45.580078125, -43.90478515625, -42.2294921875, -40.55419921875, -38.87890625, -37.20361328125, -35.5283203125, -33.85302734375, -32.177734375, -30.50244140625, -28.8271484375, -27.15185546875, -25.4765625, -23.80126953125, -22.1259765625, -20.45068359375, -18.775390625, -17.10009765625, -15.4248046875, -13.74951171875, -12.07421875, -10.39892578125, -8.7236328125, -7.04833984375, -5.373046875, -3.69775390625, -2.0224609375, -0.34716796875, 1.328125, 3.00341796875, 4.6787109375, 6.35400390625, 8.029296875, 9.70458984375, 11.3798828125, 13.05517578125, 14.73046875, 16.40576171875, 18.0810546875, 19.75634765625, 21.431640625, 23.10693359375, 24.7822265625, 26.45751953125, 28.1328125, 29.80810546875, 31.4833984375, 33.15869140625, 34.833984375, 36.50927734375, 38.1845703125, 39.85986328125, 41.53515625, 43.21044921875, 44.8857421875, 46.56103515625, 48.236328125, 49.91162109375, 51.5869140625, 53.26220703125, 54.9375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 9.0, 7.0, 8.0, 10.0, 15.0, 13.0, 26.0, 16.0, 20.0, 18.0, 36.0, 36.0, 29.0, 39.0, 23.0, 43.0, 54.0, 33.0, 38.0, 34.0, 34.0, 48.0, 43.0, 44.0, 32.0, 42.0, 27.0, 33.0, 26.0, 30.0, 21.0, 16.0, 13.0, 12.0, 11.0, 14.0, 10.0, 4.0, 5.0, 8.0, 1.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-58.4375, -56.513671875, -54.58984375, -52.666015625, -50.7421875, -48.818359375, -46.89453125, -44.970703125, -43.046875, -41.123046875, -39.19921875, -37.275390625, -35.3515625, -33.427734375, -31.50390625, -29.580078125, -27.65625, -25.732421875, -23.80859375, -21.884765625, -19.9609375, -18.037109375, -16.11328125, -14.189453125, -12.265625, -10.341796875, -8.41796875, -6.494140625, -4.5703125, -2.646484375, -0.72265625, 1.201171875, 3.125, 5.048828125, 6.97265625, 8.896484375, 10.8203125, 12.744140625, 14.66796875, 16.591796875, 18.515625, 20.439453125, 22.36328125, 24.287109375, 26.2109375, 28.134765625, 30.05859375, 31.982421875, 33.90625, 35.830078125, 37.75390625, 39.677734375, 41.6015625, 43.525390625, 45.44921875, 47.373046875, 49.296875, 51.220703125, 53.14453125, 55.068359375, 56.9921875, 58.916015625, 60.83984375, 62.763671875, 64.6875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 9.0, 9.0, 14.0, 28.0, 42.0, 72.0, 118.0, 232.0, 400.0, 716.0, 1124.0, 1976.0, 3389.0, 5614.0, 9282.0, 14744.0, 22655.0, 33012.0, 47160.0, 62745.0, 79667.0, 93982.0, 104757.0, 106934.0, 102408.0, 91338.0, 76778.0, 59012.0, 44307.0, 30819.0, 20864.0, 13379.0, 8519.0, 5105.0, 3097.0, 1836.0, 1080.0, 566.0, 343.0, 185.0, 89.0, 62.0, 40.0, 27.0, 13.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.34375, -36.9443359375, -35.544921875, -34.1455078125, -32.74609375, -31.3466796875, -29.947265625, -28.5478515625, -27.1484375, -25.7490234375, -24.349609375, -22.9501953125, -21.55078125, -20.1513671875, -18.751953125, -17.3525390625, -15.953125, -14.5537109375, -13.154296875, -11.7548828125, -10.35546875, -8.9560546875, -7.556640625, -6.1572265625, -4.7578125, -3.3583984375, -1.958984375, -0.5595703125, 0.83984375, 2.2392578125, 3.638671875, 5.0380859375, 6.4375, 7.8369140625, 9.236328125, 10.6357421875, 12.03515625, 13.4345703125, 14.833984375, 16.2333984375, 17.6328125, 19.0322265625, 20.431640625, 21.8310546875, 23.23046875, 24.6298828125, 26.029296875, 27.4287109375, 28.828125, 30.2275390625, 31.626953125, 33.0263671875, 34.42578125, 35.8251953125, 37.224609375, 38.6240234375, 40.0234375, 41.4228515625, 42.822265625, 44.2216796875, 45.62109375, 47.0205078125, 48.419921875, 49.8193359375, 51.21875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 8.0, 3.0, 5.0, 9.0, 8.0, 14.0, 10.0, 17.0, 14.0, 11.0, 23.0, 24.0, 23.0, 24.0, 28.0, 41.0, 33.0, 40.0, 40.0, 33.0, 30.0, 39.0, 31.0, 45.0, 52.0, 33.0, 31.0, 33.0, 26.0, 36.0, 30.0, 23.0, 31.0, 32.0, 17.0, 18.0, 14.0, 13.0, 6.0, 11.0, 11.0, 7.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.15625, -37.95361328125, -36.7509765625, -35.54833984375, -34.345703125, -33.14306640625, -31.9404296875, -30.73779296875, -29.53515625, -28.33251953125, -27.1298828125, -25.92724609375, -24.724609375, -23.52197265625, -22.3193359375, -21.11669921875, -19.9140625, -18.71142578125, -17.5087890625, -16.30615234375, -15.103515625, -13.90087890625, -12.6982421875, -11.49560546875, -10.29296875, -9.09033203125, -7.8876953125, -6.68505859375, -5.482421875, -4.27978515625, -3.0771484375, -1.87451171875, -0.671875, 0.53076171875, 1.7333984375, 2.93603515625, 4.138671875, 5.34130859375, 6.5439453125, 7.74658203125, 8.94921875, 10.15185546875, 11.3544921875, 12.55712890625, 13.759765625, 14.96240234375, 16.1650390625, 17.36767578125, 18.5703125, 19.77294921875, 20.9755859375, 22.17822265625, 23.380859375, 24.58349609375, 25.7861328125, 26.98876953125, 28.19140625, 29.39404296875, 30.5966796875, 31.79931640625, 33.001953125, 34.20458984375, 35.4072265625, 36.60986328125, 37.8125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 7.0, 9.0, 15.0, 16.0, 28.0, 40.0, 63.0, 83.0, 112.0, 171.0, 281.0, 409.0, 635.0, 965.0, 1399.0, 2245.0, 3617.0, 5312.0, 8165.0, 12283.0, 17880.0, 26066.0, 36264.0, 49083.0, 62972.0, 77076.0, 89514.0, 97786.0, 99381.0, 95072.0, 85738.0, 72287.0, 57817.0, 44470.0, 32111.0, 22807.0, 15819.0, 10431.0, 6795.0, 4734.0, 2943.0, 1986.0, 1300.0, 824.0, 539.0, 323.0, 233.0, 148.0, 86.0, 76.0, 56.0, 29.0, 27.0, 15.0, 9.0, 8.0, 6.0, 1.0, 2.0, 2.0], "bins": [-15.8359375, -15.345947265625, -14.85595703125, -14.365966796875, -13.8759765625, -13.385986328125, -12.89599609375, -12.406005859375, -11.916015625, -11.426025390625, -10.93603515625, -10.446044921875, -9.9560546875, -9.466064453125, -8.97607421875, -8.486083984375, -7.99609375, -7.506103515625, -7.01611328125, -6.526123046875, -6.0361328125, -5.546142578125, -5.05615234375, -4.566162109375, -4.076171875, -3.586181640625, -3.09619140625, -2.606201171875, -2.1162109375, -1.626220703125, -1.13623046875, -0.646240234375, -0.15625, 0.333740234375, 0.82373046875, 1.313720703125, 1.8037109375, 2.293701171875, 2.78369140625, 3.273681640625, 3.763671875, 4.253662109375, 4.74365234375, 5.233642578125, 5.7236328125, 6.213623046875, 6.70361328125, 7.193603515625, 7.68359375, 8.173583984375, 8.66357421875, 9.153564453125, 9.6435546875, 10.133544921875, 10.62353515625, 11.113525390625, 11.603515625, 12.093505859375, 12.58349609375, 13.073486328125, 13.5634765625, 14.053466796875, 14.54345703125, 15.033447265625, 15.5234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 17.0, 15.0, 18.0, 19.0, 26.0, 39.0, 36.0, 37.0, 51.0, 31.0, 60.0, 44.0, 61.0, 63.0, 59.0, 51.0, 43.0, 43.0, 31.0, 43.0, 34.0, 38.0, 26.0, 23.0, 23.0, 13.0, 8.0, 11.0, 4.0, 3.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002838134765625, -0.0027550160884857178, -0.0026718974113464355, -0.0025887787342071533, -0.002505660057067871, -0.002422541379928589, -0.0023394227027893066, -0.0022563040256500244, -0.002173185348510742, -0.00209006667137146, -0.0020069479942321777, -0.0019238293170928955, -0.0018407106399536133, -0.001757591962814331, -0.0016744732856750488, -0.0015913546085357666, -0.0015082359313964844, -0.0014251172542572021, -0.00134199857711792, -0.0012588798999786377, -0.0011757612228393555, -0.0010926425457000732, -0.001009523868560791, -0.0009264051914215088, -0.0008432865142822266, -0.0007601678371429443, -0.0006770491600036621, -0.0005939304828643799, -0.0005108118057250977, -0.00042769312858581543, -0.0003445744514465332, -0.000261455774307251, -0.00017833709716796875, -9.521842002868652e-05, -1.2099742889404297e-05, 7.101893424987793e-05, 0.00015413761138916016, 0.00023725628852844238, 0.0003203749656677246, 0.00040349364280700684, 0.00048661231994628906, 0.0005697309970855713, 0.0006528496742248535, 0.0007359683513641357, 0.000819087028503418, 0.0009022057056427002, 0.0009853243827819824, 0.0010684430599212646, 0.0011515617370605469, 0.001234680414199829, 0.0013177990913391113, 0.0014009177684783936, 0.0014840364456176758, 0.001567155122756958, 0.0016502737998962402, 0.0017333924770355225, 0.0018165111541748047, 0.001899629831314087, 0.001982748508453369, 0.0020658671855926514, 0.0021489858627319336, 0.002232104539871216, 0.002315223217010498, 0.0023983418941497803, 0.0024814605712890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 17.0, 24.0, 27.0, 30.0, 61.0, 108.0, 164.0, 246.0, 413.0, 645.0, 1092.0, 1808.0, 2903.0, 4750.0, 7764.0, 12540.0, 20049.0, 30420.0, 44945.0, 63377.0, 83710.0, 102572.0, 115229.0, 118124.0, 110168.0, 94337.0, 74417.0, 54443.0, 37555.0, 24931.0, 16044.0, 9984.0, 6040.0, 3722.0, 2251.0, 1362.0, 903.0, 517.0, 304.0, 210.0, 135.0, 68.0, 40.0, 41.0, 23.0, 16.0, 14.0, 3.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.453125, -18.788330078125, -18.12353515625, -17.458740234375, -16.7939453125, -16.129150390625, -15.46435546875, -14.799560546875, -14.134765625, -13.469970703125, -12.80517578125, -12.140380859375, -11.4755859375, -10.810791015625, -10.14599609375, -9.481201171875, -8.81640625, -8.151611328125, -7.48681640625, -6.822021484375, -6.1572265625, -5.492431640625, -4.82763671875, -4.162841796875, -3.498046875, -2.833251953125, -2.16845703125, -1.503662109375, -0.8388671875, -0.174072265625, 0.49072265625, 1.155517578125, 1.8203125, 2.485107421875, 3.14990234375, 3.814697265625, 4.4794921875, 5.144287109375, 5.80908203125, 6.473876953125, 7.138671875, 7.803466796875, 8.46826171875, 9.133056640625, 9.7978515625, 10.462646484375, 11.12744140625, 11.792236328125, 12.45703125, 13.121826171875, 13.78662109375, 14.451416015625, 15.1162109375, 15.781005859375, 16.44580078125, 17.110595703125, 17.775390625, 18.440185546875, 19.10498046875, 19.769775390625, 20.4345703125, 21.099365234375, 21.76416015625, 22.428955078125, 23.09375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 12.0, 5.0, 14.0, 4.0, 12.0, 12.0, 17.0, 20.0, 21.0, 21.0, 28.0, 17.0, 27.0, 39.0, 48.0, 33.0, 33.0, 33.0, 45.0, 51.0, 48.0, 30.0, 41.0, 34.0, 43.0, 40.0, 25.0, 28.0, 21.0, 21.0, 20.0, 20.0, 14.0, 23.0, 27.0, 9.0, 9.0, 9.0, 9.0, 4.0, 5.0, 6.0, 1.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.96484375, -7.69805908203125, -7.4312744140625, -7.16448974609375, -6.897705078125, -6.63092041015625, -6.3641357421875, -6.09735107421875, -5.83056640625, -5.56378173828125, -5.2969970703125, -5.03021240234375, -4.763427734375, -4.49664306640625, -4.2298583984375, -3.96307373046875, -3.6962890625, -3.42950439453125, -3.1627197265625, -2.89593505859375, -2.629150390625, -2.36236572265625, -2.0955810546875, -1.82879638671875, -1.56201171875, -1.29522705078125, -1.0284423828125, -0.76165771484375, -0.494873046875, -0.22808837890625, 0.0386962890625, 0.30548095703125, 0.572265625, 0.83905029296875, 1.1058349609375, 1.37261962890625, 1.639404296875, 1.90618896484375, 2.1729736328125, 2.43975830078125, 2.70654296875, 2.97332763671875, 3.2401123046875, 3.50689697265625, 3.773681640625, 4.04046630859375, 4.3072509765625, 4.57403564453125, 4.8408203125, 5.10760498046875, 5.3743896484375, 5.64117431640625, 5.907958984375, 6.17474365234375, 6.4415283203125, 6.70831298828125, 6.97509765625, 7.24188232421875, 7.5086669921875, 7.77545166015625, 8.042236328125, 8.30902099609375, 8.5758056640625, 8.84259033203125, 9.109375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 10.0, 2.0, 10.0, 9.0, 11.0, 8.0, 8.0, 11.0, 16.0, 22.0, 16.0, 13.0, 27.0, 34.0, 32.0, 33.0, 41.0, 40.0, 37.0, 28.0, 31.0, 46.0, 32.0, 44.0, 40.0, 32.0, 29.0, 30.0, 28.0, 26.0, 26.0, 23.0, 28.0, 26.0, 27.0, 18.0, 25.0, 9.0, 9.0, 9.0, 9.0, 8.0, 9.0, 5.0, 6.0, 2.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-56.527687072753906, -54.86153030395508, -53.19537353515625, -51.52921676635742, -49.863059997558594, -48.19690704345703, -46.53074645996094, -44.864593505859375, -43.19843673706055, -41.53227996826172, -39.86612319946289, -38.19996643066406, -36.533809661865234, -34.867652893066406, -33.201499938964844, -31.535343170166016, -29.869184494018555, -28.203027725219727, -26.5368709564209, -24.870716094970703, -23.204559326171875, -21.538402557373047, -19.87224578857422, -18.20608901977539, -16.539932250976562, -14.873775482177734, -13.207619667053223, -11.541462898254395, -9.875307083129883, -8.209150314331055, -6.542993545532227, -4.876837730407715, -3.210681915283203, -1.5445255041122437, 0.12163090705871582, 1.7877874374389648, 3.4539437294006348, 5.120100021362305, 6.786256790161133, 8.452412605285645, 10.118569374084473, 11.7847261428833, 13.450881958007812, 15.11703872680664, 16.78319549560547, 18.449352264404297, 20.115509033203125, 21.78166389465332, 23.44782066345215, 25.113977432250977, 26.780134201049805, 28.4462890625, 30.112445831298828, 31.778602600097656, 33.444759368896484, 35.11091613769531, 36.77707290649414, 38.44322967529297, 40.1093864440918, 41.775543212890625, 43.44169998168945, 45.10785675048828, 46.774009704589844, 48.44016647338867, 50.1063232421875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 15.0, 14.0, 8.0, 20.0, 10.0, 17.0, 20.0, 28.0, 23.0, 25.0, 34.0, 37.0, 38.0, 29.0, 38.0, 52.0, 34.0, 47.0, 45.0, 46.0, 43.0, 40.0, 39.0, 39.0, 30.0, 42.0, 25.0, 26.0, 16.0, 22.0, 20.0, 16.0, 13.0, 9.0, 9.0, 7.0, 3.0, 5.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.81147384643555, -55.67109680175781, -53.53071594238281, -51.39033889770508, -49.249961853027344, -47.109580993652344, -44.96920394897461, -42.828826904296875, -40.688446044921875, -38.54806900024414, -36.40768814086914, -34.267311096191406, -32.12693405151367, -29.986555099487305, -27.846176147460938, -25.705799102783203, -23.56542205810547, -21.4250431060791, -19.284666061401367, -17.144287109375, -15.00390911102295, -12.863531112670898, -10.723152160644531, -8.58277416229248, -6.44239616394043, -4.302018165588379, -2.16163969039917, -0.021261215209960938, 2.11911678314209, 4.259494781494141, 6.399873733520508, 8.540251731872559, 10.680633544921875, 12.821011543273926, 14.961389541625977, 17.101768493652344, 19.242145538330078, 21.382524490356445, 23.522903442382812, 25.663280487060547, 27.803659439086914, 29.94403839111328, 32.084415435791016, 34.22479248046875, 36.36517333984375, 38.505550384521484, 40.64592742919922, 42.78630828857422, 44.92668533325195, 47.06706237792969, 49.20744323730469, 51.34782028198242, 53.488197326660156, 55.628578186035156, 57.76895523071289, 59.909332275390625, 62.049713134765625, 64.19009399414062, 66.3304672241211, 68.4708480834961, 70.6112289428711, 72.75160217285156, 74.89198303222656, 77.03236389160156, 79.17273712158203]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 24.0, 28.0, 47.0, 82.0, 129.0, 243.0, 456.0, 780.0, 1201.0, 2057.0, 3362.0, 5304.0, 8751.0, 13824.0, 22019.0, 34292.0, 52399.0, 78231.0, 114713.0, 160931.0, 217855.0, 277919.0, 339984.0, 388691.0, 414729.0, 409730.0, 381396.0, 329633.0, 267333.0, 206089.0, 149846.0, 106846.0, 72593.0, 47944.0, 31307.0, 20228.0, 12459.0, 7981.0, 4838.0, 3064.0, 1999.0, 1133.0, 712.0, 421.0, 230.0, 164.0, 113.0, 71.0, 43.0, 27.0, 10.0, 11.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-41.8125, -40.45947265625, -39.1064453125, -37.75341796875, -36.400390625, -35.04736328125, -33.6943359375, -32.34130859375, -30.98828125, -29.63525390625, -28.2822265625, -26.92919921875, -25.576171875, -24.22314453125, -22.8701171875, -21.51708984375, -20.1640625, -18.81103515625, -17.4580078125, -16.10498046875, -14.751953125, -13.39892578125, -12.0458984375, -10.69287109375, -9.33984375, -7.98681640625, -6.6337890625, -5.28076171875, -3.927734375, -2.57470703125, -1.2216796875, 0.13134765625, 1.484375, 2.83740234375, 4.1904296875, 5.54345703125, 6.896484375, 8.24951171875, 9.6025390625, 10.95556640625, 12.30859375, 13.66162109375, 15.0146484375, 16.36767578125, 17.720703125, 19.07373046875, 20.4267578125, 21.77978515625, 23.1328125, 24.48583984375, 25.8388671875, 27.19189453125, 28.544921875, 29.89794921875, 31.2509765625, 32.60400390625, 33.95703125, 35.31005859375, 36.6630859375, 38.01611328125, 39.369140625, 40.72216796875, 42.0751953125, 43.42822265625, 44.78125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 16.0, 11.0, 8.0, 15.0, 16.0, 19.0, 18.0, 30.0, 19.0, 21.0, 37.0, 42.0, 26.0, 37.0, 37.0, 44.0, 39.0, 42.0, 52.0, 41.0, 39.0, 42.0, 38.0, 40.0, 37.0, 36.0, 29.0, 20.0, 22.0, 19.0, 18.0, 20.0, 15.0, 9.0, 10.0, 7.0, 4.0, 5.0, 4.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.03125, -49.15478515625, -47.2783203125, -45.40185546875, -43.525390625, -41.64892578125, -39.7724609375, -37.89599609375, -36.01953125, -34.14306640625, -32.2666015625, -30.39013671875, -28.513671875, -26.63720703125, -24.7607421875, -22.88427734375, -21.0078125, -19.13134765625, -17.2548828125, -15.37841796875, -13.501953125, -11.62548828125, -9.7490234375, -7.87255859375, -5.99609375, -4.11962890625, -2.2431640625, -0.36669921875, 1.509765625, 3.38623046875, 5.2626953125, 7.13916015625, 9.015625, 10.89208984375, 12.7685546875, 14.64501953125, 16.521484375, 18.39794921875, 20.2744140625, 22.15087890625, 24.02734375, 25.90380859375, 27.7802734375, 29.65673828125, 31.533203125, 33.40966796875, 35.2861328125, 37.16259765625, 39.0390625, 40.91552734375, 42.7919921875, 44.66845703125, 46.544921875, 48.42138671875, 50.2978515625, 52.17431640625, 54.05078125, 55.92724609375, 57.8037109375, 59.68017578125, 61.556640625, 63.43310546875, 65.3095703125, 67.18603515625, 69.0625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 5.0, 15.0, 27.0, 46.0, 93.0, 190.0, 295.0, 500.0, 884.0, 1591.0, 2477.0, 4332.0, 7086.0, 11487.0, 18468.0, 29606.0, 45764.0, 68623.0, 101308.0, 140926.0, 191202.0, 248418.0, 304618.0, 354182.0, 387647.0, 398152.0, 384156.0, 348207.0, 299060.0, 242316.0, 185788.0, 137275.0, 95939.0, 66231.0, 44127.0, 28019.0, 17582.0, 11051.0, 6751.0, 4085.0, 2358.0, 1403.0, 824.0, 485.0, 284.0, 170.0, 92.0, 71.0, 35.0, 16.0, 12.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-46.46875, -45.03662109375, -43.6044921875, -42.17236328125, -40.740234375, -39.30810546875, -37.8759765625, -36.44384765625, -35.01171875, -33.57958984375, -32.1474609375, -30.71533203125, -29.283203125, -27.85107421875, -26.4189453125, -24.98681640625, -23.5546875, -22.12255859375, -20.6904296875, -19.25830078125, -17.826171875, -16.39404296875, -14.9619140625, -13.52978515625, -12.09765625, -10.66552734375, -9.2333984375, -7.80126953125, -6.369140625, -4.93701171875, -3.5048828125, -2.07275390625, -0.640625, 0.79150390625, 2.2236328125, 3.65576171875, 5.087890625, 6.52001953125, 7.9521484375, 9.38427734375, 10.81640625, 12.24853515625, 13.6806640625, 15.11279296875, 16.544921875, 17.97705078125, 19.4091796875, 20.84130859375, 22.2734375, 23.70556640625, 25.1376953125, 26.56982421875, 28.001953125, 29.43408203125, 30.8662109375, 32.29833984375, 33.73046875, 35.16259765625, 36.5947265625, 38.02685546875, 39.458984375, 40.89111328125, 42.3232421875, 43.75537109375, 45.1875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 11.0, 8.0, 9.0, 7.0, 16.0, 22.0, 24.0, 35.0, 53.0, 60.0, 64.0, 81.0, 86.0, 108.0, 107.0, 138.0, 113.0, 156.0, 155.0, 188.0, 223.0, 166.0, 198.0, 195.0, 191.0, 196.0, 157.0, 168.0, 149.0, 156.0, 117.0, 102.0, 92.0, 82.0, 79.0, 71.0, 48.0, 54.0, 44.0, 29.0, 23.0, 31.0, 10.0, 19.0, 14.0, 4.0, 3.0, 5.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0], "bins": [-25.15625, -24.398681640625, -23.64111328125, -22.883544921875, -22.1259765625, -21.368408203125, -20.61083984375, -19.853271484375, -19.095703125, -18.338134765625, -17.58056640625, -16.822998046875, -16.0654296875, -15.307861328125, -14.55029296875, -13.792724609375, -13.03515625, -12.277587890625, -11.52001953125, -10.762451171875, -10.0048828125, -9.247314453125, -8.48974609375, -7.732177734375, -6.974609375, -6.217041015625, -5.45947265625, -4.701904296875, -3.9443359375, -3.186767578125, -2.42919921875, -1.671630859375, -0.9140625, -0.156494140625, 0.60107421875, 1.358642578125, 2.1162109375, 2.873779296875, 3.63134765625, 4.388916015625, 5.146484375, 5.904052734375, 6.66162109375, 7.419189453125, 8.1767578125, 8.934326171875, 9.69189453125, 10.449462890625, 11.20703125, 11.964599609375, 12.72216796875, 13.479736328125, 14.2373046875, 14.994873046875, 15.75244140625, 16.510009765625, 17.267578125, 18.025146484375, 18.78271484375, 19.540283203125, 20.2978515625, 21.055419921875, 21.81298828125, 22.570556640625, 23.328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 10.0, 6.0, 11.0, 15.0, 12.0, 9.0, 16.0, 20.0, 22.0, 26.0, 24.0, 27.0, 36.0, 39.0, 28.0, 38.0, 37.0, 42.0, 45.0, 50.0, 44.0, 43.0, 35.0, 38.0, 26.0, 37.0, 27.0, 26.0, 26.0, 24.0, 27.0, 12.0, 24.0, 12.0, 16.0, 9.0, 11.0, 3.0, 8.0, 8.0, 7.0, 7.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.483909606933594, -53.61665725708008, -51.74940872192383, -49.88215637207031, -48.01490783691406, -46.14765548706055, -44.28040313720703, -42.41315460205078, -40.545902252197266, -38.67864990234375, -36.8114013671875, -34.944149017333984, -33.076900482177734, -31.20964813232422, -29.342397689819336, -27.475147247314453, -25.60789680480957, -23.740646362304688, -21.873395919799805, -20.006145477294922, -18.138893127441406, -16.271642684936523, -14.40439224243164, -12.537140846252441, -10.669890403747559, -8.802639961242676, -6.935388565063477, -5.068138122558594, -3.2008872032165527, -1.3336362838745117, 0.5336141586303711, 2.4008655548095703, 4.268115997314453, 6.135366916656494, 8.002617835998535, 9.869868278503418, 11.737119674682617, 13.6043701171875, 15.471620559692383, 17.338871002197266, 19.20612335205078, 21.073373794555664, 22.940624237060547, 24.807876586914062, 26.675127029418945, 28.542377471923828, 30.40962791442871, 32.276878356933594, 34.144126892089844, 36.01137924194336, 37.87862777709961, 39.745880126953125, 41.613128662109375, 43.48038101196289, 45.347633361816406, 47.214881896972656, 49.08213424682617, 50.94938659667969, 52.81663513183594, 54.68388748168945, 56.5511360168457, 58.41838836669922, 60.28563690185547, 62.152889251708984, 64.0201416015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [6.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 1.0, 9.0, 7.0, 11.0, 12.0, 11.0, 22.0, 25.0, 15.0, 27.0, 26.0, 21.0, 17.0, 24.0, 30.0, 36.0, 26.0, 37.0, 40.0, 31.0, 29.0, 40.0, 40.0, 31.0, 38.0, 45.0, 33.0, 36.0, 31.0, 29.0, 32.0, 20.0, 25.0, 19.0, 16.0, 15.0, 17.0, 12.0, 6.0, 7.0, 10.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-50.905338287353516, -49.10744857788086, -47.30955505371094, -45.51166534423828, -43.71377182006836, -41.9158821105957, -40.11798858642578, -38.320098876953125, -36.52220916748047, -34.72431945800781, -32.92642593383789, -31.128536224365234, -29.330642700195312, -27.532752990722656, -25.734861373901367, -23.936969757080078, -22.139076232910156, -20.341184616088867, -18.543292999267578, -16.745403289794922, -14.947510719299316, -13.149619102478027, -11.351728439331055, -9.553836822509766, -7.755945205688477, -5.9580535888671875, -4.160162448883057, -2.362271308898926, -0.5643796920776367, 1.2335119247436523, 3.031402587890625, 4.829294204711914, 6.627189636230469, 8.425081253051758, 10.222972869873047, 12.02086353302002, 13.818755149841309, 15.616646766662598, 17.41453742980957, 19.21242904663086, 21.01032066345215, 22.808212280273438, 24.606103897094727, 26.403995513916016, 28.201885223388672, 29.999778747558594, 31.79766845703125, 33.595558166503906, 35.39345169067383, 37.191341400146484, 38.989234924316406, 40.78712463378906, 42.585018157958984, 44.38290786743164, 46.18080139160156, 47.97869110107422, 49.776580810546875, 51.57447052001953, 53.37236404418945, 55.17025375366211, 56.96814727783203, 58.76603698730469, 60.563926696777344, 62.361820220947266, 64.15971374511719]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 10.0, 14.0, 19.0, 30.0, 41.0, 67.0, 99.0, 157.0, 214.0, 303.0, 477.0, 690.0, 1068.0, 1575.0, 2380.0, 3621.0, 5432.0, 7967.0, 11607.0, 17099.0, 24088.0, 34120.0, 46662.0, 59974.0, 75804.0, 90004.0, 99220.0, 102146.0, 97896.0, 87647.0, 72903.0, 57617.0, 43967.0, 31704.0, 22688.0, 15950.0, 10989.0, 7450.0, 4882.0, 3232.0, 2244.0, 1514.0, 974.0, 692.0, 415.0, 293.0, 213.0, 142.0, 65.0, 74.0, 33.0, 33.0, 15.0, 13.0, 10.0, 7.0, 4.0, 5.0, 0.0, 3.0, 3.0], "bins": [-9.015625, -8.7191162109375, -8.422607421875, -8.1260986328125, -7.82958984375, -7.5330810546875, -7.236572265625, -6.9400634765625, -6.6435546875, -6.3470458984375, -6.050537109375, -5.7540283203125, -5.45751953125, -5.1610107421875, -4.864501953125, -4.5679931640625, -4.271484375, -3.9749755859375, -3.678466796875, -3.3819580078125, -3.08544921875, -2.7889404296875, -2.492431640625, -2.1959228515625, -1.8994140625, -1.6029052734375, -1.306396484375, -1.0098876953125, -0.71337890625, -0.4168701171875, -0.120361328125, 0.1761474609375, 0.47265625, 0.7691650390625, 1.065673828125, 1.3621826171875, 1.65869140625, 1.9552001953125, 2.251708984375, 2.5482177734375, 2.8447265625, 3.1412353515625, 3.437744140625, 3.7342529296875, 4.03076171875, 4.3272705078125, 4.623779296875, 4.9202880859375, 5.216796875, 5.5133056640625, 5.809814453125, 6.1063232421875, 6.40283203125, 6.6993408203125, 6.995849609375, 7.2923583984375, 7.5888671875, 7.8853759765625, 8.181884765625, 8.4783935546875, 8.77490234375, 9.0714111328125, 9.367919921875, 9.6644287109375, 9.9609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 0.0, 9.0, 7.0, 12.0, 11.0, 13.0, 22.0, 24.0, 15.0, 28.0, 25.0, 20.0, 17.0, 25.0, 33.0, 33.0, 31.0, 32.0, 40.0, 31.0, 32.0, 42.0, 34.0, 31.0, 43.0, 42.0, 34.0, 33.0, 31.0, 29.0, 32.0, 23.0, 23.0, 19.0, 16.0, 19.0, 13.0, 12.0, 5.0, 9.0, 9.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.125, -49.3232421875, -47.521484375, -45.7197265625, -43.91796875, -42.1162109375, -40.314453125, -38.5126953125, -36.7109375, -34.9091796875, -33.107421875, -31.3056640625, -29.50390625, -27.7021484375, -25.900390625, -24.0986328125, -22.296875, -20.4951171875, -18.693359375, -16.8916015625, -15.08984375, -13.2880859375, -11.486328125, -9.6845703125, -7.8828125, -6.0810546875, -4.279296875, -2.4775390625, -0.67578125, 1.1259765625, 2.927734375, 4.7294921875, 6.53125, 8.3330078125, 10.134765625, 11.9365234375, 13.73828125, 15.5400390625, 17.341796875, 19.1435546875, 20.9453125, 22.7470703125, 24.548828125, 26.3505859375, 28.15234375, 29.9541015625, 31.755859375, 33.5576171875, 35.359375, 37.1611328125, 38.962890625, 40.7646484375, 42.56640625, 44.3681640625, 46.169921875, 47.9716796875, 49.7734375, 51.5751953125, 53.376953125, 55.1787109375, 56.98046875, 58.7822265625, 60.583984375, 62.3857421875, 64.1875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 3.0, 8.0, 5.0, 6.0, 8.0, 26.0, 22.0, 31.0, 72.0, 82.0, 149.0, 260.0, 422.0, 788.0, 1370.0, 2519.0, 4758.0, 8775.0, 17684.0, 38253.0, 832646.0, 89846.0, 24415.0, 12210.0, 6457.0, 3443.0, 1853.0, 1018.0, 597.0, 319.0, 189.0, 110.0, 85.0, 41.0, 32.0, 20.0, 9.0, 12.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.5, -41.07080078125, -39.6416015625, -38.21240234375, -36.783203125, -35.35400390625, -33.9248046875, -32.49560546875, -31.06640625, -29.63720703125, -28.2080078125, -26.77880859375, -25.349609375, -23.92041015625, -22.4912109375, -21.06201171875, -19.6328125, -18.20361328125, -16.7744140625, -15.34521484375, -13.916015625, -12.48681640625, -11.0576171875, -9.62841796875, -8.19921875, -6.77001953125, -5.3408203125, -3.91162109375, -2.482421875, -1.05322265625, 0.3759765625, 1.80517578125, 3.234375, 4.66357421875, 6.0927734375, 7.52197265625, 8.951171875, 10.38037109375, 11.8095703125, 13.23876953125, 14.66796875, 16.09716796875, 17.5263671875, 18.95556640625, 20.384765625, 21.81396484375, 23.2431640625, 24.67236328125, 26.1015625, 27.53076171875, 28.9599609375, 30.38916015625, 31.818359375, 33.24755859375, 34.6767578125, 36.10595703125, 37.53515625, 38.96435546875, 40.3935546875, 41.82275390625, 43.251953125, 44.68115234375, 46.1103515625, 47.53955078125, 48.96875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 11.0, 12.0, 9.0, 16.0, 14.0, 21.0, 28.0, 16.0, 19.0, 29.0, 35.0, 36.0, 40.0, 46.0, 36.0, 59.0, 46.0, 43.0, 31.0, 48.0, 47.0, 27.0, 26.0, 35.0, 38.0, 35.0, 23.0, 17.0, 19.0, 17.0, 13.0, 16.0, 13.0, 19.0, 10.0, 8.0, 9.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-44.75, -43.41455078125, -42.0791015625, -40.74365234375, -39.408203125, -38.07275390625, -36.7373046875, -35.40185546875, -34.06640625, -32.73095703125, -31.3955078125, -30.06005859375, -28.724609375, -27.38916015625, -26.0537109375, -24.71826171875, -23.3828125, -22.04736328125, -20.7119140625, -19.37646484375, -18.041015625, -16.70556640625, -15.3701171875, -14.03466796875, -12.69921875, -11.36376953125, -10.0283203125, -8.69287109375, -7.357421875, -6.02197265625, -4.6865234375, -3.35107421875, -2.015625, -0.68017578125, 0.6552734375, 1.99072265625, 3.326171875, 4.66162109375, 5.9970703125, 7.33251953125, 8.66796875, 10.00341796875, 11.3388671875, 12.67431640625, 14.009765625, 15.34521484375, 16.6806640625, 18.01611328125, 19.3515625, 20.68701171875, 22.0224609375, 23.35791015625, 24.693359375, 26.02880859375, 27.3642578125, 28.69970703125, 30.03515625, 31.37060546875, 32.7060546875, 34.04150390625, 35.376953125, 36.71240234375, 38.0478515625, 39.38330078125, 40.71875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 9.0, 8.0, 6.0, 10.0, 22.0, 17.0, 21.0, 37.0, 34.0, 41.0, 75.0, 93.0, 152.0, 218.0, 370.0, 568.0, 1047.0, 1792.0, 3351.0, 6776.0, 13705.0, 29719.0, 336975.0, 590908.0, 32016.0, 14821.0, 7268.0, 3591.0, 1941.0, 1134.0, 636.0, 348.0, 240.0, 189.0, 110.0, 78.0, 57.0, 37.0, 27.0, 21.0, 19.0, 17.0, 11.0, 13.0, 11.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.50390625, -3.39105224609375, -3.2781982421875, -3.16534423828125, -3.052490234375, -2.93963623046875, -2.8267822265625, -2.71392822265625, -2.60107421875, -2.48822021484375, -2.3753662109375, -2.26251220703125, -2.149658203125, -2.03680419921875, -1.9239501953125, -1.81109619140625, -1.6982421875, -1.58538818359375, -1.4725341796875, -1.35968017578125, -1.246826171875, -1.13397216796875, -1.0211181640625, -0.90826416015625, -0.79541015625, -0.68255615234375, -0.5697021484375, -0.45684814453125, -0.343994140625, -0.23114013671875, -0.1182861328125, -0.00543212890625, 0.107421875, 0.22027587890625, 0.3331298828125, 0.44598388671875, 0.558837890625, 0.67169189453125, 0.7845458984375, 0.89739990234375, 1.01025390625, 1.12310791015625, 1.2359619140625, 1.34881591796875, 1.461669921875, 1.57452392578125, 1.6873779296875, 1.80023193359375, 1.9130859375, 2.02593994140625, 2.1387939453125, 2.25164794921875, 2.364501953125, 2.47735595703125, 2.5902099609375, 2.70306396484375, 2.81591796875, 2.92877197265625, 3.0416259765625, 3.15447998046875, 3.267333984375, 3.38018798828125, 3.4930419921875, 3.60589599609375, 3.71875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 11.0, 7.0, 13.0, 12.0, 20.0, 26.0, 24.0, 28.0, 33.0, 48.0, 40.0, 50.0, 49.0, 61.0, 56.0, 64.0, 53.0, 52.0, 65.0, 41.0, 42.0, 29.0, 30.0, 20.0, 31.0, 23.0, 16.0, 6.0, 9.0, 9.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.733438491821289e-05, -9.372550994157791e-05, -9.011663496494293e-05, -8.650775998830795e-05, -8.289888501167297e-05, -7.9290010035038e-05, -7.568113505840302e-05, -7.207226008176804e-05, -6.846338510513306e-05, -6.485451012849808e-05, -6.12456351518631e-05, -5.763676017522812e-05, -5.402788519859314e-05, -5.041901022195816e-05, -4.681013524532318e-05, -4.32012602686882e-05, -3.959238529205322e-05, -3.5983510315418243e-05, -3.2374635338783264e-05, -2.8765760362148285e-05, -2.5156885385513306e-05, -2.1548010408878326e-05, -1.7939135432243347e-05, -1.4330260455608368e-05, -1.0721385478973389e-05, -7.1125105023384094e-06, -3.50363552570343e-06, 1.0523945093154907e-07, 3.7141144275665283e-06, 7.3229894042015076e-06, 1.0931864380836487e-05, 1.4540739357471466e-05, 1.8149614334106445e-05, 2.1758489310741425e-05, 2.5367364287376404e-05, 2.8976239264011383e-05, 3.258511424064636e-05, 3.619398921728134e-05, 3.980286419391632e-05, 4.34117391705513e-05, 4.702061414718628e-05, 5.062948912382126e-05, 5.423836410045624e-05, 5.784723907709122e-05, 6.14561140537262e-05, 6.506498903036118e-05, 6.867386400699615e-05, 7.228273898363113e-05, 7.589161396026611e-05, 7.950048893690109e-05, 8.310936391353607e-05, 8.671823889017105e-05, 9.032711386680603e-05, 9.393598884344101e-05, 9.754486382007599e-05, 0.00010115373879671097, 0.00010476261377334595, 0.00010837148874998093, 0.0001119803637266159, 0.00011558923870325089, 0.00011919811367988586, 0.00012280698865652084, 0.00012641586363315582, 0.0001300247386097908, 0.00013363361358642578]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 9.0, 8.0, 23.0, 26.0, 45.0, 84.0, 112.0, 188.0, 271.0, 469.0, 770.0, 1248.0, 2037.0, 3429.0, 5589.0, 9637.0, 15776.0, 26149.0, 42204.0, 65599.0, 96704.0, 132374.0, 155431.0, 147817.0, 117184.0, 83415.0, 54491.0, 34401.0, 21200.0, 12784.0, 7580.0, 4629.0, 2674.0, 1599.0, 955.0, 615.0, 400.0, 229.0, 120.0, 95.0, 68.0, 47.0, 26.0, 11.0, 12.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.900390625, -2.80914306640625, -2.7178955078125, -2.62664794921875, -2.535400390625, -2.44415283203125, -2.3529052734375, -2.26165771484375, -2.17041015625, -2.07916259765625, -1.9879150390625, -1.89666748046875, -1.805419921875, -1.71417236328125, -1.6229248046875, -1.53167724609375, -1.4404296875, -1.34918212890625, -1.2579345703125, -1.16668701171875, -1.075439453125, -0.98419189453125, -0.8929443359375, -0.80169677734375, -0.71044921875, -0.61920166015625, -0.5279541015625, -0.43670654296875, -0.345458984375, -0.25421142578125, -0.1629638671875, -0.07171630859375, 0.01953125, 0.11077880859375, 0.2020263671875, 0.29327392578125, 0.384521484375, 0.47576904296875, 0.5670166015625, 0.65826416015625, 0.74951171875, 0.84075927734375, 0.9320068359375, 1.02325439453125, 1.114501953125, 1.20574951171875, 1.2969970703125, 1.38824462890625, 1.4794921875, 1.57073974609375, 1.6619873046875, 1.75323486328125, 1.844482421875, 1.93572998046875, 2.0269775390625, 2.11822509765625, 2.20947265625, 2.30072021484375, 2.3919677734375, 2.48321533203125, 2.574462890625, 2.66571044921875, 2.7569580078125, 2.84820556640625, 2.939453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 3.0, 7.0, 20.0, 10.0, 22.0, 23.0, 21.0, 25.0, 28.0, 31.0, 28.0, 34.0, 36.0, 31.0, 38.0, 33.0, 32.0, 63.0, 50.0, 51.0, 42.0, 49.0, 31.0, 33.0, 41.0, 24.0, 28.0, 34.0, 21.0, 23.0, 17.0, 19.0, 11.0, 9.0, 7.0, 7.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2119140625, -1.1786270141601562, -1.1453399658203125, -1.1120529174804688, -1.078765869140625, -1.0454788208007812, -1.0121917724609375, -0.9789047241210938, -0.94561767578125, -0.9123306274414062, -0.8790435791015625, -0.8457565307617188, -0.812469482421875, -0.7791824340820312, -0.7458953857421875, -0.7126083374023438, -0.6793212890625, -0.6460342407226562, -0.6127471923828125, -0.5794601440429688, -0.546173095703125, -0.5128860473632812, -0.4795989990234375, -0.44631195068359375, -0.41302490234375, -0.37973785400390625, -0.3464508056640625, -0.31316375732421875, -0.279876708984375, -0.24658966064453125, -0.2133026123046875, -0.18001556396484375, -0.146728515625, -0.11344146728515625, -0.0801544189453125, -0.04686737060546875, -0.013580322265625, 0.01970672607421875, 0.0529937744140625, 0.08628082275390625, 0.11956787109375, 0.15285491943359375, 0.1861419677734375, 0.21942901611328125, 0.252716064453125, 0.28600311279296875, 0.3192901611328125, 0.35257720947265625, 0.3858642578125, 0.41915130615234375, 0.4524383544921875, 0.48572540283203125, 0.519012451171875, 0.5522994995117188, 0.5855865478515625, 0.6188735961914062, 0.65216064453125, 0.6854476928710938, 0.7187347412109375, 0.7520217895507812, 0.785308837890625, 0.8185958862304688, 0.8518829345703125, 0.8851699829101562, 0.91845703125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 6.0, 5.0, 7.0, 5.0, 6.0, 15.0, 12.0, 13.0, 9.0, 19.0, 16.0, 30.0, 23.0, 17.0, 34.0, 40.0, 31.0, 35.0, 37.0, 44.0, 44.0, 45.0, 43.0, 43.0, 34.0, 36.0, 37.0, 36.0, 30.0, 30.0, 32.0, 18.0, 26.0, 23.0, 13.0, 21.0, 19.0, 10.0, 8.0, 7.0, 10.0, 6.0, 9.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.912818908691406, -53.04204177856445, -51.1712646484375, -49.30048751831055, -47.429710388183594, -45.55893325805664, -43.68815612792969, -41.8173828125, -39.94660186767578, -38.07582473754883, -36.205047607421875, -34.33427047729492, -32.46349334716797, -30.592716217041016, -28.721940994262695, -26.851163864135742, -24.980388641357422, -23.10961151123047, -21.238834381103516, -19.368057250976562, -17.49728012084961, -15.626503944396973, -13.755727767944336, -11.884950637817383, -10.01417350769043, -8.143396377563477, -6.272619724273682, -4.401843070983887, -2.5310659408569336, -0.6602888107299805, 1.2104873657226562, 3.0812644958496094, 4.9520416259765625, 6.822818756103516, 8.693595886230469, 10.564372062683105, 12.435149192810059, 14.305926322937012, 16.17670249938965, 18.0474796295166, 19.918256759643555, 21.789033889770508, 23.65981101989746, 25.53058624267578, 27.401363372802734, 29.272140502929688, 31.14291763305664, 33.013694763183594, 34.88447189331055, 36.7552490234375, 38.62602615356445, 40.496803283691406, 42.36758041381836, 44.23835754394531, 46.109130859375, 47.97991180419922, 49.850685119628906, 51.72146224975586, 53.59223937988281, 55.463016510009766, 57.33379364013672, 59.20457077026367, 61.075347900390625, 62.94612121582031, 64.81690216064453]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 3.0, 6.0, 5.0, 4.0, 6.0, 9.0, 12.0, 9.0, 16.0, 24.0, 20.0, 20.0, 25.0, 23.0, 22.0, 24.0, 23.0, 33.0, 31.0, 35.0, 36.0, 37.0, 24.0, 37.0, 41.0, 35.0, 34.0, 34.0, 47.0, 34.0, 31.0, 33.0, 30.0, 30.0, 21.0, 22.0, 21.0, 15.0, 17.0, 18.0, 7.0, 3.0, 12.0, 9.0, 10.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.96181106567383, -49.15064239501953, -47.33946990966797, -45.52830123901367, -43.717132568359375, -41.90596008300781, -40.094791412353516, -38.28362274169922, -36.472450256347656, -34.66128158569336, -32.8501091003418, -31.0389404296875, -29.22776985168457, -27.41659927368164, -25.605430603027344, -23.794260025024414, -21.983089447021484, -20.171918869018555, -18.360748291015625, -16.549579620361328, -14.738409042358398, -12.927238464355469, -11.116068840026855, -9.304899215698242, -7.4937286376953125, -5.682558536529541, -3.8713884353637695, -2.060218334197998, -0.24904823303222656, 1.5621223449707031, 3.3732919692993164, 5.18446159362793, 6.995635986328125, 8.806806564331055, 10.617976188659668, 12.429145812988281, 14.240316390991211, 16.05148696899414, 17.862655639648438, 19.673826217651367, 21.484996795654297, 23.296167373657227, 25.107337951660156, 26.918506622314453, 28.729677200317383, 30.540847778320312, 32.35201644897461, 34.163185119628906, 35.97435760498047, 37.785526275634766, 39.59669876098633, 41.407867431640625, 43.21903991699219, 45.030208587646484, 46.84137725830078, 48.652549743652344, 50.46371841430664, 52.27488708496094, 54.0860595703125, 55.8972282409668, 57.708396911621094, 59.519569396972656, 61.33073806762695, 63.14190673828125, 64.95307922363281]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 12.0, 25.0, 40.0, 71.0, 89.0, 168.0, 263.0, 448.0, 739.0, 1193.0, 1930.0, 3152.0, 4795.0, 7269.0, 10550.0, 15717.0, 22293.0, 30518.0, 40658.0, 52069.0, 63835.0, 75542.0, 83509.0, 89533.0, 90778.0, 86503.0, 79057.0, 68847.0, 57659.0, 45140.0, 35299.0, 25929.0, 18239.0, 12830.0, 8514.0, 5449.0, 3705.0, 2335.0, 1444.0, 958.0, 547.0, 369.0, 197.0, 126.0, 94.0, 55.0, 23.0, 13.0, 12.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-37.25, -36.09375, -34.9375, -33.78125, -32.625, -31.46875, -30.3125, -29.15625, -28.0, -26.84375, -25.6875, -24.53125, -23.375, -22.21875, -21.0625, -19.90625, -18.75, -17.59375, -16.4375, -15.28125, -14.125, -12.96875, -11.8125, -10.65625, -9.5, -8.34375, -7.1875, -6.03125, -4.875, -3.71875, -2.5625, -1.40625, -0.25, 0.90625, 2.0625, 3.21875, 4.375, 5.53125, 6.6875, 7.84375, 9.0, 10.15625, 11.3125, 12.46875, 13.625, 14.78125, 15.9375, 17.09375, 18.25, 19.40625, 20.5625, 21.71875, 22.875, 24.03125, 25.1875, 26.34375, 27.5, 28.65625, 29.8125, 30.96875, 32.125, 33.28125, 34.4375, 35.59375, 36.75]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 7.0, 9.0, 9.0, 12.0, 11.0, 25.0, 22.0, 17.0, 28.0, 21.0, 24.0, 22.0, 26.0, 33.0, 28.0, 30.0, 39.0, 37.0, 30.0, 28.0, 42.0, 36.0, 30.0, 41.0, 43.0, 37.0, 30.0, 34.0, 34.0, 25.0, 24.0, 20.0, 22.0, 17.0, 17.0, 17.0, 8.0, 5.0, 11.0, 6.0, 8.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-49.65625, -47.90234375, -46.1484375, -44.39453125, -42.640625, -40.88671875, -39.1328125, -37.37890625, -35.625, -33.87109375, -32.1171875, -30.36328125, -28.609375, -26.85546875, -25.1015625, -23.34765625, -21.59375, -19.83984375, -18.0859375, -16.33203125, -14.578125, -12.82421875, -11.0703125, -9.31640625, -7.5625, -5.80859375, -4.0546875, -2.30078125, -0.546875, 1.20703125, 2.9609375, 4.71484375, 6.46875, 8.22265625, 9.9765625, 11.73046875, 13.484375, 15.23828125, 16.9921875, 18.74609375, 20.5, 22.25390625, 24.0078125, 25.76171875, 27.515625, 29.26953125, 31.0234375, 32.77734375, 34.53125, 36.28515625, 38.0390625, 39.79296875, 41.546875, 43.30078125, 45.0546875, 46.80859375, 48.5625, 50.31640625, 52.0703125, 53.82421875, 55.578125, 57.33203125, 59.0859375, 60.83984375, 62.59375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 8.0, 9.0, 23.0, 32.0, 43.0, 72.0, 117.0, 166.0, 246.0, 432.0, 628.0, 1004.0, 1526.0, 2285.0, 3433.0, 4993.0, 7187.0, 10428.0, 14558.0, 20210.0, 26655.0, 34445.0, 44101.0, 53701.0, 63620.0, 72353.0, 78222.0, 81872.0, 82336.0, 78863.0, 72505.0, 64138.0, 54054.0, 44333.0, 34699.0, 27237.0, 20022.0, 14824.0, 10568.0, 7432.0, 5169.0, 3269.0, 2332.0, 1549.0, 1013.0, 649.0, 422.0, 287.0, 181.0, 121.0, 68.0, 51.0, 24.0, 27.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0], "bins": [-31.125, -30.12158203125, -29.1181640625, -28.11474609375, -27.111328125, -26.10791015625, -25.1044921875, -24.10107421875, -23.09765625, -22.09423828125, -21.0908203125, -20.08740234375, -19.083984375, -18.08056640625, -17.0771484375, -16.07373046875, -15.0703125, -14.06689453125, -13.0634765625, -12.06005859375, -11.056640625, -10.05322265625, -9.0498046875, -8.04638671875, -7.04296875, -6.03955078125, -5.0361328125, -4.03271484375, -3.029296875, -2.02587890625, -1.0224609375, -0.01904296875, 0.984375, 1.98779296875, 2.9912109375, 3.99462890625, 4.998046875, 6.00146484375, 7.0048828125, 8.00830078125, 9.01171875, 10.01513671875, 11.0185546875, 12.02197265625, 13.025390625, 14.02880859375, 15.0322265625, 16.03564453125, 17.0390625, 18.04248046875, 19.0458984375, 20.04931640625, 21.052734375, 22.05615234375, 23.0595703125, 24.06298828125, 25.06640625, 26.06982421875, 27.0732421875, 28.07666015625, 29.080078125, 30.08349609375, 31.0869140625, 32.09033203125, 33.09375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 9.0, 8.0, 6.0, 9.0, 3.0, 12.0, 12.0, 10.0, 15.0, 18.0, 24.0, 31.0, 36.0, 22.0, 36.0, 25.0, 46.0, 36.0, 24.0, 31.0, 49.0, 41.0, 45.0, 46.0, 35.0, 35.0, 42.0, 37.0, 35.0, 32.0, 41.0, 22.0, 18.0, 14.0, 13.0, 18.0, 16.0, 9.0, 6.0, 8.0, 6.0, 9.0, 7.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.5625, -39.32861328125, -38.0947265625, -36.86083984375, -35.626953125, -34.39306640625, -33.1591796875, -31.92529296875, -30.69140625, -29.45751953125, -28.2236328125, -26.98974609375, -25.755859375, -24.52197265625, -23.2880859375, -22.05419921875, -20.8203125, -19.58642578125, -18.3525390625, -17.11865234375, -15.884765625, -14.65087890625, -13.4169921875, -12.18310546875, -10.94921875, -9.71533203125, -8.4814453125, -7.24755859375, -6.013671875, -4.77978515625, -3.5458984375, -2.31201171875, -1.078125, 0.15576171875, 1.3896484375, 2.62353515625, 3.857421875, 5.09130859375, 6.3251953125, 7.55908203125, 8.79296875, 10.02685546875, 11.2607421875, 12.49462890625, 13.728515625, 14.96240234375, 16.1962890625, 17.43017578125, 18.6640625, 19.89794921875, 21.1318359375, 22.36572265625, 23.599609375, 24.83349609375, 26.0673828125, 27.30126953125, 28.53515625, 29.76904296875, 31.0029296875, 32.23681640625, 33.470703125, 34.70458984375, 35.9384765625, 37.17236328125, 38.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 12.0, 22.0, 21.0, 44.0, 89.0, 129.0, 197.0, 319.0, 462.0, 800.0, 1206.0, 1957.0, 2969.0, 4681.0, 7477.0, 11325.0, 16883.0, 25114.0, 35107.0, 47775.0, 62118.0, 76535.0, 88967.0, 97963.0, 100552.0, 96898.0, 87565.0, 74443.0, 59414.0, 45460.0, 33374.0, 23403.0, 15913.0, 10544.0, 6800.0, 4335.0, 2758.0, 1802.0, 1187.0, 685.0, 398.0, 289.0, 202.0, 126.0, 79.0, 50.0, 39.0, 27.0, 16.0, 11.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.546875, -15.052001953125, -14.55712890625, -14.062255859375, -13.5673828125, -13.072509765625, -12.57763671875, -12.082763671875, -11.587890625, -11.093017578125, -10.59814453125, -10.103271484375, -9.6083984375, -9.113525390625, -8.61865234375, -8.123779296875, -7.62890625, -7.134033203125, -6.63916015625, -6.144287109375, -5.6494140625, -5.154541015625, -4.65966796875, -4.164794921875, -3.669921875, -3.175048828125, -2.68017578125, -2.185302734375, -1.6904296875, -1.195556640625, -0.70068359375, -0.205810546875, 0.2890625, 0.783935546875, 1.27880859375, 1.773681640625, 2.2685546875, 2.763427734375, 3.25830078125, 3.753173828125, 4.248046875, 4.742919921875, 5.23779296875, 5.732666015625, 6.2275390625, 6.722412109375, 7.21728515625, 7.712158203125, 8.20703125, 8.701904296875, 9.19677734375, 9.691650390625, 10.1865234375, 10.681396484375, 11.17626953125, 11.671142578125, 12.166015625, 12.660888671875, 13.15576171875, 13.650634765625, 14.1455078125, 14.640380859375, 15.13525390625, 15.630126953125, 16.125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 10.0, 3.0, 7.0, 3.0, 13.0, 10.0, 11.0, 10.0, 22.0, 21.0, 22.0, 26.0, 33.0, 33.0, 37.0, 44.0, 37.0, 34.0, 44.0, 37.0, 39.0, 49.0, 38.0, 42.0, 50.0, 39.0, 45.0, 28.0, 34.0, 28.0, 23.0, 22.0, 23.0, 13.0, 6.0, 14.0, 16.0, 11.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0020885467529296875, -0.002025127410888672, -0.0019617080688476562, -0.0018982887268066406, -0.001834869384765625, -0.0017714500427246094, -0.0017080307006835938, -0.0016446113586425781, -0.0015811920166015625, -0.0015177726745605469, -0.0014543533325195312, -0.0013909339904785156, -0.0013275146484375, -0.0012640953063964844, -0.0012006759643554688, -0.0011372566223144531, -0.0010738372802734375, -0.0010104179382324219, -0.0009469985961914062, -0.0008835792541503906, -0.000820159912109375, -0.0007567405700683594, -0.0006933212280273438, -0.0006299018859863281, -0.0005664825439453125, -0.0005030632019042969, -0.00043964385986328125, -0.0003762245178222656, -0.00031280517578125, -0.0002493858337402344, -0.00018596649169921875, -0.00012254714965820312, -5.91278076171875e-05, 4.291534423828125e-06, 6.771087646484375e-05, 0.00013113021850585938, 0.000194549560546875, 0.0002579689025878906, 0.00032138824462890625, 0.0003848075866699219, 0.0004482269287109375, 0.0005116462707519531, 0.0005750656127929688, 0.0006384849548339844, 0.000701904296875, 0.0007653236389160156, 0.0008287429809570312, 0.0008921623229980469, 0.0009555816650390625, 0.0010190010070800781, 0.0010824203491210938, 0.0011458396911621094, 0.001209259033203125, 0.0012726783752441406, 0.0013360977172851562, 0.0013995170593261719, 0.0014629364013671875, 0.0015263557434082031, 0.0015897750854492188, 0.0016531944274902344, 0.00171661376953125, 0.0017800331115722656, 0.0018434524536132812, 0.0019068717956542969, 0.0019702911376953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 8.0, 25.0, 43.0, 58.0, 84.0, 156.0, 269.0, 397.0, 692.0, 1048.0, 1642.0, 2656.0, 4294.0, 6642.0, 10369.0, 15784.0, 23907.0, 35077.0, 48876.0, 65059.0, 81997.0, 97103.0, 106551.0, 108292.0, 101046.0, 88325.0, 72140.0, 55019.0, 40034.0, 28203.0, 18901.0, 12270.0, 8023.0, 5202.0, 3163.0, 1971.0, 1233.0, 734.0, 496.0, 306.0, 168.0, 94.0, 76.0, 46.0, 30.0, 19.0, 8.0, 3.0, 8.0, 2.0, 1.0, 0.0, 2.0], "bins": [-20.65625, -20.05224609375, -19.4482421875, -18.84423828125, -18.240234375, -17.63623046875, -17.0322265625, -16.42822265625, -15.82421875, -15.22021484375, -14.6162109375, -14.01220703125, -13.408203125, -12.80419921875, -12.2001953125, -11.59619140625, -10.9921875, -10.38818359375, -9.7841796875, -9.18017578125, -8.576171875, -7.97216796875, -7.3681640625, -6.76416015625, -6.16015625, -5.55615234375, -4.9521484375, -4.34814453125, -3.744140625, -3.14013671875, -2.5361328125, -1.93212890625, -1.328125, -0.72412109375, -0.1201171875, 0.48388671875, 1.087890625, 1.69189453125, 2.2958984375, 2.89990234375, 3.50390625, 4.10791015625, 4.7119140625, 5.31591796875, 5.919921875, 6.52392578125, 7.1279296875, 7.73193359375, 8.3359375, 8.93994140625, 9.5439453125, 10.14794921875, 10.751953125, 11.35595703125, 11.9599609375, 12.56396484375, 13.16796875, 13.77197265625, 14.3759765625, 14.97998046875, 15.583984375, 16.18798828125, 16.7919921875, 17.39599609375, 18.0]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 8.0, 2.0, 6.0, 12.0, 7.0, 10.0, 14.0, 12.0, 22.0, 16.0, 31.0, 27.0, 18.0, 20.0, 36.0, 29.0, 37.0, 37.0, 40.0, 50.0, 47.0, 51.0, 40.0, 27.0, 39.0, 47.0, 42.0, 34.0, 37.0, 28.0, 22.0, 23.0, 20.0, 22.0, 14.0, 19.0, 15.0, 9.0, 8.0, 6.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.8671875, -7.6195068359375, -7.371826171875, -7.1241455078125, -6.87646484375, -6.6287841796875, -6.381103515625, -6.1334228515625, -5.8857421875, -5.6380615234375, -5.390380859375, -5.1427001953125, -4.89501953125, -4.6473388671875, -4.399658203125, -4.1519775390625, -3.904296875, -3.6566162109375, -3.408935546875, -3.1612548828125, -2.91357421875, -2.6658935546875, -2.418212890625, -2.1705322265625, -1.9228515625, -1.6751708984375, -1.427490234375, -1.1798095703125, -0.93212890625, -0.6844482421875, -0.436767578125, -0.1890869140625, 0.05859375, 0.3062744140625, 0.553955078125, 0.8016357421875, 1.04931640625, 1.2969970703125, 1.544677734375, 1.7923583984375, 2.0400390625, 2.2877197265625, 2.535400390625, 2.7830810546875, 3.03076171875, 3.2784423828125, 3.526123046875, 3.7738037109375, 4.021484375, 4.2691650390625, 4.516845703125, 4.7645263671875, 5.01220703125, 5.2598876953125, 5.507568359375, 5.7552490234375, 6.0029296875, 6.2506103515625, 6.498291015625, 6.7459716796875, 6.99365234375, 7.2413330078125, 7.489013671875, 7.7366943359375, 7.984375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 5.0, 14.0, 6.0, 11.0, 12.0, 16.0, 22.0, 12.0, 18.0, 24.0, 31.0, 25.0, 27.0, 35.0, 38.0, 30.0, 49.0, 42.0, 43.0, 53.0, 47.0, 35.0, 35.0, 42.0, 31.0, 33.0, 30.0, 27.0, 24.0, 29.0, 27.0, 22.0, 15.0, 14.0, 19.0, 3.0, 13.0, 8.0, 4.0, 8.0, 6.0, 7.0, 3.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.916141510009766, -59.020442962646484, -57.12474060058594, -55.229042053222656, -53.333343505859375, -51.437644958496094, -49.54194259643555, -47.646244049072266, -45.75054168701172, -43.85484313964844, -41.95914077758789, -40.06344223022461, -38.16774368286133, -36.27204132080078, -34.3763427734375, -32.48064422607422, -30.584945678710938, -28.689245223999023, -26.793546676635742, -24.897846221923828, -23.002147674560547, -21.106447219848633, -19.21074676513672, -17.315048217773438, -15.419347763061523, -13.523648262023926, -11.627948760986328, -9.732248306274414, -7.836548805236816, -5.940849304199219, -4.045148849487305, -2.149449348449707, -0.25374603271484375, 1.641953706741333, 3.5376534461975098, 5.433353424072266, 7.329052925109863, 9.224752426147461, 11.120452880859375, 13.016152381896973, 14.91185188293457, 16.807552337646484, 18.703250885009766, 20.59895133972168, 22.494651794433594, 24.390350341796875, 26.28605079650879, 28.181751251220703, 30.077449798583984, 31.9731502532959, 33.86885070800781, 35.764549255371094, 37.660247802734375, 39.555946350097656, 41.4516487121582, 43.347347259521484, 45.24304962158203, 47.13874816894531, 49.03445053100586, 50.93014907836914, 52.82584762573242, 54.72154998779297, 56.61724853515625, 58.51294708251953, 60.40864562988281]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 9.0, 2.0, 5.0, 3.0, 7.0, 15.0, 10.0, 12.0, 18.0, 23.0, 21.0, 24.0, 28.0, 22.0, 29.0, 29.0, 27.0, 27.0, 30.0, 32.0, 36.0, 40.0, 45.0, 29.0, 32.0, 40.0, 28.0, 33.0, 42.0, 30.0, 38.0, 21.0, 27.0, 31.0, 29.0, 20.0, 24.0, 12.0, 14.0, 10.0, 6.0, 10.0, 6.0, 7.0, 7.0, 9.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.048343658447266, -52.148345947265625, -50.24835205078125, -48.34835433959961, -46.44835662841797, -44.548362731933594, -42.64836502075195, -40.74836730957031, -38.84837341308594, -36.9483757019043, -35.04838180541992, -33.14838409423828, -31.248388290405273, -29.348392486572266, -27.448394775390625, -25.548398971557617, -23.64840316772461, -21.7484073638916, -19.848411560058594, -17.948413848876953, -16.048418045043945, -14.148422241210938, -12.248425483703613, -10.348428726196289, -8.448432922363281, -6.548436641693115, -4.648440361022949, -2.748444080352783, -0.8484477996826172, 1.0515480041503906, 2.951544761657715, 4.851541519165039, 6.751533508300781, 8.651529312133789, 10.551526069641113, 12.451522827148438, 14.351518630981445, 16.251514434814453, 18.151512145996094, 20.0515079498291, 21.95150375366211, 23.851499557495117, 25.751495361328125, 27.651493072509766, 29.551488876342773, 31.45148468017578, 33.35148239135742, 35.25148010253906, 37.15147399902344, 39.05147171020508, 40.95146560668945, 42.851463317871094, 44.75145721435547, 46.65145492553711, 48.55145263671875, 50.451446533203125, 52.351444244384766, 54.251441955566406, 56.15143585205078, 58.05143356323242, 59.95143127441406, 61.85142517089844, 63.75142288208008, 65.65142059326172, 67.5514144897461]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [4.0, 5.0, 4.0, 9.0, 17.0, 24.0, 33.0, 73.0, 118.0, 201.0, 353.0, 614.0, 970.0, 1711.0, 2653.0, 4267.0, 6951.0, 11057.0, 16992.0, 26008.0, 39481.0, 58360.0, 84901.0, 118129.0, 160822.0, 211544.0, 263590.0, 316971.0, 357499.0, 382161.0, 383733.0, 363903.0, 323348.0, 272912.0, 218901.0, 168699.0, 125246.0, 89028.0, 62778.0, 42033.0, 28081.0, 18458.0, 11850.0, 7437.0, 4745.0, 2932.0, 1778.0, 1114.0, 719.0, 422.0, 261.0, 147.0, 103.0, 62.0, 35.0, 25.0, 14.0, 5.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.75, -37.4619140625, -36.173828125, -34.8857421875, -33.59765625, -32.3095703125, -31.021484375, -29.7333984375, -28.4453125, -27.1572265625, -25.869140625, -24.5810546875, -23.29296875, -22.0048828125, -20.716796875, -19.4287109375, -18.140625, -16.8525390625, -15.564453125, -14.2763671875, -12.98828125, -11.7001953125, -10.412109375, -9.1240234375, -7.8359375, -6.5478515625, -5.259765625, -3.9716796875, -2.68359375, -1.3955078125, -0.107421875, 1.1806640625, 2.46875, 3.7568359375, 5.044921875, 6.3330078125, 7.62109375, 8.9091796875, 10.197265625, 11.4853515625, 12.7734375, 14.0615234375, 15.349609375, 16.6376953125, 17.92578125, 19.2138671875, 20.501953125, 21.7900390625, 23.078125, 24.3662109375, 25.654296875, 26.9423828125, 28.23046875, 29.5185546875, 30.806640625, 32.0947265625, 33.3828125, 34.6708984375, 35.958984375, 37.2470703125, 38.53515625, 39.8232421875, 41.111328125, 42.3994140625, 43.6875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 3.0, 9.0, 15.0, 9.0, 18.0, 17.0, 24.0, 20.0, 31.0, 25.0, 21.0, 30.0, 36.0, 24.0, 25.0, 34.0, 39.0, 32.0, 41.0, 42.0, 32.0, 40.0, 29.0, 31.0, 45.0, 29.0, 34.0, 33.0, 24.0, 25.0, 37.0, 19.0, 26.0, 11.0, 15.0, 11.0, 7.0, 9.0, 7.0, 8.0, 6.0, 6.0, 6.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.46875, -46.72705078125, -44.9853515625, -43.24365234375, -41.501953125, -39.76025390625, -38.0185546875, -36.27685546875, -34.53515625, -32.79345703125, -31.0517578125, -29.31005859375, -27.568359375, -25.82666015625, -24.0849609375, -22.34326171875, -20.6015625, -18.85986328125, -17.1181640625, -15.37646484375, -13.634765625, -11.89306640625, -10.1513671875, -8.40966796875, -6.66796875, -4.92626953125, -3.1845703125, -1.44287109375, 0.298828125, 2.04052734375, 3.7822265625, 5.52392578125, 7.265625, 9.00732421875, 10.7490234375, 12.49072265625, 14.232421875, 15.97412109375, 17.7158203125, 19.45751953125, 21.19921875, 22.94091796875, 24.6826171875, 26.42431640625, 28.166015625, 29.90771484375, 31.6494140625, 33.39111328125, 35.1328125, 36.87451171875, 38.6162109375, 40.35791015625, 42.099609375, 43.84130859375, 45.5830078125, 47.32470703125, 49.06640625, 50.80810546875, 52.5498046875, 54.29150390625, 56.033203125, 57.77490234375, 59.5166015625, 61.25830078125, 63.0]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 8.0, 11.0, 28.0, 46.0, 84.0, 148.0, 252.0, 369.0, 622.0, 1061.0, 1709.0, 2756.0, 4360.0, 6850.0, 10948.0, 16603.0, 24801.0, 37314.0, 53669.0, 75767.0, 104097.0, 139289.0, 179036.0, 222311.0, 265658.0, 303367.0, 332588.0, 347208.0, 345121.0, 327577.0, 297288.0, 258002.0, 214419.0, 171073.0, 131602.0, 97494.0, 70836.0, 50413.0, 34444.0, 22847.0, 15467.0, 9894.0, 6457.0, 3948.0, 2520.0, 1557.0, 961.0, 572.0, 360.0, 192.0, 128.0, 70.0, 42.0, 27.0, 7.0, 10.0, 2.0, 1.0, 1.0, 1.0], "bins": [-40.8125, -39.533203125, -38.25390625, -36.974609375, -35.6953125, -34.416015625, -33.13671875, -31.857421875, -30.578125, -29.298828125, -28.01953125, -26.740234375, -25.4609375, -24.181640625, -22.90234375, -21.623046875, -20.34375, -19.064453125, -17.78515625, -16.505859375, -15.2265625, -13.947265625, -12.66796875, -11.388671875, -10.109375, -8.830078125, -7.55078125, -6.271484375, -4.9921875, -3.712890625, -2.43359375, -1.154296875, 0.125, 1.404296875, 2.68359375, 3.962890625, 5.2421875, 6.521484375, 7.80078125, 9.080078125, 10.359375, 11.638671875, 12.91796875, 14.197265625, 15.4765625, 16.755859375, 18.03515625, 19.314453125, 20.59375, 21.873046875, 23.15234375, 24.431640625, 25.7109375, 26.990234375, 28.26953125, 29.548828125, 30.828125, 32.107421875, 33.38671875, 34.666015625, 35.9453125, 37.224609375, 38.50390625, 39.783203125, 41.0625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 12.0, 12.0, 11.0, 17.0, 26.0, 23.0, 33.0, 56.0, 48.0, 74.0, 77.0, 85.0, 110.0, 113.0, 125.0, 146.0, 139.0, 153.0, 152.0, 186.0, 182.0, 193.0, 180.0, 176.0, 162.0, 164.0, 178.0, 152.0, 133.0, 129.0, 115.0, 114.0, 96.0, 74.0, 82.0, 59.0, 44.0, 53.0, 41.0, 32.0, 35.0, 16.0, 15.0, 7.0, 7.0, 13.0, 7.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-24.59375, -23.836669921875, -23.07958984375, -22.322509765625, -21.5654296875, -20.808349609375, -20.05126953125, -19.294189453125, -18.537109375, -17.780029296875, -17.02294921875, -16.265869140625, -15.5087890625, -14.751708984375, -13.99462890625, -13.237548828125, -12.48046875, -11.723388671875, -10.96630859375, -10.209228515625, -9.4521484375, -8.695068359375, -7.93798828125, -7.180908203125, -6.423828125, -5.666748046875, -4.90966796875, -4.152587890625, -3.3955078125, -2.638427734375, -1.88134765625, -1.124267578125, -0.3671875, 0.389892578125, 1.14697265625, 1.904052734375, 2.6611328125, 3.418212890625, 4.17529296875, 4.932373046875, 5.689453125, 6.446533203125, 7.20361328125, 7.960693359375, 8.7177734375, 9.474853515625, 10.23193359375, 10.989013671875, 11.74609375, 12.503173828125, 13.26025390625, 14.017333984375, 14.7744140625, 15.531494140625, 16.28857421875, 17.045654296875, 17.802734375, 18.559814453125, 19.31689453125, 20.073974609375, 20.8310546875, 21.588134765625, 22.34521484375, 23.102294921875, 23.859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 10.0, 7.0, 8.0, 17.0, 14.0, 16.0, 22.0, 21.0, 22.0, 31.0, 30.0, 36.0, 30.0, 30.0, 43.0, 43.0, 56.0, 48.0, 45.0, 35.0, 27.0, 38.0, 40.0, 32.0, 27.0, 37.0, 28.0, 23.0, 22.0, 25.0, 20.0, 14.0, 8.0, 10.0, 14.0, 12.0, 8.0, 12.0, 5.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.678443908691406, -55.83201599121094, -53.98558807373047, -52.13916015625, -50.29273223876953, -48.44630432128906, -46.599876403808594, -44.753448486328125, -42.907020568847656, -41.06059265136719, -39.21416473388672, -37.36773681640625, -35.52130889892578, -33.67488098144531, -31.828453063964844, -29.982025146484375, -28.135595321655273, -26.289167404174805, -24.442739486694336, -22.596311569213867, -20.7498836517334, -18.903453826904297, -17.057025909423828, -15.210598945617676, -13.364171028137207, -11.517743110656738, -9.67131519317627, -7.824886798858643, -5.978458881378174, -4.132030487060547, -2.285602569580078, -0.4391746520996094, 1.4072532653808594, 3.253681182861328, 5.100109100341797, 6.946537494659424, 8.792964935302734, 10.63939380645752, 12.485821723937988, 14.332249641418457, 16.17867660522461, 18.025104522705078, 19.871532440185547, 21.717960357666016, 23.564388275146484, 25.410816192626953, 27.257244110107422, 29.10367202758789, 30.950101852416992, 32.796531677246094, 34.64295959472656, 36.48938751220703, 38.3358154296875, 40.18224334716797, 42.02867126464844, 43.875099182128906, 45.721527099609375, 47.567955017089844, 49.41438293457031, 51.26081085205078, 53.10723876953125, 54.95366668701172, 56.80009460449219, 58.646522521972656, 60.492950439453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 8.0, 4.0, 13.0, 10.0, 13.0, 7.0, 16.0, 20.0, 13.0, 23.0, 22.0, 20.0, 22.0, 25.0, 24.0, 32.0, 26.0, 41.0, 35.0, 42.0, 32.0, 35.0, 41.0, 38.0, 43.0, 42.0, 32.0, 25.0, 32.0, 29.0, 20.0, 26.0, 23.0, 27.0, 21.0, 17.0, 11.0, 10.0, 13.0, 10.0, 11.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-55.211090087890625, -53.36396789550781, -51.516849517822266, -49.66972732543945, -47.822608947753906, -45.975486755371094, -44.12836456298828, -42.281246185302734, -40.43412780761719, -38.587005615234375, -36.73988723754883, -34.892765045166016, -33.04564666748047, -31.198524475097656, -29.351404190063477, -27.504283905029297, -25.657161712646484, -23.810041427612305, -21.962921142578125, -20.115798950195312, -18.268680572509766, -16.421558380126953, -14.574438095092773, -12.727317810058594, -10.880197525024414, -9.033077239990234, -7.1859564781188965, -5.338835716247559, -3.491715431213379, -1.6445951461791992, 0.20252609252929688, 2.0496463775634766, 3.8967628479003906, 5.74388313293457, 7.591003894805908, 9.438124656677246, 11.285244941711426, 13.132365226745605, 14.979486465454102, 16.82660675048828, 18.67372703552246, 20.52084732055664, 22.36796760559082, 24.215087890625, 26.062210083007812, 27.90932846069336, 29.756450653076172, 31.60357093811035, 33.45069122314453, 35.297813415527344, 37.14493179321289, 38.9920539855957, 40.83917236328125, 42.68629455566406, 44.533416748046875, 46.38053512573242, 48.22765350341797, 50.07477569580078, 51.92189407348633, 53.76901626586914, 55.61613464355469, 57.4632568359375, 59.31037902832031, 61.15749740600586, 63.00461959838867]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 8.0, 21.0, 26.0, 34.0, 57.0, 84.0, 158.0, 224.0, 367.0, 575.0, 908.0, 1398.0, 2225.0, 3475.0, 5626.0, 8444.0, 13188.0, 19503.0, 29327.0, 42111.0, 58614.0, 76939.0, 95321.0, 108730.0, 113762.0, 110012.0, 95378.0, 76982.0, 58046.0, 41855.0, 29095.0, 19587.0, 12955.0, 8494.0, 5497.0, 3491.0, 2183.0, 1426.0, 886.0, 530.0, 321.0, 246.0, 171.0, 97.0, 61.0, 42.0, 25.0, 18.0, 7.0, 12.0, 5.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.41015625, -8.125, -7.83984375, -7.5546875, -7.26953125, -6.984375, -6.69921875, -6.4140625, -6.12890625, -5.84375, -5.55859375, -5.2734375, -4.98828125, -4.703125, -4.41796875, -4.1328125, -3.84765625, -3.5625, -3.27734375, -2.9921875, -2.70703125, -2.421875, -2.13671875, -1.8515625, -1.56640625, -1.28125, -0.99609375, -0.7109375, -0.42578125, -0.140625, 0.14453125, 0.4296875, 0.71484375, 1.0, 1.28515625, 1.5703125, 1.85546875, 2.140625, 2.42578125, 2.7109375, 2.99609375, 3.28125, 3.56640625, 3.8515625, 4.13671875, 4.421875, 4.70703125, 4.9921875, 5.27734375, 5.5625, 5.84765625, 6.1328125, 6.41796875, 6.703125, 6.98828125, 7.2734375, 7.55859375, 7.84375, 8.12890625, 8.4140625, 8.69921875, 8.984375, 9.26953125, 9.5546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 4.0, 13.0, 11.0, 12.0, 8.0, 18.0, 16.0, 15.0, 23.0, 21.0, 21.0, 22.0, 26.0, 22.0, 30.0, 27.0, 41.0, 37.0, 42.0, 32.0, 37.0, 39.0, 38.0, 43.0, 41.0, 31.0, 27.0, 30.0, 29.0, 22.0, 26.0, 23.0, 27.0, 20.0, 16.0, 11.0, 12.0, 13.0, 11.0, 10.0, 7.0, 8.0, 2.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-55.5, -53.64990234375, -51.7998046875, -49.94970703125, -48.099609375, -46.24951171875, -44.3994140625, -42.54931640625, -40.69921875, -38.84912109375, -36.9990234375, -35.14892578125, -33.298828125, -31.44873046875, -29.5986328125, -27.74853515625, -25.8984375, -24.04833984375, -22.1982421875, -20.34814453125, -18.498046875, -16.64794921875, -14.7978515625, -12.94775390625, -11.09765625, -9.24755859375, -7.3974609375, -5.54736328125, -3.697265625, -1.84716796875, 0.0029296875, 1.85302734375, 3.703125, 5.55322265625, 7.4033203125, 9.25341796875, 11.103515625, 12.95361328125, 14.8037109375, 16.65380859375, 18.50390625, 20.35400390625, 22.2041015625, 24.05419921875, 25.904296875, 27.75439453125, 29.6044921875, 31.45458984375, 33.3046875, 35.15478515625, 37.0048828125, 38.85498046875, 40.705078125, 42.55517578125, 44.4052734375, 46.25537109375, 48.10546875, 49.95556640625, 51.8056640625, 53.65576171875, 55.505859375, 57.35595703125, 59.2060546875, 61.05615234375, 62.90625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 12.0, 18.0, 26.0, 47.0, 72.0, 123.0, 184.0, 308.0, 486.0, 825.0, 1305.0, 2129.0, 3541.0, 5729.0, 9385.0, 15718.0, 28512.0, 188235.0, 705318.0, 38353.0, 19296.0, 11278.0, 6842.0, 4320.0, 2490.0, 1583.0, 906.0, 611.0, 346.0, 208.0, 124.0, 90.0, 40.0, 36.0, 17.0, 10.0, 11.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.3125, -25.46875, -24.625, -23.78125, -22.9375, -22.09375, -21.25, -20.40625, -19.5625, -18.71875, -17.875, -17.03125, -16.1875, -15.34375, -14.5, -13.65625, -12.8125, -11.96875, -11.125, -10.28125, -9.4375, -8.59375, -7.75, -6.90625, -6.0625, -5.21875, -4.375, -3.53125, -2.6875, -1.84375, -1.0, -0.15625, 0.6875, 1.53125, 2.375, 3.21875, 4.0625, 4.90625, 5.75, 6.59375, 7.4375, 8.28125, 9.125, 9.96875, 10.8125, 11.65625, 12.5, 13.34375, 14.1875, 15.03125, 15.875, 16.71875, 17.5625, 18.40625, 19.25, 20.09375, 20.9375, 21.78125, 22.625, 23.46875, 24.3125, 25.15625, 26.0, 26.84375, 27.6875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 15.0, 16.0, 8.0, 15.0, 20.0, 17.0, 27.0, 27.0, 28.0, 16.0, 28.0, 29.0, 37.0, 33.0, 42.0, 52.0, 35.0, 37.0, 48.0, 42.0, 38.0, 38.0, 32.0, 24.0, 27.0, 30.0, 34.0, 29.0, 16.0, 28.0, 12.0, 19.0, 22.0, 12.0, 12.0, 6.0, 7.0, 7.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.5, -41.146484375, -39.79296875, -38.439453125, -37.0859375, -35.732421875, -34.37890625, -33.025390625, -31.671875, -30.318359375, -28.96484375, -27.611328125, -26.2578125, -24.904296875, -23.55078125, -22.197265625, -20.84375, -19.490234375, -18.13671875, -16.783203125, -15.4296875, -14.076171875, -12.72265625, -11.369140625, -10.015625, -8.662109375, -7.30859375, -5.955078125, -4.6015625, -3.248046875, -1.89453125, -0.541015625, 0.8125, 2.166015625, 3.51953125, 4.873046875, 6.2265625, 7.580078125, 8.93359375, 10.287109375, 11.640625, 12.994140625, 14.34765625, 15.701171875, 17.0546875, 18.408203125, 19.76171875, 21.115234375, 22.46875, 23.822265625, 25.17578125, 26.529296875, 27.8828125, 29.236328125, 30.58984375, 31.943359375, 33.296875, 34.650390625, 36.00390625, 37.357421875, 38.7109375, 40.064453125, 41.41796875, 42.771484375, 44.125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 10.0, 7.0, 14.0, 20.0, 20.0, 41.0, 52.0, 83.0, 143.0, 242.0, 376.0, 639.0, 1045.0, 1909.0, 3189.0, 5542.0, 10340.0, 19016.0, 38119.0, 810029.0, 99065.0, 26876.0, 14119.0, 7556.0, 4256.0, 2315.0, 1404.0, 823.0, 481.0, 306.0, 197.0, 102.0, 70.0, 43.0, 32.0, 29.0, 7.0, 7.0, 15.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.09765625, -3.003082275390625, -2.90850830078125, -2.813934326171875, -2.7193603515625, -2.624786376953125, -2.53021240234375, -2.435638427734375, -2.341064453125, -2.246490478515625, -2.15191650390625, -2.057342529296875, -1.9627685546875, -1.868194580078125, -1.77362060546875, -1.679046630859375, -1.58447265625, -1.489898681640625, -1.39532470703125, -1.300750732421875, -1.2061767578125, -1.111602783203125, -1.01702880859375, -0.922454833984375, -0.827880859375, -0.733306884765625, -0.63873291015625, -0.544158935546875, -0.4495849609375, -0.355010986328125, -0.26043701171875, -0.165863037109375, -0.0712890625, 0.023284912109375, 0.11785888671875, 0.212432861328125, 0.3070068359375, 0.401580810546875, 0.49615478515625, 0.590728759765625, 0.685302734375, 0.779876708984375, 0.87445068359375, 0.969024658203125, 1.0635986328125, 1.158172607421875, 1.25274658203125, 1.347320556640625, 1.44189453125, 1.536468505859375, 1.63104248046875, 1.725616455078125, 1.8201904296875, 1.914764404296875, 2.00933837890625, 2.103912353515625, 2.198486328125, 2.293060302734375, 2.38763427734375, 2.482208251953125, 2.5767822265625, 2.671356201171875, 2.76593017578125, 2.860504150390625, 2.955078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 13.0, 13.0, 10.0, 17.0, 24.0, 28.0, 27.0, 35.0, 28.0, 53.0, 39.0, 44.0, 53.0, 38.0, 50.0, 46.0, 57.0, 49.0, 56.0, 42.0, 31.0, 43.0, 16.0, 35.0, 27.0, 19.0, 23.0, 18.0, 14.0, 11.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.18832015991211e-05, -6.942730396986008e-05, -6.697140634059906e-05, -6.451550871133804e-05, -6.205961108207703e-05, -5.960371345281601e-05, -5.714781582355499e-05, -5.4691918194293976e-05, -5.223602056503296e-05, -4.978012293577194e-05, -4.7324225306510925e-05, -4.486832767724991e-05, -4.241243004798889e-05, -3.9956532418727875e-05, -3.750063478946686e-05, -3.504473716020584e-05, -3.2588839530944824e-05, -3.0132941901683807e-05, -2.767704427242279e-05, -2.5221146643161774e-05, -2.2765249013900757e-05, -2.030935138463974e-05, -1.7853453755378723e-05, -1.5397556126117706e-05, -1.294165849685669e-05, -1.0485760867595673e-05, -8.029863238334656e-06, -5.573965609073639e-06, -3.118067979812622e-06, -6.621703505516052e-07, 1.7937272787094116e-06, 4.2496249079704285e-06, 6.705522537231445e-06, 9.161420166492462e-06, 1.1617317795753479e-05, 1.4073215425014496e-05, 1.6529113054275513e-05, 1.898501068353653e-05, 2.1440908312797546e-05, 2.3896805942058563e-05, 2.635270357131958e-05, 2.8808601200580597e-05, 3.1264498829841614e-05, 3.372039645910263e-05, 3.617629408836365e-05, 3.8632191717624664e-05, 4.108808934688568e-05, 4.35439869761467e-05, 4.5999884605407715e-05, 4.845578223466873e-05, 5.091167986392975e-05, 5.3367577493190765e-05, 5.582347512245178e-05, 5.82793727517128e-05, 6.0735270380973816e-05, 6.319116801023483e-05, 6.564706563949585e-05, 6.810296326875687e-05, 7.055886089801788e-05, 7.30147585272789e-05, 7.547065615653992e-05, 7.792655378580093e-05, 8.038245141506195e-05, 8.283834904432297e-05, 8.529424667358398e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 13.0, 13.0, 13.0, 18.0, 33.0, 54.0, 77.0, 104.0, 150.0, 253.0, 367.0, 536.0, 858.0, 1191.0, 1768.0, 2835.0, 4035.0, 5958.0, 8636.0, 12688.0, 18162.0, 26145.0, 36278.0, 49491.0, 66957.0, 87508.0, 107380.0, 120014.0, 116103.0, 98612.0, 77811.0, 59087.0, 42981.0, 31210.0, 22032.0, 15446.0, 10753.0, 7575.0, 5203.0, 3440.0, 2262.0, 1436.0, 1032.0, 702.0, 441.0, 294.0, 216.0, 142.0, 86.0, 57.0, 30.0, 24.0, 15.0, 19.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.9775390625, -1.9132843017578125, -1.849029541015625, -1.7847747802734375, -1.72052001953125, -1.6562652587890625, -1.592010498046875, -1.5277557373046875, -1.4635009765625, -1.3992462158203125, -1.334991455078125, -1.2707366943359375, -1.20648193359375, -1.1422271728515625, -1.077972412109375, -1.0137176513671875, -0.949462890625, -0.8852081298828125, -0.820953369140625, -0.7566986083984375, -0.69244384765625, -0.6281890869140625, -0.563934326171875, -0.4996795654296875, -0.4354248046875, -0.3711700439453125, -0.306915283203125, -0.2426605224609375, -0.17840576171875, -0.1141510009765625, -0.049896240234375, 0.0143585205078125, 0.07861328125, 0.1428680419921875, 0.207122802734375, 0.2713775634765625, 0.33563232421875, 0.3998870849609375, 0.464141845703125, 0.5283966064453125, 0.5926513671875, 0.6569061279296875, 0.721160888671875, 0.7854156494140625, 0.84967041015625, 0.9139251708984375, 0.978179931640625, 1.0424346923828125, 1.106689453125, 1.1709442138671875, 1.235198974609375, 1.2994537353515625, 1.36370849609375, 1.4279632568359375, 1.492218017578125, 1.5564727783203125, 1.6207275390625, 1.6849822998046875, 1.749237060546875, 1.8134918212890625, 1.87774658203125, 1.9420013427734375, 2.006256103515625, 2.0705108642578125, 2.134765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 9.0, 14.0, 21.0, 16.0, 16.0, 22.0, 30.0, 29.0, 32.0, 41.0, 55.0, 53.0, 55.0, 66.0, 73.0, 70.0, 47.0, 50.0, 42.0, 38.0, 38.0, 18.0, 25.0, 18.0, 11.0, 15.0, 15.0, 14.0, 5.0, 13.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.2724609375, -1.2373580932617188, -1.2022552490234375, -1.1671524047851562, -1.132049560546875, -1.0969467163085938, -1.0618438720703125, -1.0267410278320312, -0.99163818359375, -0.9565353393554688, -0.9214324951171875, -0.8863296508789062, -0.851226806640625, -0.8161239624023438, -0.7810211181640625, -0.7459182739257812, -0.7108154296875, -0.6757125854492188, -0.6406097412109375, -0.6055068969726562, -0.570404052734375, -0.5353012084960938, -0.5001983642578125, -0.46509552001953125, -0.42999267578125, -0.39488983154296875, -0.3597869873046875, -0.32468414306640625, -0.289581298828125, -0.25447845458984375, -0.2193756103515625, -0.18427276611328125, -0.149169921875, -0.11406707763671875, -0.0789642333984375, -0.04386138916015625, -0.008758544921875, 0.02634429931640625, 0.0614471435546875, 0.09654998779296875, 0.13165283203125, 0.16675567626953125, 0.2018585205078125, 0.23696136474609375, 0.272064208984375, 0.30716705322265625, 0.3422698974609375, 0.37737274169921875, 0.4124755859375, 0.44757843017578125, 0.4826812744140625, 0.5177841186523438, 0.552886962890625, 0.5879898071289062, 0.6230926513671875, 0.6581954956054688, 0.69329833984375, 0.7284011840820312, 0.7635040283203125, 0.7986068725585938, 0.833709716796875, 0.8688125610351562, 0.9039154052734375, 0.9390182495117188, 0.97412109375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 11.0, 5.0, 14.0, 14.0, 14.0, 16.0, 32.0, 17.0, 22.0, 39.0, 21.0, 33.0, 28.0, 36.0, 44.0, 46.0, 53.0, 44.0, 40.0, 40.0, 23.0, 33.0, 46.0, 31.0, 34.0, 28.0, 26.0, 20.0, 27.0, 21.0, 20.0, 14.0, 11.0, 12.0, 12.0, 9.0, 11.0, 10.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.98395538330078, -54.17173767089844, -52.359519958496094, -50.54730224609375, -48.73508834838867, -46.92287063598633, -45.110652923583984, -43.29843521118164, -41.48622131347656, -39.67400360107422, -37.861785888671875, -36.04956817626953, -34.23735427856445, -32.42513656616211, -30.612918853759766, -28.800701141357422, -26.988483428955078, -25.176265716552734, -23.364049911499023, -21.55183219909668, -19.73961639404297, -17.927398681640625, -16.11518096923828, -14.302964210510254, -12.490747451782227, -10.6785306930542, -8.866313934326172, -7.054096221923828, -5.241879463195801, -3.4296627044677734, -1.6174449920654297, 0.19477176666259766, 2.0069847106933594, 3.819201707839966, 5.631418704986572, 7.443635940551758, 9.255852699279785, 11.068069458007812, 12.880287170410156, 14.692503929138184, 16.50472068786621, 18.316938400268555, 20.129154205322266, 21.94137191772461, 23.753589630126953, 25.565805435180664, 27.378023147583008, 29.19023895263672, 31.002456665039062, 32.814674377441406, 34.62689208984375, 36.439109802246094, 38.25132369995117, 40.063541412353516, 41.87575912475586, 43.6879768371582, 45.50019073486328, 47.312408447265625, 49.12462615966797, 50.93684387207031, 52.74905776977539, 54.561275482177734, 56.37349319458008, 58.18571090698242, 59.997928619384766]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 4.0, 14.0, 13.0, 10.0, 11.0, 18.0, 13.0, 18.0, 22.0, 20.0, 21.0, 21.0, 26.0, 25.0, 31.0, 29.0, 38.0, 36.0, 47.0, 31.0, 33.0, 43.0, 39.0, 42.0, 38.0, 30.0, 28.0, 30.0, 32.0, 17.0, 28.0, 21.0, 28.0, 20.0, 14.0, 10.0, 10.0, 17.0, 12.0, 7.0, 9.0, 7.0, 2.0, 5.0, 6.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-55.297603607177734, -53.44639205932617, -51.59518051147461, -49.74396896362305, -47.892757415771484, -46.04154586791992, -44.19033432006836, -42.3391227722168, -40.487911224365234, -38.63669967651367, -36.78548812866211, -34.93427658081055, -33.083065032958984, -31.231853485107422, -29.38064193725586, -27.529430389404297, -25.6782169342041, -23.82700538635254, -21.975793838500977, -20.124582290649414, -18.27337074279785, -16.422157287597656, -14.57094669342041, -12.719735145568848, -10.868523597717285, -9.017312049865723, -7.16610050201416, -5.3148884773254395, -3.463676929473877, -1.6124649047851562, 0.23874664306640625, 2.0899581909179688, 3.9411697387695312, 5.792381286621094, 7.643592834472656, 9.494804382324219, 11.346015930175781, 13.19722843170166, 15.048439979553223, 16.89965057373047, 18.75086212158203, 20.602073669433594, 22.453285217285156, 24.30449676513672, 26.15570831298828, 28.006919860839844, 29.858131408691406, 31.70934295654297, 33.56055450439453, 35.411766052246094, 37.262977600097656, 39.11418914794922, 40.96540069580078, 42.816612243652344, 44.667823791503906, 46.51903533935547, 48.3702507019043, 50.22146224975586, 52.07267379760742, 53.923885345458984, 55.77509689331055, 57.62630844116211, 59.47751998901367, 61.328731536865234, 63.1799430847168]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 8.0, 13.0, 27.0, 32.0, 55.0, 93.0, 219.0, 285.0, 472.0, 765.0, 1171.0, 1894.0, 3047.0, 4525.0, 6671.0, 9830.0, 14092.0, 19649.0, 26839.0, 35505.0, 45629.0, 55900.0, 66583.0, 75422.0, 82225.0, 85696.0, 85174.0, 80537.0, 73010.0, 62959.0, 53357.0, 42916.0, 32958.0, 24469.0, 17951.0, 12818.0, 8650.0, 5938.0, 4074.0, 2626.0, 1605.0, 1089.0, 690.0, 436.0, 251.0, 163.0, 103.0, 56.0, 35.0, 20.0, 12.0, 8.0, 5.0, 5.0, 0.0, 1.0], "bins": [-36.75, -35.66455078125, -34.5791015625, -33.49365234375, -32.408203125, -31.32275390625, -30.2373046875, -29.15185546875, -28.06640625, -26.98095703125, -25.8955078125, -24.81005859375, -23.724609375, -22.63916015625, -21.5537109375, -20.46826171875, -19.3828125, -18.29736328125, -17.2119140625, -16.12646484375, -15.041015625, -13.95556640625, -12.8701171875, -11.78466796875, -10.69921875, -9.61376953125, -8.5283203125, -7.44287109375, -6.357421875, -5.27197265625, -4.1865234375, -3.10107421875, -2.015625, -0.93017578125, 0.1552734375, 1.24072265625, 2.326171875, 3.41162109375, 4.4970703125, 5.58251953125, 6.66796875, 7.75341796875, 8.8388671875, 9.92431640625, 11.009765625, 12.09521484375, 13.1806640625, 14.26611328125, 15.3515625, 16.43701171875, 17.5224609375, 18.60791015625, 19.693359375, 20.77880859375, 21.8642578125, 22.94970703125, 24.03515625, 25.12060546875, 26.2060546875, 27.29150390625, 28.376953125, 29.46240234375, 30.5478515625, 31.63330078125, 32.71875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 5.0, 11.0, 12.0, 12.0, 11.0, 16.0, 18.0, 15.0, 23.0, 21.0, 18.0, 22.0, 29.0, 23.0, 33.0, 29.0, 42.0, 37.0, 45.0, 32.0, 29.0, 52.0, 40.0, 40.0, 38.0, 27.0, 28.0, 33.0, 25.0, 19.0, 30.0, 22.0, 28.0, 15.0, 19.0, 5.0, 14.0, 14.0, 11.0, 6.0, 10.0, 3.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-54.0, -52.18017578125, -50.3603515625, -48.54052734375, -46.720703125, -44.90087890625, -43.0810546875, -41.26123046875, -39.44140625, -37.62158203125, -35.8017578125, -33.98193359375, -32.162109375, -30.34228515625, -28.5224609375, -26.70263671875, -24.8828125, -23.06298828125, -21.2431640625, -19.42333984375, -17.603515625, -15.78369140625, -13.9638671875, -12.14404296875, -10.32421875, -8.50439453125, -6.6845703125, -4.86474609375, -3.044921875, -1.22509765625, 0.5947265625, 2.41455078125, 4.234375, 6.05419921875, 7.8740234375, 9.69384765625, 11.513671875, 13.33349609375, 15.1533203125, 16.97314453125, 18.79296875, 20.61279296875, 22.4326171875, 24.25244140625, 26.072265625, 27.89208984375, 29.7119140625, 31.53173828125, 33.3515625, 35.17138671875, 36.9912109375, 38.81103515625, 40.630859375, 42.45068359375, 44.2705078125, 46.09033203125, 47.91015625, 49.72998046875, 51.5498046875, 53.36962890625, 55.189453125, 57.00927734375, 58.8291015625, 60.64892578125, 62.46875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 14.0, 35.0, 47.0, 81.0, 135.0, 224.0, 350.0, 651.0, 1031.0, 1714.0, 2573.0, 4155.0, 6501.0, 9964.0, 14671.0, 21252.0, 29661.0, 39735.0, 51688.0, 64677.0, 76011.0, 86322.0, 91937.0, 92887.0, 88995.0, 81114.0, 69824.0, 57813.0, 45097.0, 34303.0, 24710.0, 17287.0, 11783.0, 7862.0, 5058.0, 3211.0, 1988.0, 1245.0, 807.0, 464.0, 260.0, 179.0, 104.0, 51.0, 46.0, 23.0, 12.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.0, -32.875, -31.75, -30.625, -29.5, -28.375, -27.25, -26.125, -25.0, -23.875, -22.75, -21.625, -20.5, -19.375, -18.25, -17.125, -16.0, -14.875, -13.75, -12.625, -11.5, -10.375, -9.25, -8.125, -7.0, -5.875, -4.75, -3.625, -2.5, -1.375, -0.25, 0.875, 2.0, 3.125, 4.25, 5.375, 6.5, 7.625, 8.75, 9.875, 11.0, 12.125, 13.25, 14.375, 15.5, 16.625, 17.75, 18.875, 20.0, 21.125, 22.25, 23.375, 24.5, 25.625, 26.75, 27.875, 29.0, 30.125, 31.25, 32.375, 33.5, 34.625, 35.75, 36.875, 38.0]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 3.0, 6.0, 5.0, 5.0, 11.0, 7.0, 16.0, 17.0, 18.0, 18.0, 16.0, 21.0, 27.0, 24.0, 31.0, 34.0, 43.0, 34.0, 35.0, 46.0, 40.0, 41.0, 42.0, 52.0, 51.0, 41.0, 33.0, 29.0, 39.0, 33.0, 22.0, 28.0, 16.0, 19.0, 16.0, 10.0, 5.0, 6.0, 13.0, 10.0, 9.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.6875, -39.34912109375, -38.0107421875, -36.67236328125, -35.333984375, -33.99560546875, -32.6572265625, -31.31884765625, -29.98046875, -28.64208984375, -27.3037109375, -25.96533203125, -24.626953125, -23.28857421875, -21.9501953125, -20.61181640625, -19.2734375, -17.93505859375, -16.5966796875, -15.25830078125, -13.919921875, -12.58154296875, -11.2431640625, -9.90478515625, -8.56640625, -7.22802734375, -5.8896484375, -4.55126953125, -3.212890625, -1.87451171875, -0.5361328125, 0.80224609375, 2.140625, 3.47900390625, 4.8173828125, 6.15576171875, 7.494140625, 8.83251953125, 10.1708984375, 11.50927734375, 12.84765625, 14.18603515625, 15.5244140625, 16.86279296875, 18.201171875, 19.53955078125, 20.8779296875, 22.21630859375, 23.5546875, 24.89306640625, 26.2314453125, 27.56982421875, 28.908203125, 30.24658203125, 31.5849609375, 32.92333984375, 34.26171875, 35.60009765625, 36.9384765625, 38.27685546875, 39.615234375, 40.95361328125, 42.2919921875, 43.63037109375, 44.96875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 14.0, 28.0, 36.0, 67.0, 122.0, 181.0, 338.0, 597.0, 1064.0, 1823.0, 3356.0, 5640.0, 9884.0, 16485.0, 26135.0, 40032.0, 58425.0, 79126.0, 98928.0, 114498.0, 120140.0, 115759.0, 100933.0, 81593.0, 60842.0, 42756.0, 27630.0, 17240.0, 10482.0, 6113.0, 3592.0, 1952.0, 1201.0, 684.0, 362.0, 190.0, 126.0, 75.0, 42.0, 29.0, 16.0, 9.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.139404296875, -18.51318359375, -17.886962890625, -17.2607421875, -16.634521484375, -16.00830078125, -15.382080078125, -14.755859375, -14.129638671875, -13.50341796875, -12.877197265625, -12.2509765625, -11.624755859375, -10.99853515625, -10.372314453125, -9.74609375, -9.119873046875, -8.49365234375, -7.867431640625, -7.2412109375, -6.614990234375, -5.98876953125, -5.362548828125, -4.736328125, -4.110107421875, -3.48388671875, -2.857666015625, -2.2314453125, -1.605224609375, -0.97900390625, -0.352783203125, 0.2734375, 0.899658203125, 1.52587890625, 2.152099609375, 2.7783203125, 3.404541015625, 4.03076171875, 4.656982421875, 5.283203125, 5.909423828125, 6.53564453125, 7.161865234375, 7.7880859375, 8.414306640625, 9.04052734375, 9.666748046875, 10.29296875, 10.919189453125, 11.54541015625, 12.171630859375, 12.7978515625, 13.424072265625, 14.05029296875, 14.676513671875, 15.302734375, 15.928955078125, 16.55517578125, 17.181396484375, 17.8076171875, 18.433837890625, 19.06005859375, 19.686279296875, 20.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 11.0, 18.0, 11.0, 16.0, 23.0, 21.0, 29.0, 32.0, 34.0, 40.0, 40.0, 59.0, 43.0, 60.0, 52.0, 58.0, 45.0, 56.0, 54.0, 44.0, 46.0, 35.0, 28.0, 32.0, 23.0, 12.0, 23.0, 12.0, 14.0, 9.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023040771484375, -0.0022216439247131348, -0.0021392107009887695, -0.0020567774772644043, -0.001974344253540039, -0.0018919110298156738, -0.0018094778060913086, -0.0017270445823669434, -0.0016446113586425781, -0.0015621781349182129, -0.0014797449111938477, -0.0013973116874694824, -0.0013148784637451172, -0.001232445240020752, -0.0011500120162963867, -0.0010675787925720215, -0.0009851455688476562, -0.000902712345123291, -0.0008202791213989258, -0.0007378458976745605, -0.0006554126739501953, -0.0005729794502258301, -0.0004905462265014648, -0.0004081130027770996, -0.0003256797790527344, -0.00024324655532836914, -0.0001608133316040039, -7.838010787963867e-05, 4.0531158447265625e-06, 8.64863395690918e-05, 0.00016891956329345703, 0.00025135278701782227, 0.0003337860107421875, 0.00041621923446655273, 0.000498652458190918, 0.0005810856819152832, 0.0006635189056396484, 0.0007459521293640137, 0.0008283853530883789, 0.0009108185768127441, 0.0009932518005371094, 0.0010756850242614746, 0.0011581182479858398, 0.001240551471710205, 0.0013229846954345703, 0.0014054179191589355, 0.0014878511428833008, 0.001570284366607666, 0.0016527175903320312, 0.0017351508140563965, 0.0018175840377807617, 0.001900017261505127, 0.001982450485229492, 0.0020648837089538574, 0.0021473169326782227, 0.002229750156402588, 0.002312183380126953, 0.0023946166038513184, 0.0024770498275756836, 0.002559483051300049, 0.002641916275024414, 0.0027243494987487793, 0.0028067827224731445, 0.0028892159461975098, 0.002971649169921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 14.0, 12.0, 19.0, 35.0, 73.0, 106.0, 155.0, 297.0, 477.0, 818.0, 1395.0, 2105.0, 3429.0, 5541.0, 8760.0, 13368.0, 20435.0, 29650.0, 41667.0, 56821.0, 71856.0, 87974.0, 99269.0, 105014.0, 102913.0, 94723.0, 80537.0, 64981.0, 49087.0, 35965.0, 24985.0, 16607.0, 10980.0, 6953.0, 4341.0, 2754.0, 1695.0, 1091.0, 649.0, 425.0, 222.0, 144.0, 100.0, 43.0, 28.0, 14.0, 8.0, 8.0, 4.0, 3.0, 7.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.453125, -19.828857421875, -19.20458984375, -18.580322265625, -17.9560546875, -17.331787109375, -16.70751953125, -16.083251953125, -15.458984375, -14.834716796875, -14.21044921875, -13.586181640625, -12.9619140625, -12.337646484375, -11.71337890625, -11.089111328125, -10.46484375, -9.840576171875, -9.21630859375, -8.592041015625, -7.9677734375, -7.343505859375, -6.71923828125, -6.094970703125, -5.470703125, -4.846435546875, -4.22216796875, -3.597900390625, -2.9736328125, -2.349365234375, -1.72509765625, -1.100830078125, -0.4765625, 0.147705078125, 0.77197265625, 1.396240234375, 2.0205078125, 2.644775390625, 3.26904296875, 3.893310546875, 4.517578125, 5.141845703125, 5.76611328125, 6.390380859375, 7.0146484375, 7.638916015625, 8.26318359375, 8.887451171875, 9.51171875, 10.135986328125, 10.76025390625, 11.384521484375, 12.0087890625, 12.633056640625, 13.25732421875, 13.881591796875, 14.505859375, 15.130126953125, 15.75439453125, 16.378662109375, 17.0029296875, 17.627197265625, 18.25146484375, 18.875732421875, 19.5]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 7.0, 10.0, 12.0, 14.0, 10.0, 20.0, 23.0, 16.0, 21.0, 30.0, 29.0, 38.0, 36.0, 30.0, 32.0, 41.0, 59.0, 50.0, 62.0, 53.0, 44.0, 37.0, 38.0, 43.0, 51.0, 30.0, 30.0, 27.0, 11.0, 17.0, 15.0, 10.0, 6.0, 4.0, 8.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.0638427734375, -8.760498046875, -8.4571533203125, -8.15380859375, -7.8504638671875, -7.547119140625, -7.2437744140625, -6.9404296875, -6.6370849609375, -6.333740234375, -6.0303955078125, -5.72705078125, -5.4237060546875, -5.120361328125, -4.8170166015625, -4.513671875, -4.2103271484375, -3.906982421875, -3.6036376953125, -3.30029296875, -2.9969482421875, -2.693603515625, -2.3902587890625, -2.0869140625, -1.7835693359375, -1.480224609375, -1.1768798828125, -0.87353515625, -0.5701904296875, -0.266845703125, 0.0364990234375, 0.33984375, 0.6431884765625, 0.946533203125, 1.2498779296875, 1.55322265625, 1.8565673828125, 2.159912109375, 2.4632568359375, 2.7666015625, 3.0699462890625, 3.373291015625, 3.6766357421875, 3.97998046875, 4.2833251953125, 4.586669921875, 4.8900146484375, 5.193359375, 5.4967041015625, 5.800048828125, 6.1033935546875, 6.40673828125, 6.7100830078125, 7.013427734375, 7.3167724609375, 7.6201171875, 7.9234619140625, 8.226806640625, 8.5301513671875, 8.83349609375, 9.1368408203125, 9.440185546875, 9.7435302734375, 10.046875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 5.0, 8.0, 12.0, 5.0, 13.0, 9.0, 17.0, 15.0, 13.0, 15.0, 22.0, 22.0, 18.0, 36.0, 35.0, 32.0, 33.0, 43.0, 48.0, 41.0, 32.0, 40.0, 38.0, 40.0, 51.0, 34.0, 43.0, 29.0, 25.0, 24.0, 24.0, 25.0, 20.0, 17.0, 16.0, 11.0, 19.0, 7.0, 7.0, 10.0, 6.0, 7.0, 8.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.550498962402344, -51.78920364379883, -50.02790832519531, -48.26660919189453, -46.505313873291016, -44.7440185546875, -42.982723236083984, -41.22142791748047, -39.46012878417969, -37.69883346557617, -35.937538146972656, -34.176239013671875, -32.41494369506836, -30.653648376464844, -28.892353057861328, -27.13105583190918, -25.369760513305664, -23.60846519470215, -21.84716796875, -20.085872650146484, -18.324575424194336, -16.56328010559082, -14.801983833312988, -13.040687561035156, -11.279391288757324, -9.518095016479492, -7.75679874420166, -5.995502948760986, -4.234206676483154, -2.4729108810424805, -0.7116146087646484, 1.0496816635131836, 2.8109779357910156, 4.572274208068848, 6.33357048034668, 8.094865798950195, 9.856163024902344, 11.61745834350586, 13.378754615783691, 15.140050888061523, 16.901348114013672, 18.662643432617188, 20.423940658569336, 22.18523597717285, 23.946533203125, 25.707828521728516, 27.46912384033203, 29.23042106628418, 30.991716384887695, 32.753013610839844, 34.51430892944336, 36.275604248046875, 38.03689956665039, 39.798194885253906, 41.55949401855469, 43.3207893371582, 45.08208465576172, 46.843379974365234, 48.60467529296875, 50.36597442626953, 52.12726974487305, 53.88856506347656, 55.64986038208008, 57.411155700683594, 59.172454833984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 10.0, 7.0, 14.0, 16.0, 13.0, 17.0, 24.0, 16.0, 24.0, 25.0, 29.0, 26.0, 25.0, 29.0, 39.0, 33.0, 50.0, 42.0, 33.0, 35.0, 41.0, 56.0, 37.0, 36.0, 26.0, 34.0, 33.0, 17.0, 25.0, 31.0, 20.0, 24.0, 21.0, 20.0, 8.0, 11.0, 7.0, 6.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-64.747314453125, -62.61769104003906, -60.488067626953125, -58.35844421386719, -56.22882080078125, -54.09919738769531, -51.96957015991211, -49.83994674682617, -47.710323333740234, -45.5806999206543, -43.45107650756836, -41.32145309448242, -39.19182586669922, -37.06220245361328, -34.932579040527344, -32.802955627441406, -30.67333221435547, -28.54370880126953, -26.414085388183594, -24.284460067749023, -22.154836654663086, -20.02521324157715, -17.895587921142578, -15.76596450805664, -13.636341094970703, -11.506717681884766, -9.377093315124512, -7.247469425201416, -5.11784553527832, -2.988222122192383, -0.8585977554321289, 1.271026611328125, 3.4006423950195312, 5.530266284942627, 7.659890174865723, 9.789514541625977, 11.919137954711914, 14.048761367797852, 16.178386688232422, 18.30801010131836, 20.437633514404297, 22.567256927490234, 24.696880340576172, 26.826505661010742, 28.95612907409668, 31.085752487182617, 33.21537780761719, 35.345001220703125, 37.47462463378906, 39.604248046875, 41.73387145996094, 43.863494873046875, 45.99311828613281, 48.12274169921875, 50.25236892700195, 52.38199234008789, 54.51161575317383, 56.641239166259766, 58.7708625793457, 60.90048599243164, 63.030113220214844, 65.15973663330078, 67.28936004638672, 69.41898345947266, 71.5486068725586]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 11.0, 11.0, 26.0, 21.0, 47.0, 95.0, 179.0, 308.0, 493.0, 862.0, 1508.0, 2542.0, 4451.0, 7285.0, 11939.0, 19476.0, 31068.0, 48196.0, 73790.0, 108174.0, 153667.0, 208669.0, 270833.0, 331629.0, 381947.0, 410741.0, 413483.0, 386163.0, 340370.0, 279901.0, 217450.0, 161440.0, 113742.0, 77355.0, 51429.0, 32780.0, 20434.0, 12770.0, 7775.0, 4653.0, 2692.0, 1638.0, 961.0, 545.0, 299.0, 179.0, 128.0, 47.0, 35.0, 21.0, 12.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-43.53125, -42.08349609375, -40.6357421875, -39.18798828125, -37.740234375, -36.29248046875, -34.8447265625, -33.39697265625, -31.94921875, -30.50146484375, -29.0537109375, -27.60595703125, -26.158203125, -24.71044921875, -23.2626953125, -21.81494140625, -20.3671875, -18.91943359375, -17.4716796875, -16.02392578125, -14.576171875, -13.12841796875, -11.6806640625, -10.23291015625, -8.78515625, -7.33740234375, -5.8896484375, -4.44189453125, -2.994140625, -1.54638671875, -0.0986328125, 1.34912109375, 2.796875, 4.24462890625, 5.6923828125, 7.14013671875, 8.587890625, 10.03564453125, 11.4833984375, 12.93115234375, 14.37890625, 15.82666015625, 17.2744140625, 18.72216796875, 20.169921875, 21.61767578125, 23.0654296875, 24.51318359375, 25.9609375, 27.40869140625, 28.8564453125, 30.30419921875, 31.751953125, 33.19970703125, 34.6474609375, 36.09521484375, 37.54296875, 38.99072265625, 40.4384765625, 41.88623046875, 43.333984375, 44.78173828125, 46.2294921875, 47.67724609375, 49.125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 9.0, 6.0, 7.0, 16.0, 15.0, 17.0, 17.0, 22.0, 14.0, 25.0, 24.0, 28.0, 25.0, 25.0, 36.0, 36.0, 38.0, 43.0, 43.0, 29.0, 33.0, 46.0, 52.0, 45.0, 29.0, 25.0, 31.0, 32.0, 26.0, 24.0, 24.0, 24.0, 22.0, 24.0, 16.0, 14.0, 8.0, 7.0, 7.0, 6.0, 9.0, 2.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-58.53125, -56.60009765625, -54.6689453125, -52.73779296875, -50.806640625, -48.87548828125, -46.9443359375, -45.01318359375, -43.08203125, -41.15087890625, -39.2197265625, -37.28857421875, -35.357421875, -33.42626953125, -31.4951171875, -29.56396484375, -27.6328125, -25.70166015625, -23.7705078125, -21.83935546875, -19.908203125, -17.97705078125, -16.0458984375, -14.11474609375, -12.18359375, -10.25244140625, -8.3212890625, -6.39013671875, -4.458984375, -2.52783203125, -0.5966796875, 1.33447265625, 3.265625, 5.19677734375, 7.1279296875, 9.05908203125, 10.990234375, 12.92138671875, 14.8525390625, 16.78369140625, 18.71484375, 20.64599609375, 22.5771484375, 24.50830078125, 26.439453125, 28.37060546875, 30.3017578125, 32.23291015625, 34.1640625, 36.09521484375, 38.0263671875, 39.95751953125, 41.888671875, 43.81982421875, 45.7509765625, 47.68212890625, 49.61328125, 51.54443359375, 53.4755859375, 55.40673828125, 57.337890625, 59.26904296875, 61.2001953125, 63.13134765625, 65.0625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 11.0, 20.0, 41.0, 74.0, 143.0, 225.0, 396.0, 651.0, 1145.0, 1898.0, 3292.0, 5403.0, 8824.0, 13956.0, 22272.0, 34693.0, 51958.0, 76222.0, 107770.0, 147345.0, 193712.0, 245097.0, 294054.0, 336604.0, 365759.0, 376040.0, 364859.0, 336058.0, 293649.0, 244975.0, 193072.0, 147245.0, 106742.0, 75223.0, 51907.0, 34520.0, 22245.0, 14099.0, 8765.0, 5353.0, 3286.0, 1920.0, 1157.0, 656.0, 385.0, 230.0, 132.0, 84.0, 47.0, 32.0, 19.0, 14.0, 3.0, 1.0, 3.0], "bins": [-48.84375, -47.427734375, -46.01171875, -44.595703125, -43.1796875, -41.763671875, -40.34765625, -38.931640625, -37.515625, -36.099609375, -34.68359375, -33.267578125, -31.8515625, -30.435546875, -29.01953125, -27.603515625, -26.1875, -24.771484375, -23.35546875, -21.939453125, -20.5234375, -19.107421875, -17.69140625, -16.275390625, -14.859375, -13.443359375, -12.02734375, -10.611328125, -9.1953125, -7.779296875, -6.36328125, -4.947265625, -3.53125, -2.115234375, -0.69921875, 0.716796875, 2.1328125, 3.548828125, 4.96484375, 6.380859375, 7.796875, 9.212890625, 10.62890625, 12.044921875, 13.4609375, 14.876953125, 16.29296875, 17.708984375, 19.125, 20.541015625, 21.95703125, 23.373046875, 24.7890625, 26.205078125, 27.62109375, 29.037109375, 30.453125, 31.869140625, 33.28515625, 34.701171875, 36.1171875, 37.533203125, 38.94921875, 40.365234375, 41.78125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 3.0, 2.0, 5.0, 10.0, 5.0, 16.0, 9.0, 15.0, 17.0, 30.0, 29.0, 32.0, 39.0, 55.0, 64.0, 80.0, 84.0, 119.0, 117.0, 126.0, 130.0, 157.0, 158.0, 178.0, 170.0, 199.0, 200.0, 178.0, 153.0, 178.0, 159.0, 184.0, 145.0, 153.0, 114.0, 130.0, 98.0, 73.0, 69.0, 76.0, 65.0, 43.0, 42.0, 32.0, 29.0, 34.0, 24.0, 21.0, 9.0, 4.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.96875, -24.1494140625, -23.330078125, -22.5107421875, -21.69140625, -20.8720703125, -20.052734375, -19.2333984375, -18.4140625, -17.5947265625, -16.775390625, -15.9560546875, -15.13671875, -14.3173828125, -13.498046875, -12.6787109375, -11.859375, -11.0400390625, -10.220703125, -9.4013671875, -8.58203125, -7.7626953125, -6.943359375, -6.1240234375, -5.3046875, -4.4853515625, -3.666015625, -2.8466796875, -2.02734375, -1.2080078125, -0.388671875, 0.4306640625, 1.25, 2.0693359375, 2.888671875, 3.7080078125, 4.52734375, 5.3466796875, 6.166015625, 6.9853515625, 7.8046875, 8.6240234375, 9.443359375, 10.2626953125, 11.08203125, 11.9013671875, 12.720703125, 13.5400390625, 14.359375, 15.1787109375, 15.998046875, 16.8173828125, 17.63671875, 18.4560546875, 19.275390625, 20.0947265625, 20.9140625, 21.7333984375, 22.552734375, 23.3720703125, 24.19140625, 25.0107421875, 25.830078125, 26.6494140625, 27.46875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 11.0, 9.0, 11.0, 18.0, 18.0, 20.0, 16.0, 21.0, 20.0, 28.0, 27.0, 36.0, 38.0, 41.0, 44.0, 54.0, 63.0, 44.0, 42.0, 44.0, 58.0, 33.0, 40.0, 28.0, 27.0, 31.0, 30.0, 22.0, 19.0, 22.0, 14.0, 9.0, 8.0, 7.0, 6.0, 8.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-78.44146728515625, -76.33866882324219, -74.23587036132812, -72.1330795288086, -70.03028106689453, -67.92748260498047, -65.8246841430664, -63.721885681152344, -61.61909103393555, -59.516292572021484, -57.41349792480469, -55.310699462890625, -53.20790100097656, -51.105106353759766, -49.0023078918457, -46.899513244628906, -44.796714782714844, -42.69391632080078, -40.591121673583984, -38.48832321166992, -36.385528564453125, -34.28273010253906, -32.179931640625, -30.07713508605957, -27.97433853149414, -25.87154197692871, -23.76874542236328, -21.66594696044922, -19.56315040588379, -17.46035385131836, -15.357556343078613, -13.254758834838867, -11.151966094970703, -9.049169540405273, -6.946372032165527, -4.8435750007629395, -2.7407779693603516, -0.6379814147949219, 1.4648160934448242, 3.5676136016845703, 5.67041015625, 7.773207187652588, 9.876004219055176, 11.978801727294922, 14.081598281860352, 16.18439483642578, 18.287193298339844, 20.389989852905273, 22.492786407470703, 24.595582962036133, 26.698379516601562, 28.801177978515625, 30.903974533081055, 33.006771087646484, 35.10956954956055, 37.212364196777344, 39.315162658691406, 41.41796112060547, 43.520755767822266, 45.62355422973633, 47.726348876953125, 49.82914733886719, 51.93194580078125, 54.03474426269531, 56.13753890991211]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 10.0, 8.0, 7.0, 5.0, 13.0, 17.0, 19.0, 16.0, 23.0, 20.0, 32.0, 30.0, 25.0, 41.0, 32.0, 23.0, 48.0, 42.0, 43.0, 44.0, 44.0, 43.0, 47.0, 52.0, 44.0, 34.0, 20.0, 28.0, 40.0, 25.0, 22.0, 19.0, 18.0, 13.0, 13.0, 3.0, 17.0, 4.0, 2.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.32952117919922, -70.92608642578125, -68.52265167236328, -66.11920928955078, -63.71577453613281, -61.312339782714844, -58.908905029296875, -56.505470275878906, -54.10203170776367, -51.6985969543457, -49.29515838623047, -46.8917236328125, -44.48828887939453, -42.0848503112793, -39.68141555786133, -37.277976989746094, -34.874542236328125, -32.471107482910156, -30.067668914794922, -27.664234161376953, -25.26079750061035, -22.85736083984375, -20.45392608642578, -18.05048942565918, -15.647052764892578, -13.243616104125977, -10.840180397033691, -8.436744689941406, -6.033308029174805, -3.629871368408203, -1.226435661315918, 1.1770000457763672, 3.5804367065429688, 5.983872890472412, 8.387309074401855, 10.79074478149414, 13.194181442260742, 15.597618103027344, 18.001052856445312, 20.404489517211914, 22.807926177978516, 25.211362838745117, 27.61479949951172, 30.018234252929688, 32.421669006347656, 34.82510757446289, 37.22854232788086, 39.631980895996094, 42.03541564941406, 44.43885040283203, 46.842288970947266, 49.245723724365234, 51.64916229248047, 54.05259704589844, 56.456031799316406, 58.859466552734375, 61.26290512084961, 63.66633987426758, 66.06977844238281, 68.47321319580078, 70.87664794921875, 73.28009033203125, 75.68352508544922, 78.08695983886719, 80.49039459228516]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 14.0, 9.0, 36.0, 39.0, 70.0, 94.0, 150.0, 238.0, 393.0, 568.0, 933.0, 1389.0, 2162.0, 3399.0, 5161.0, 7729.0, 11879.0, 17476.0, 25554.0, 36840.0, 50749.0, 66423.0, 84545.0, 99853.0, 108293.0, 108470.0, 99757.0, 85001.0, 66995.0, 50568.0, 36464.0, 25627.0, 17374.0, 11874.0, 7808.0, 4899.0, 3364.0, 2227.0, 1462.0, 918.0, 592.0, 364.0, 254.0, 183.0, 114.0, 83.0, 51.0, 32.0, 19.0, 20.0, 12.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-8.390625, -8.12841796875, -7.8662109375, -7.60400390625, -7.341796875, -7.07958984375, -6.8173828125, -6.55517578125, -6.29296875, -6.03076171875, -5.7685546875, -5.50634765625, -5.244140625, -4.98193359375, -4.7197265625, -4.45751953125, -4.1953125, -3.93310546875, -3.6708984375, -3.40869140625, -3.146484375, -2.88427734375, -2.6220703125, -2.35986328125, -2.09765625, -1.83544921875, -1.5732421875, -1.31103515625, -1.048828125, -0.78662109375, -0.5244140625, -0.26220703125, 0.0, 0.26220703125, 0.5244140625, 0.78662109375, 1.048828125, 1.31103515625, 1.5732421875, 1.83544921875, 2.09765625, 2.35986328125, 2.6220703125, 2.88427734375, 3.146484375, 3.40869140625, 3.6708984375, 3.93310546875, 4.1953125, 4.45751953125, 4.7197265625, 4.98193359375, 5.244140625, 5.50634765625, 5.7685546875, 6.03076171875, 6.29296875, 6.55517578125, 6.8173828125, 7.07958984375, 7.341796875, 7.60400390625, 7.8662109375, 8.12841796875, 8.390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 8.0, 8.0, 4.0, 13.0, 19.0, 16.0, 17.0, 22.0, 22.0, 30.0, 30.0, 26.0, 41.0, 32.0, 24.0, 48.0, 40.0, 44.0, 46.0, 43.0, 43.0, 47.0, 49.0, 44.0, 35.0, 22.0, 28.0, 37.0, 28.0, 22.0, 19.0, 18.0, 12.0, 13.0, 5.0, 15.0, 4.0, 3.0, 3.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.8125, -71.40234375, -68.9921875, -66.58203125, -64.171875, -61.76171875, -59.3515625, -56.94140625, -54.53125, -52.12109375, -49.7109375, -47.30078125, -44.890625, -42.48046875, -40.0703125, -37.66015625, -35.25, -32.83984375, -30.4296875, -28.01953125, -25.609375, -23.19921875, -20.7890625, -18.37890625, -15.96875, -13.55859375, -11.1484375, -8.73828125, -6.328125, -3.91796875, -1.5078125, 0.90234375, 3.3125, 5.72265625, 8.1328125, 10.54296875, 12.953125, 15.36328125, 17.7734375, 20.18359375, 22.59375, 25.00390625, 27.4140625, 29.82421875, 32.234375, 34.64453125, 37.0546875, 39.46484375, 41.875, 44.28515625, 46.6953125, 49.10546875, 51.515625, 53.92578125, 56.3359375, 58.74609375, 61.15625, 63.56640625, 65.9765625, 68.38671875, 70.796875, 73.20703125, 75.6171875, 78.02734375, 80.4375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 6.0, 10.0, 5.0, 13.0, 17.0, 26.0, 37.0, 57.0, 82.0, 107.0, 171.0, 242.0, 349.0, 471.0, 650.0, 914.0, 1176.0, 1710.0, 2388.0, 3183.0, 4382.0, 6026.0, 8449.0, 11836.0, 17691.0, 30591.0, 203153.0, 623330.0, 58073.0, 22302.0, 14720.0, 10020.0, 7175.0, 5236.0, 3814.0, 2829.0, 2006.0, 1484.0, 1107.0, 779.0, 495.0, 429.0, 315.0, 218.0, 133.0, 95.0, 83.0, 48.0, 45.0, 25.0, 14.0, 17.0, 9.0, 10.0, 1.0, 3.0, 3.0, 3.0], "bins": [-16.109375, -15.625, -15.140625, -14.65625, -14.171875, -13.6875, -13.203125, -12.71875, -12.234375, -11.75, -11.265625, -10.78125, -10.296875, -9.8125, -9.328125, -8.84375, -8.359375, -7.875, -7.390625, -6.90625, -6.421875, -5.9375, -5.453125, -4.96875, -4.484375, -4.0, -3.515625, -3.03125, -2.546875, -2.0625, -1.578125, -1.09375, -0.609375, -0.125, 0.359375, 0.84375, 1.328125, 1.8125, 2.296875, 2.78125, 3.265625, 3.75, 4.234375, 4.71875, 5.203125, 5.6875, 6.171875, 6.65625, 7.140625, 7.625, 8.109375, 8.59375, 9.078125, 9.5625, 10.046875, 10.53125, 11.015625, 11.5, 11.984375, 12.46875, 12.953125, 13.4375, 13.921875, 14.40625, 14.890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 12.0, 14.0, 14.0, 19.0, 22.0, 23.0, 20.0, 28.0, 26.0, 32.0, 28.0, 34.0, 43.0, 50.0, 58.0, 47.0, 44.0, 39.0, 52.0, 42.0, 37.0, 45.0, 47.0, 25.0, 29.0, 25.0, 21.0, 18.0, 26.0, 12.0, 16.0, 13.0, 14.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.59375, -49.8564453125, -48.119140625, -46.3818359375, -44.64453125, -42.9072265625, -41.169921875, -39.4326171875, -37.6953125, -35.9580078125, -34.220703125, -32.4833984375, -30.74609375, -29.0087890625, -27.271484375, -25.5341796875, -23.796875, -22.0595703125, -20.322265625, -18.5849609375, -16.84765625, -15.1103515625, -13.373046875, -11.6357421875, -9.8984375, -8.1611328125, -6.423828125, -4.6865234375, -2.94921875, -1.2119140625, 0.525390625, 2.2626953125, 4.0, 5.7373046875, 7.474609375, 9.2119140625, 10.94921875, 12.6865234375, 14.423828125, 16.1611328125, 17.8984375, 19.6357421875, 21.373046875, 23.1103515625, 24.84765625, 26.5849609375, 28.322265625, 30.0595703125, 31.796875, 33.5341796875, 35.271484375, 37.0087890625, 38.74609375, 40.4833984375, 42.220703125, 43.9580078125, 45.6953125, 47.4326171875, 49.169921875, 50.9072265625, 52.64453125, 54.3818359375, 56.119140625, 57.8564453125, 59.59375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 11.0, 11.0, 14.0, 17.0, 31.0, 41.0, 47.0, 78.0, 112.0, 135.0, 235.0, 279.0, 433.0, 627.0, 940.0, 1388.0, 2029.0, 3041.0, 4434.0, 6742.0, 10233.0, 15530.0, 24688.0, 81162.0, 790983.0, 42207.0, 21684.0, 13920.0, 9153.0, 6018.0, 4014.0, 2647.0, 1783.0, 1221.0, 825.0, 529.0, 402.0, 268.0, 166.0, 138.0, 102.0, 57.0, 56.0, 33.0, 33.0, 11.0, 8.0, 11.0, 7.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.140625, -2.074493408203125, -2.00836181640625, -1.942230224609375, -1.8760986328125, -1.809967041015625, -1.74383544921875, -1.677703857421875, -1.611572265625, -1.545440673828125, -1.47930908203125, -1.413177490234375, -1.3470458984375, -1.280914306640625, -1.21478271484375, -1.148651123046875, -1.08251953125, -1.016387939453125, -0.95025634765625, -0.884124755859375, -0.8179931640625, -0.751861572265625, -0.68572998046875, -0.619598388671875, -0.553466796875, -0.487335205078125, -0.42120361328125, -0.355072021484375, -0.2889404296875, -0.222808837890625, -0.15667724609375, -0.090545654296875, -0.0244140625, 0.041717529296875, 0.10784912109375, 0.173980712890625, 0.2401123046875, 0.306243896484375, 0.37237548828125, 0.438507080078125, 0.504638671875, 0.570770263671875, 0.63690185546875, 0.703033447265625, 0.7691650390625, 0.835296630859375, 0.90142822265625, 0.967559814453125, 1.03369140625, 1.099822998046875, 1.16595458984375, 1.232086181640625, 1.2982177734375, 1.364349365234375, 1.43048095703125, 1.496612548828125, 1.562744140625, 1.628875732421875, 1.69500732421875, 1.761138916015625, 1.8272705078125, 1.893402099609375, 1.95953369140625, 2.025665283203125, 2.091796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 4.0, 4.0, 10.0, 19.0, 14.0, 20.0, 14.0, 21.0, 28.0, 17.0, 35.0, 31.0, 38.0, 33.0, 51.0, 56.0, 35.0, 40.0, 49.0, 41.0, 54.0, 46.0, 36.0, 35.0, 39.0, 40.0, 31.0, 22.0, 21.0, 17.0, 16.0, 17.0, 10.0, 11.0, 3.0, 9.0, 1.0, 8.0, 4.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 1.0], "bins": [-7.224082946777344e-05, -7.024593651294708e-05, -6.825104355812073e-05, -6.625615060329437e-05, -6.426125764846802e-05, -6.226636469364166e-05, -6.027147173881531e-05, -5.827657878398895e-05, -5.62816858291626e-05, -5.428679287433624e-05, -5.229189991950989e-05, -5.029700696468353e-05, -4.830211400985718e-05, -4.630722105503082e-05, -4.431232810020447e-05, -4.231743514537811e-05, -4.032254219055176e-05, -3.83276492357254e-05, -3.633275628089905e-05, -3.433786332607269e-05, -3.234297037124634e-05, -3.0348077416419983e-05, -2.8353184461593628e-05, -2.6358291506767273e-05, -2.4363398551940918e-05, -2.2368505597114563e-05, -2.0373612642288208e-05, -1.8378719687461853e-05, -1.6383826732635498e-05, -1.4388933777809143e-05, -1.2394040822982788e-05, -1.0399147868156433e-05, -8.404254913330078e-06, -6.409361958503723e-06, -4.414469003677368e-06, -2.419576048851013e-06, -4.246830940246582e-07, 1.5702098608016968e-06, 3.5651028156280518e-06, 5.559995770454407e-06, 7.554888725280762e-06, 9.549781680107117e-06, 1.1544674634933472e-05, 1.3539567589759827e-05, 1.553446054458618e-05, 1.7529353499412537e-05, 1.952424645423889e-05, 2.1519139409065247e-05, 2.35140323638916e-05, 2.5508925318717957e-05, 2.750381827354431e-05, 2.9498711228370667e-05, 3.149360418319702e-05, 3.3488497138023376e-05, 3.548339009284973e-05, 3.7478283047676086e-05, 3.947317600250244e-05, 4.1468068957328796e-05, 4.346296191215515e-05, 4.5457854866981506e-05, 4.745274782180786e-05, 4.9447640776634216e-05, 5.144253373146057e-05, 5.3437426686286926e-05, 5.543231964111328e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 11.0, 12.0, 18.0, 48.0, 45.0, 83.0, 118.0, 161.0, 238.0, 373.0, 526.0, 755.0, 1140.0, 1624.0, 2391.0, 3278.0, 4897.0, 6848.0, 9652.0, 14233.0, 19534.0, 27555.0, 38876.0, 52906.0, 70803.0, 91497.0, 110773.0, 119125.0, 112220.0, 93968.0, 73139.0, 54603.0, 40099.0, 28479.0, 20639.0, 14438.0, 10174.0, 7190.0, 4893.0, 3426.0, 2365.0, 1687.0, 1142.0, 809.0, 569.0, 411.0, 257.0, 198.0, 117.0, 91.0, 45.0, 40.0, 13.0, 19.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.6806640625, -1.6256561279296875, -1.570648193359375, -1.5156402587890625, -1.46063232421875, -1.4056243896484375, -1.350616455078125, -1.2956085205078125, -1.2406005859375, -1.1855926513671875, -1.130584716796875, -1.0755767822265625, -1.02056884765625, -0.9655609130859375, -0.910552978515625, -0.8555450439453125, -0.800537109375, -0.7455291748046875, -0.690521240234375, -0.6355133056640625, -0.58050537109375, -0.5254974365234375, -0.470489501953125, -0.4154815673828125, -0.3604736328125, -0.3054656982421875, -0.250457763671875, -0.1954498291015625, -0.14044189453125, -0.0854339599609375, -0.030426025390625, 0.0245819091796875, 0.07958984375, 0.1345977783203125, 0.189605712890625, 0.2446136474609375, 0.29962158203125, 0.3546295166015625, 0.409637451171875, 0.4646453857421875, 0.5196533203125, 0.5746612548828125, 0.629669189453125, 0.6846771240234375, 0.73968505859375, 0.7946929931640625, 0.849700927734375, 0.9047088623046875, 0.959716796875, 1.0147247314453125, 1.069732666015625, 1.1247406005859375, 1.17974853515625, 1.2347564697265625, 1.289764404296875, 1.3447723388671875, 1.3997802734375, 1.4547882080078125, 1.509796142578125, 1.5648040771484375, 1.61981201171875, 1.6748199462890625, 1.729827880859375, 1.7848358154296875, 1.83984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 6.0, 6.0, 10.0, 3.0, 12.0, 16.0, 10.0, 23.0, 30.0, 27.0, 40.0, 55.0, 32.0, 48.0, 60.0, 89.0, 89.0, 72.0, 46.0, 45.0, 38.0, 40.0, 33.0, 30.0, 24.0, 30.0, 18.0, 11.0, 9.0, 13.0, 5.0, 2.0, 4.0, 5.0, 1.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1591796875, -1.1164093017578125, -1.073638916015625, -1.0308685302734375, -0.98809814453125, -0.9453277587890625, -0.902557373046875, -0.8597869873046875, -0.8170166015625, -0.7742462158203125, -0.731475830078125, -0.6887054443359375, -0.64593505859375, -0.6031646728515625, -0.560394287109375, -0.5176239013671875, -0.474853515625, -0.4320831298828125, -0.389312744140625, -0.3465423583984375, -0.30377197265625, -0.2610015869140625, -0.218231201171875, -0.1754608154296875, -0.1326904296875, -0.0899200439453125, -0.047149658203125, -0.0043792724609375, 0.03839111328125, 0.0811614990234375, 0.123931884765625, 0.1667022705078125, 0.20947265625, 0.2522430419921875, 0.295013427734375, 0.3377838134765625, 0.38055419921875, 0.4233245849609375, 0.466094970703125, 0.5088653564453125, 0.5516357421875, 0.5944061279296875, 0.637176513671875, 0.6799468994140625, 0.72271728515625, 0.7654876708984375, 0.808258056640625, 0.8510284423828125, 0.893798828125, 0.9365692138671875, 0.979339599609375, 1.0221099853515625, 1.06488037109375, 1.1076507568359375, 1.150421142578125, 1.1931915283203125, 1.2359619140625, 1.2787322998046875, 1.321502685546875, 1.3642730712890625, 1.40704345703125, 1.4498138427734375, 1.492584228515625, 1.5353546142578125, 1.578125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 9.0, 12.0, 11.0, 23.0, 17.0, 17.0, 21.0, 19.0, 24.0, 21.0, 34.0, 39.0, 36.0, 43.0, 46.0, 56.0, 55.0, 49.0, 38.0, 50.0, 51.0, 37.0, 37.0, 30.0, 35.0, 25.0, 23.0, 25.0, 22.0, 14.0, 12.0, 11.0, 10.0, 3.0, 6.0, 11.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-79.88013458251953, -77.76766967773438, -75.65519714355469, -73.54273223876953, -71.43026733398438, -69.31780242919922, -67.20533752441406, -65.09286499023438, -62.98040008544922, -60.86793518066406, -58.75546646118164, -56.64299774169922, -54.53053283691406, -52.418067932128906, -50.305599212646484, -48.19313049316406, -46.080665588378906, -43.96820068359375, -41.85573196411133, -39.743263244628906, -37.63079833984375, -35.518333435058594, -33.40586471557617, -31.293397903442383, -29.180931091308594, -27.068464279174805, -24.955997467041016, -22.843530654907227, -20.731063842773438, -18.61859703063965, -16.50613021850586, -14.39366340637207, -12.281192779541016, -10.168725967407227, -8.056259155273438, -5.943792343139648, -3.8313255310058594, -1.7188587188720703, 0.39360809326171875, 2.506074905395508, 4.618541717529297, 6.731008529663086, 8.843475341796875, 10.955942153930664, 13.068408966064453, 15.180875778198242, 17.29334259033203, 19.40580940246582, 21.51827621459961, 23.6307430267334, 25.743209838867188, 27.855676651000977, 29.968143463134766, 32.08061218261719, 34.193077087402344, 36.3055419921875, 38.41801071166992, 40.530479431152344, 42.6429443359375, 44.755409240722656, 46.86787796020508, 48.9803466796875, 51.092811584472656, 53.20527648925781, 55.317745208740234]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 12.0, 7.0, 5.0, 6.0, 12.0, 20.0, 16.0, 16.0, 27.0, 20.0, 36.0, 25.0, 24.0, 42.0, 29.0, 27.0, 45.0, 46.0, 40.0, 49.0, 40.0, 42.0, 48.0, 54.0, 42.0, 32.0, 24.0, 26.0, 37.0, 27.0, 22.0, 17.0, 21.0, 12.0, 11.0, 5.0, 15.0, 4.0, 2.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.3089828491211, -70.90727996826172, -68.50557708740234, -66.10387420654297, -63.70217514038086, -61.300472259521484, -58.89876937866211, -56.4970703125, -54.095367431640625, -51.69366455078125, -49.291961669921875, -46.8902587890625, -44.48855972290039, -42.086856842041016, -39.68515396118164, -37.28345489501953, -34.88174819946289, -32.480045318603516, -30.078344345092773, -27.6766414642334, -25.274940490722656, -22.87323760986328, -20.471534729003906, -18.069833755493164, -15.668130874633789, -13.26642894744873, -10.864727020263672, -8.463024139404297, -6.061322212219238, -3.6596202850341797, -1.2579174041748047, 1.1437835693359375, 3.5454864501953125, 5.947188377380371, 8.34889030456543, 10.750593185424805, 13.152295112609863, 15.553997039794922, 17.955699920654297, 20.35740089416504, 22.759103775024414, 25.16080665588379, 27.56250762939453, 29.964210510253906, 32.36591339111328, 34.767616271972656, 37.16931915283203, 39.57101821899414, 41.972721099853516, 44.37442398071289, 46.776126861572266, 49.177825927734375, 51.57952880859375, 53.981231689453125, 56.3829345703125, 58.784637451171875, 61.18634033203125, 63.588043212890625, 65.98974609375, 68.39144897460938, 70.79315185546875, 73.19485473632812, 75.5965576171875, 77.99825286865234, 80.39995574951172]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 9.0, 11.0, 9.0, 24.0, 55.0, 68.0, 115.0, 183.0, 337.0, 571.0, 952.0, 1479.0, 2392.0, 3854.0, 5967.0, 9128.0, 13696.0, 19649.0, 27743.0, 37418.0, 48445.0, 60860.0, 72988.0, 82096.0, 89519.0, 92336.0, 89942.0, 82454.0, 72746.0, 61235.0, 48627.0, 37195.0, 27898.0, 19510.0, 13666.0, 9235.0, 5798.0, 3930.0, 2392.0, 1568.0, 965.0, 625.0, 345.0, 220.0, 127.0, 67.0, 52.0, 26.0, 14.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-38.71875, -37.48974609375, -36.2607421875, -35.03173828125, -33.802734375, -32.57373046875, -31.3447265625, -30.11572265625, -28.88671875, -27.65771484375, -26.4287109375, -25.19970703125, -23.970703125, -22.74169921875, -21.5126953125, -20.28369140625, -19.0546875, -17.82568359375, -16.5966796875, -15.36767578125, -14.138671875, -12.90966796875, -11.6806640625, -10.45166015625, -9.22265625, -7.99365234375, -6.7646484375, -5.53564453125, -4.306640625, -3.07763671875, -1.8486328125, -0.61962890625, 0.609375, 1.83837890625, 3.0673828125, 4.29638671875, 5.525390625, 6.75439453125, 7.9833984375, 9.21240234375, 10.44140625, 11.67041015625, 12.8994140625, 14.12841796875, 15.357421875, 16.58642578125, 17.8154296875, 19.04443359375, 20.2734375, 21.50244140625, 22.7314453125, 23.96044921875, 25.189453125, 26.41845703125, 27.6474609375, 28.87646484375, 30.10546875, 31.33447265625, 32.5634765625, 33.79248046875, 35.021484375, 36.25048828125, 37.4794921875, 38.70849609375, 39.9375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 7.0, 6.0, 9.0, 9.0, 18.0, 19.0, 18.0, 23.0, 21.0, 33.0, 25.0, 27.0, 40.0, 31.0, 28.0, 43.0, 45.0, 39.0, 52.0, 40.0, 46.0, 45.0, 53.0, 45.0, 29.0, 23.0, 26.0, 36.0, 30.0, 21.0, 19.0, 18.0, 12.0, 11.0, 6.0, 14.0, 5.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.1875, -68.8564453125, -66.525390625, -64.1943359375, -61.86328125, -59.5322265625, -57.201171875, -54.8701171875, -52.5390625, -50.2080078125, -47.876953125, -45.5458984375, -43.21484375, -40.8837890625, -38.552734375, -36.2216796875, -33.890625, -31.5595703125, -29.228515625, -26.8974609375, -24.56640625, -22.2353515625, -19.904296875, -17.5732421875, -15.2421875, -12.9111328125, -10.580078125, -8.2490234375, -5.91796875, -3.5869140625, -1.255859375, 1.0751953125, 3.40625, 5.7373046875, 8.068359375, 10.3994140625, 12.73046875, 15.0615234375, 17.392578125, 19.7236328125, 22.0546875, 24.3857421875, 26.716796875, 29.0478515625, 31.37890625, 33.7099609375, 36.041015625, 38.3720703125, 40.703125, 43.0341796875, 45.365234375, 47.6962890625, 50.02734375, 52.3583984375, 54.689453125, 57.0205078125, 59.3515625, 61.6826171875, 64.013671875, 66.3447265625, 68.67578125, 71.0068359375, 73.337890625, 75.6689453125, 78.0]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 14.0, 15.0, 41.0, 67.0, 91.0, 154.0, 276.0, 423.0, 748.0, 1147.0, 1781.0, 2779.0, 4241.0, 6414.0, 9390.0, 13677.0, 19098.0, 26237.0, 34481.0, 44099.0, 54667.0, 64576.0, 73652.0, 80603.0, 83704.0, 84224.0, 81180.0, 74144.0, 65097.0, 54839.0, 44215.0, 35244.0, 26326.0, 19321.0, 13565.0, 9597.0, 6449.0, 4356.0, 2801.0, 1846.0, 1186.0, 718.0, 436.0, 261.0, 160.0, 88.0, 62.0, 26.0, 27.0, 11.0, 2.0, 7.0, 0.0, 2.0, 1.0], "bins": [-37.96875, -36.8525390625, -35.736328125, -34.6201171875, -33.50390625, -32.3876953125, -31.271484375, -30.1552734375, -29.0390625, -27.9228515625, -26.806640625, -25.6904296875, -24.57421875, -23.4580078125, -22.341796875, -21.2255859375, -20.109375, -18.9931640625, -17.876953125, -16.7607421875, -15.64453125, -14.5283203125, -13.412109375, -12.2958984375, -11.1796875, -10.0634765625, -8.947265625, -7.8310546875, -6.71484375, -5.5986328125, -4.482421875, -3.3662109375, -2.25, -1.1337890625, -0.017578125, 1.0986328125, 2.21484375, 3.3310546875, 4.447265625, 5.5634765625, 6.6796875, 7.7958984375, 8.912109375, 10.0283203125, 11.14453125, 12.2607421875, 13.376953125, 14.4931640625, 15.609375, 16.7255859375, 17.841796875, 18.9580078125, 20.07421875, 21.1904296875, 22.306640625, 23.4228515625, 24.5390625, 25.6552734375, 26.771484375, 27.8876953125, 29.00390625, 30.1201171875, 31.236328125, 32.3525390625, 33.46875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 16.0, 9.0, 8.0, 22.0, 16.0, 17.0, 29.0, 27.0, 28.0, 26.0, 29.0, 31.0, 37.0, 57.0, 41.0, 42.0, 47.0, 50.0, 44.0, 39.0, 53.0, 34.0, 37.0, 31.0, 37.0, 21.0, 33.0, 23.0, 22.0, 13.0, 18.0, 17.0, 7.0, 11.0, 6.0, 7.0, 2.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5, -50.814453125, -49.12890625, -47.443359375, -45.7578125, -44.072265625, -42.38671875, -40.701171875, -39.015625, -37.330078125, -35.64453125, -33.958984375, -32.2734375, -30.587890625, -28.90234375, -27.216796875, -25.53125, -23.845703125, -22.16015625, -20.474609375, -18.7890625, -17.103515625, -15.41796875, -13.732421875, -12.046875, -10.361328125, -8.67578125, -6.990234375, -5.3046875, -3.619140625, -1.93359375, -0.248046875, 1.4375, 3.123046875, 4.80859375, 6.494140625, 8.1796875, 9.865234375, 11.55078125, 13.236328125, 14.921875, 16.607421875, 18.29296875, 19.978515625, 21.6640625, 23.349609375, 25.03515625, 26.720703125, 28.40625, 30.091796875, 31.77734375, 33.462890625, 35.1484375, 36.833984375, 38.51953125, 40.205078125, 41.890625, 43.576171875, 45.26171875, 46.947265625, 48.6328125, 50.318359375, 52.00390625, 53.689453125, 55.375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 6.0, 11.0, 14.0, 23.0, 51.0, 56.0, 82.0, 123.0, 188.0, 318.0, 449.0, 643.0, 969.0, 1493.0, 2151.0, 3158.0, 4590.0, 6668.0, 9513.0, 13259.0, 18157.0, 24046.0, 32623.0, 41651.0, 51072.0, 61334.0, 70438.0, 77668.0, 82003.0, 82957.0, 80404.0, 74972.0, 66021.0, 56546.0, 46274.0, 36882.0, 28336.0, 21183.0, 15552.0, 11294.0, 8034.0, 5517.0, 3831.0, 2558.0, 1781.0, 1224.0, 792.0, 535.0, 379.0, 249.0, 160.0, 132.0, 70.0, 45.0, 33.0, 19.0, 12.0, 9.0, 3.0, 0.0, 4.0], "bins": [-16.6875, -16.170166015625, -15.65283203125, -15.135498046875, -14.6181640625, -14.100830078125, -13.58349609375, -13.066162109375, -12.548828125, -12.031494140625, -11.51416015625, -10.996826171875, -10.4794921875, -9.962158203125, -9.44482421875, -8.927490234375, -8.41015625, -7.892822265625, -7.37548828125, -6.858154296875, -6.3408203125, -5.823486328125, -5.30615234375, -4.788818359375, -4.271484375, -3.754150390625, -3.23681640625, -2.719482421875, -2.2021484375, -1.684814453125, -1.16748046875, -0.650146484375, -0.1328125, 0.384521484375, 0.90185546875, 1.419189453125, 1.9365234375, 2.453857421875, 2.97119140625, 3.488525390625, 4.005859375, 4.523193359375, 5.04052734375, 5.557861328125, 6.0751953125, 6.592529296875, 7.10986328125, 7.627197265625, 8.14453125, 8.661865234375, 9.17919921875, 9.696533203125, 10.2138671875, 10.731201171875, 11.24853515625, 11.765869140625, 12.283203125, 12.800537109375, 13.31787109375, 13.835205078125, 14.3525390625, 14.869873046875, 15.38720703125, 15.904541015625, 16.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 5.0, 14.0, 18.0, 7.0, 9.0, 27.0, 28.0, 31.0, 36.0, 23.0, 63.0, 46.0, 37.0, 46.0, 62.0, 39.0, 51.0, 61.0, 53.0, 42.0, 35.0, 44.0, 32.0, 29.0, 30.0, 21.0, 29.0, 12.0, 11.0, 5.0, 6.0, 9.0, 12.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0032806396484375, -0.0031862258911132812, -0.0030918121337890625, -0.0029973983764648438, -0.002902984619140625, -0.0028085708618164062, -0.0027141571044921875, -0.0026197433471679688, -0.00252532958984375, -0.0024309158325195312, -0.0023365020751953125, -0.0022420883178710938, -0.002147674560546875, -0.0020532608032226562, -0.0019588470458984375, -0.0018644332885742188, -0.00177001953125, -0.0016756057739257812, -0.0015811920166015625, -0.0014867782592773438, -0.001392364501953125, -0.0012979507446289062, -0.0012035369873046875, -0.0011091232299804688, -0.00101470947265625, -0.0009202957153320312, -0.0008258819580078125, -0.0007314682006835938, -0.000637054443359375, -0.0005426406860351562, -0.0004482269287109375, -0.00035381317138671875, -0.0002593994140625, -0.00016498565673828125, -7.05718994140625e-05, 2.384185791015625e-05, 0.000118255615234375, 0.00021266937255859375, 0.0003070831298828125, 0.00040149688720703125, 0.00049591064453125, 0.0005903244018554688, 0.0006847381591796875, 0.0007791519165039062, 0.000873565673828125, 0.0009679794311523438, 0.0010623931884765625, 0.0011568069458007812, 0.001251220703125, 0.0013456344604492188, 0.0014400482177734375, 0.0015344619750976562, 0.001628875732421875, 0.0017232894897460938, 0.0018177032470703125, 0.0019121170043945312, 0.00200653076171875, 0.0021009445190429688, 0.0021953582763671875, 0.0022897720336914062, 0.002384185791015625, 0.0024785995483398438, 0.0025730133056640625, 0.0026674270629882812, 0.0027618408203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 7.0, 9.0, 15.0, 24.0, 31.0, 69.0, 94.0, 128.0, 206.0, 340.0, 541.0, 822.0, 1354.0, 2088.0, 3173.0, 4704.0, 7286.0, 10506.0, 15118.0, 21263.0, 29241.0, 38493.0, 49037.0, 60918.0, 72173.0, 81428.0, 86658.0, 88751.0, 86516.0, 79628.0, 70329.0, 59557.0, 47971.0, 37241.0, 27825.0, 20717.0, 14372.0, 10041.0, 6753.0, 4586.0, 2971.0, 2043.0, 1285.0, 830.0, 500.0, 338.0, 230.0, 140.0, 81.0, 54.0, 29.0, 17.0, 17.0, 5.0, 6.0, 1.0, 6.0, 1.0, 3.0], "bins": [-19.6875, -19.08056640625, -18.4736328125, -17.86669921875, -17.259765625, -16.65283203125, -16.0458984375, -15.43896484375, -14.83203125, -14.22509765625, -13.6181640625, -13.01123046875, -12.404296875, -11.79736328125, -11.1904296875, -10.58349609375, -9.9765625, -9.36962890625, -8.7626953125, -8.15576171875, -7.548828125, -6.94189453125, -6.3349609375, -5.72802734375, -5.12109375, -4.51416015625, -3.9072265625, -3.30029296875, -2.693359375, -2.08642578125, -1.4794921875, -0.87255859375, -0.265625, 0.34130859375, 0.9482421875, 1.55517578125, 2.162109375, 2.76904296875, 3.3759765625, 3.98291015625, 4.58984375, 5.19677734375, 5.8037109375, 6.41064453125, 7.017578125, 7.62451171875, 8.2314453125, 8.83837890625, 9.4453125, 10.05224609375, 10.6591796875, 11.26611328125, 11.873046875, 12.47998046875, 13.0869140625, 13.69384765625, 14.30078125, 14.90771484375, 15.5146484375, 16.12158203125, 16.728515625, 17.33544921875, 17.9423828125, 18.54931640625, 19.15625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 7.0, 7.0, 12.0, 11.0, 14.0, 15.0, 7.0, 28.0, 15.0, 26.0, 31.0, 29.0, 42.0, 36.0, 36.0, 51.0, 42.0, 37.0, 40.0, 55.0, 51.0, 54.0, 37.0, 27.0, 39.0, 33.0, 28.0, 33.0, 24.0, 24.0, 19.0, 15.0, 11.0, 16.0, 8.0, 11.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8515625, -10.503662109375, -10.15576171875, -9.807861328125, -9.4599609375, -9.112060546875, -8.76416015625, -8.416259765625, -8.068359375, -7.720458984375, -7.37255859375, -7.024658203125, -6.6767578125, -6.328857421875, -5.98095703125, -5.633056640625, -5.28515625, -4.937255859375, -4.58935546875, -4.241455078125, -3.8935546875, -3.545654296875, -3.19775390625, -2.849853515625, -2.501953125, -2.154052734375, -1.80615234375, -1.458251953125, -1.1103515625, -0.762451171875, -0.41455078125, -0.066650390625, 0.28125, 0.629150390625, 0.97705078125, 1.324951171875, 1.6728515625, 2.020751953125, 2.36865234375, 2.716552734375, 3.064453125, 3.412353515625, 3.76025390625, 4.108154296875, 4.4560546875, 4.803955078125, 5.15185546875, 5.499755859375, 5.84765625, 6.195556640625, 6.54345703125, 6.891357421875, 7.2392578125, 7.587158203125, 7.93505859375, 8.282958984375, 8.630859375, 8.978759765625, 9.32666015625, 9.674560546875, 10.0224609375, 10.370361328125, 10.71826171875, 11.066162109375, 11.4140625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 4.0, 6.0, 7.0, 10.0, 8.0, 5.0, 9.0, 12.0, 13.0, 21.0, 18.0, 26.0, 26.0, 33.0, 37.0, 31.0, 28.0, 47.0, 35.0, 36.0, 41.0, 45.0, 51.0, 49.0, 33.0, 38.0, 41.0, 38.0, 29.0, 27.0, 32.0, 19.0, 19.0, 27.0, 14.0, 17.0, 16.0, 12.0, 12.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-68.19844055175781, -66.23094940185547, -64.26345825195312, -62.295963287353516, -60.32847213745117, -58.36098098754883, -56.39348602294922, -54.425994873046875, -52.45850372314453, -50.49101257324219, -48.523521423339844, -46.556026458740234, -44.58853530883789, -42.62104415893555, -40.65354919433594, -38.686058044433594, -36.71856689453125, -34.751075744628906, -32.78358459472656, -30.816089630126953, -28.84859848022461, -26.881107330322266, -24.91361427307129, -22.946121215820312, -20.97863006591797, -19.011138916015625, -17.04364585876465, -15.076153755187988, -13.108661651611328, -11.141169548034668, -9.173677444458008, -7.206185340881348, -5.238697052001953, -3.271204948425293, -1.3037128448486328, 0.6637792587280273, 2.6312713623046875, 4.598763465881348, 6.566255569458008, 8.533747673034668, 10.501239776611328, 12.468731880187988, 14.436223983764648, 16.403717041015625, 18.37120819091797, 20.338699340820312, 22.30619239807129, 24.273685455322266, 26.24117660522461, 28.208667755126953, 30.17616081237793, 32.143653869628906, 34.11114501953125, 36.078636169433594, 38.04612731933594, 40.01362228393555, 41.98111343383789, 43.948604583740234, 45.916099548339844, 47.88359069824219, 49.85108184814453, 51.818572998046875, 53.78606414794922, 55.75355911254883, 57.72105026245117]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 6.0, 10.0, 7.0, 5.0, 15.0, 13.0, 13.0, 10.0, 20.0, 23.0, 24.0, 26.0, 30.0, 26.0, 34.0, 27.0, 27.0, 40.0, 31.0, 37.0, 42.0, 42.0, 35.0, 39.0, 44.0, 36.0, 39.0, 35.0, 36.0, 28.0, 27.0, 32.0, 25.0, 16.0, 13.0, 13.0, 13.0, 9.0, 12.0, 7.0, 8.0, 3.0, 1.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.96417236328125, -69.64633178710938, -67.32849884033203, -65.01065826416016, -62.69282150268555, -60.37498474121094, -58.05714416503906, -55.73930740356445, -53.421470642089844, -51.103633880615234, -48.785797119140625, -46.46795654296875, -44.15011978149414, -41.83228302001953, -39.514442443847656, -37.19660568237305, -34.87876892089844, -32.56093215942383, -30.243093490600586, -27.925254821777344, -25.607418060302734, -23.289581298828125, -20.971742630004883, -18.65390396118164, -16.33606719970703, -14.018229484558105, -11.70039176940918, -9.382554054260254, -7.064716339111328, -4.746878623962402, -2.4290409088134766, -0.11120223999023438, 2.2066421508789062, 4.524479866027832, 6.842317581176758, 9.160155296325684, 11.47799301147461, 13.795830726623535, 16.11366844177246, 18.431507110595703, 20.749343872070312, 23.067180633544922, 25.385019302368164, 27.702857971191406, 30.020694732666016, 32.338531494140625, 34.6563720703125, 36.97420883178711, 39.29204559326172, 41.60988235473633, 43.92771911621094, 46.24555969238281, 48.56339645385742, 50.88123321533203, 53.199073791503906, 55.516910552978516, 57.834747314453125, 60.152584075927734, 62.470420837402344, 64.78826141357422, 67.10609436035156, 69.42393493652344, 71.74177551269531, 74.05961608886719, 76.37744903564453]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 6.0, 8.0, 9.0, 14.0, 38.0, 37.0, 83.0, 126.0, 216.0, 372.0, 662.0, 1084.0, 1871.0, 2974.0, 5202.0, 8791.0, 14234.0, 23117.0, 37060.0, 57523.0, 87068.0, 128465.0, 179982.0, 243340.0, 308474.0, 367950.0, 409735.0, 424477.0, 410613.0, 369544.0, 309948.0, 245298.0, 182600.0, 129856.0, 88556.0, 58590.0, 37618.0, 23447.0, 14285.0, 8713.0, 5055.0, 3060.0, 1748.0, 1057.0, 586.0, 340.0, 195.0, 100.0, 62.0, 45.0, 20.0, 10.0, 16.0, 11.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.59375, -46.08349609375, -44.5732421875, -43.06298828125, -41.552734375, -40.04248046875, -38.5322265625, -37.02197265625, -35.51171875, -34.00146484375, -32.4912109375, -30.98095703125, -29.470703125, -27.96044921875, -26.4501953125, -24.93994140625, -23.4296875, -21.91943359375, -20.4091796875, -18.89892578125, -17.388671875, -15.87841796875, -14.3681640625, -12.85791015625, -11.34765625, -9.83740234375, -8.3271484375, -6.81689453125, -5.306640625, -3.79638671875, -2.2861328125, -0.77587890625, 0.734375, 2.24462890625, 3.7548828125, 5.26513671875, 6.775390625, 8.28564453125, 9.7958984375, 11.30615234375, 12.81640625, 14.32666015625, 15.8369140625, 17.34716796875, 18.857421875, 20.36767578125, 21.8779296875, 23.38818359375, 24.8984375, 26.40869140625, 27.9189453125, 29.42919921875, 30.939453125, 32.44970703125, 33.9599609375, 35.47021484375, 36.98046875, 38.49072265625, 40.0009765625, 41.51123046875, 43.021484375, 44.53173828125, 46.0419921875, 47.55224609375, 49.0625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 10.0, 7.0, 6.0, 10.0, 15.0, 16.0, 12.0, 15.0, 20.0, 23.0, 27.0, 31.0, 26.0, 33.0, 27.0, 26.0, 31.0, 47.0, 26.0, 40.0, 49.0, 33.0, 39.0, 46.0, 34.0, 36.0, 39.0, 33.0, 33.0, 28.0, 33.0, 24.0, 19.0, 11.0, 15.0, 13.0, 13.0, 8.0, 9.0, 6.0, 5.0, 1.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.0625, -67.8310546875, -65.599609375, -63.3681640625, -61.13671875, -58.9052734375, -56.673828125, -54.4423828125, -52.2109375, -49.9794921875, -47.748046875, -45.5166015625, -43.28515625, -41.0537109375, -38.822265625, -36.5908203125, -34.359375, -32.1279296875, -29.896484375, -27.6650390625, -25.43359375, -23.2021484375, -20.970703125, -18.7392578125, -16.5078125, -14.2763671875, -12.044921875, -9.8134765625, -7.58203125, -5.3505859375, -3.119140625, -0.8876953125, 1.34375, 3.5751953125, 5.806640625, 8.0380859375, 10.26953125, 12.5009765625, 14.732421875, 16.9638671875, 19.1953125, 21.4267578125, 23.658203125, 25.8896484375, 28.12109375, 30.3525390625, 32.583984375, 34.8154296875, 37.046875, 39.2783203125, 41.509765625, 43.7412109375, 45.97265625, 48.2041015625, 50.435546875, 52.6669921875, 54.8984375, 57.1298828125, 59.361328125, 61.5927734375, 63.82421875, 66.0556640625, 68.287109375, 70.5185546875, 72.75]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 14.0, 23.0, 35.0, 55.0, 114.0, 186.0, 368.0, 542.0, 935.0, 1610.0, 2601.0, 4214.0, 6900.0, 10964.0, 16819.0, 26021.0, 38856.0, 57466.0, 82106.0, 114107.0, 152272.0, 196654.0, 243851.0, 288975.0, 327980.0, 353175.0, 361629.0, 352701.0, 326822.0, 286397.0, 241742.0, 192602.0, 150385.0, 111531.0, 80422.0, 55833.0, 38263.0, 25322.0, 16439.0, 10412.0, 6562.0, 4106.0, 2498.0, 1541.0, 907.0, 565.0, 321.0, 208.0, 108.0, 47.0, 50.0, 19.0, 6.0, 4.0, 4.0, 2.0], "bins": [-49.53125, -48.09423828125, -46.6572265625, -45.22021484375, -43.783203125, -42.34619140625, -40.9091796875, -39.47216796875, -38.03515625, -36.59814453125, -35.1611328125, -33.72412109375, -32.287109375, -30.85009765625, -29.4130859375, -27.97607421875, -26.5390625, -25.10205078125, -23.6650390625, -22.22802734375, -20.791015625, -19.35400390625, -17.9169921875, -16.47998046875, -15.04296875, -13.60595703125, -12.1689453125, -10.73193359375, -9.294921875, -7.85791015625, -6.4208984375, -4.98388671875, -3.546875, -2.10986328125, -0.6728515625, 0.76416015625, 2.201171875, 3.63818359375, 5.0751953125, 6.51220703125, 7.94921875, 9.38623046875, 10.8232421875, 12.26025390625, 13.697265625, 15.13427734375, 16.5712890625, 18.00830078125, 19.4453125, 20.88232421875, 22.3193359375, 23.75634765625, 25.193359375, 26.63037109375, 28.0673828125, 29.50439453125, 30.94140625, 32.37841796875, 33.8154296875, 35.25244140625, 36.689453125, 38.12646484375, 39.5634765625, 41.00048828125, 42.4375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 12.0, 10.0, 21.0, 21.0, 23.0, 28.0, 33.0, 55.0, 68.0, 63.0, 91.0, 92.0, 102.0, 132.0, 141.0, 150.0, 160.0, 155.0, 186.0, 188.0, 190.0, 161.0, 179.0, 185.0, 189.0, 175.0, 189.0, 141.0, 110.0, 136.0, 107.0, 82.0, 91.0, 71.0, 67.0, 55.0, 51.0, 37.0, 28.0, 23.0, 18.0, 8.0, 12.0, 10.0, 1.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-29.796875, -28.88916015625, -27.9814453125, -27.07373046875, -26.166015625, -25.25830078125, -24.3505859375, -23.44287109375, -22.53515625, -21.62744140625, -20.7197265625, -19.81201171875, -18.904296875, -17.99658203125, -17.0888671875, -16.18115234375, -15.2734375, -14.36572265625, -13.4580078125, -12.55029296875, -11.642578125, -10.73486328125, -9.8271484375, -8.91943359375, -8.01171875, -7.10400390625, -6.1962890625, -5.28857421875, -4.380859375, -3.47314453125, -2.5654296875, -1.65771484375, -0.75, 0.15771484375, 1.0654296875, 1.97314453125, 2.880859375, 3.78857421875, 4.6962890625, 5.60400390625, 6.51171875, 7.41943359375, 8.3271484375, 9.23486328125, 10.142578125, 11.05029296875, 11.9580078125, 12.86572265625, 13.7734375, 14.68115234375, 15.5888671875, 16.49658203125, 17.404296875, 18.31201171875, 19.2197265625, 20.12744140625, 21.03515625, 21.94287109375, 22.8505859375, 23.75830078125, 24.666015625, 25.57373046875, 26.4814453125, 27.38916015625, 28.296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 9.0, 6.0, 8.0, 6.0, 4.0, 12.0, 14.0, 12.0, 12.0, 33.0, 16.0, 26.0, 11.0, 27.0, 27.0, 35.0, 30.0, 38.0, 48.0, 40.0, 46.0, 42.0, 41.0, 53.0, 39.0, 29.0, 45.0, 38.0, 40.0, 36.0, 28.0, 23.0, 16.0, 20.0, 20.0, 10.0, 15.0, 11.0, 9.0, 10.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-71.62174987792969, -69.43634796142578, -67.25094604492188, -65.06553649902344, -62.88013458251953, -60.694732666015625, -58.50933074951172, -56.32392883300781, -54.13852310180664, -51.953121185302734, -49.76771545410156, -47.582313537597656, -45.39691162109375, -43.21150588989258, -41.02610397338867, -38.8406982421875, -36.655296325683594, -34.46989440917969, -32.284488677978516, -30.09908676147461, -27.91368293762207, -25.72827911376953, -23.542877197265625, -21.357473373413086, -19.172069549560547, -16.986665725708008, -14.801262855529785, -12.615859985351562, -10.430456161499023, -8.245052337646484, -6.059649467468262, -3.874246597290039, -1.6888351440429688, 0.4965682029724121, 2.681971549987793, 4.867374897003174, 7.052778244018555, 9.238182067871094, 11.423584938049316, 13.608987808227539, 15.794391632080078, 17.979795455932617, 20.165199279785156, 22.350601196289062, 24.5360050201416, 26.72140884399414, 28.906810760498047, 31.092214584350586, 33.277618408203125, 35.46302032470703, 37.6484260559082, 39.83382797241211, 42.01923370361328, 44.20463562011719, 46.390037536621094, 48.575439453125, 50.76084518432617, 52.94624710083008, 55.13165283203125, 57.317054748535156, 59.50245666503906, 61.687862396240234, 63.87326431274414, 66.05867004394531, 68.24407196044922]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 6.0, 7.0, 15.0, 17.0, 10.0, 14.0, 26.0, 21.0, 15.0, 32.0, 31.0, 30.0, 33.0, 39.0, 23.0, 43.0, 37.0, 40.0, 49.0, 42.0, 41.0, 54.0, 34.0, 42.0, 37.0, 28.0, 38.0, 29.0, 20.0, 24.0, 21.0, 13.0, 11.0, 13.0, 13.0, 8.0, 10.0, 5.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-92.8331527709961, -90.14823150634766, -87.46330261230469, -84.77838134765625, -82.09346008300781, -79.40853118896484, -76.7236099243164, -74.03868103027344, -71.353759765625, -68.66883850097656, -65.9839096069336, -63.298988342285156, -60.61406326293945, -57.92913818359375, -55.24421691894531, -52.55929183959961, -49.874366760253906, -47.1894416809082, -44.5045166015625, -41.81959533691406, -39.13467025756836, -36.449745178222656, -33.76482391357422, -31.079898834228516, -28.394973754882812, -25.71004867553711, -23.02512550354004, -20.34020233154297, -17.655277252197266, -14.970353126525879, -12.285429000854492, -9.600505828857422, -6.9155731201171875, -4.230648994445801, -1.545724868774414, 1.1391992568969727, 3.8241233825683594, 6.509047508239746, 9.193971633911133, 11.878894805908203, 14.563819885253906, 17.24874496459961, 19.93366813659668, 22.61859130859375, 25.303516387939453, 27.988441467285156, 30.673364639282227, 33.3582878112793, 36.043212890625, 38.7281379699707, 41.413063049316406, 44.097984313964844, 46.78290939331055, 49.46783447265625, 52.15275573730469, 54.83768081665039, 57.522605895996094, 60.2075309753418, 62.8924560546875, 65.57737731933594, 68.26229858398438, 70.94722747802734, 73.63214874267578, 76.31707763671875, 79.00199890136719]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 2.0, 16.0, 13.0, 21.0, 28.0, 28.0, 64.0, 102.0, 155.0, 258.0, 374.0, 557.0, 847.0, 1395.0, 2158.0, 3431.0, 5278.0, 8209.0, 12581.0, 19029.0, 28774.0, 42122.0, 59198.0, 80196.0, 101198.0, 117153.0, 121476.0, 112464.0, 94320.0, 73283.0, 53352.0, 37194.0, 25552.0, 16873.0, 10972.0, 7217.0, 4376.0, 2974.0, 1915.0, 1230.0, 748.0, 523.0, 310.0, 191.0, 143.0, 85.0, 60.0, 29.0, 36.0, 13.0, 8.0, 10.0, 7.0, 3.0, 4.0, 5.0, 2.0], "bins": [-11.46875, -11.124755859375, -10.78076171875, -10.436767578125, -10.0927734375, -9.748779296875, -9.40478515625, -9.060791015625, -8.716796875, -8.372802734375, -8.02880859375, -7.684814453125, -7.3408203125, -6.996826171875, -6.65283203125, -6.308837890625, -5.96484375, -5.620849609375, -5.27685546875, -4.932861328125, -4.5888671875, -4.244873046875, -3.90087890625, -3.556884765625, -3.212890625, -2.868896484375, -2.52490234375, -2.180908203125, -1.8369140625, -1.492919921875, -1.14892578125, -0.804931640625, -0.4609375, -0.116943359375, 0.22705078125, 0.571044921875, 0.9150390625, 1.259033203125, 1.60302734375, 1.947021484375, 2.291015625, 2.635009765625, 2.97900390625, 3.322998046875, 3.6669921875, 4.010986328125, 4.35498046875, 4.698974609375, 5.04296875, 5.386962890625, 5.73095703125, 6.074951171875, 6.4189453125, 6.762939453125, 7.10693359375, 7.450927734375, 7.794921875, 8.138916015625, 8.48291015625, 8.826904296875, 9.1708984375, 9.514892578125, 9.85888671875, 10.202880859375, 10.546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 6.0, 8.0, 14.0, 17.0, 10.0, 13.0, 24.0, 21.0, 17.0, 32.0, 31.0, 30.0, 32.0, 39.0, 26.0, 41.0, 36.0, 43.0, 43.0, 44.0, 45.0, 53.0, 33.0, 42.0, 37.0, 27.0, 39.0, 29.0, 21.0, 24.0, 22.0, 12.0, 11.0, 13.0, 13.0, 8.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-93.125, -90.431640625, -87.73828125, -85.044921875, -82.3515625, -79.658203125, -76.96484375, -74.271484375, -71.578125, -68.884765625, -66.19140625, -63.498046875, -60.8046875, -58.111328125, -55.41796875, -52.724609375, -50.03125, -47.337890625, -44.64453125, -41.951171875, -39.2578125, -36.564453125, -33.87109375, -31.177734375, -28.484375, -25.791015625, -23.09765625, -20.404296875, -17.7109375, -15.017578125, -12.32421875, -9.630859375, -6.9375, -4.244140625, -1.55078125, 1.142578125, 3.8359375, 6.529296875, 9.22265625, 11.916015625, 14.609375, 17.302734375, 19.99609375, 22.689453125, 25.3828125, 28.076171875, 30.76953125, 33.462890625, 36.15625, 38.849609375, 41.54296875, 44.236328125, 46.9296875, 49.623046875, 52.31640625, 55.009765625, 57.703125, 60.396484375, 63.08984375, 65.783203125, 68.4765625, 71.169921875, 73.86328125, 76.556640625, 79.25]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 9.0, 7.0, 15.0, 27.0, 25.0, 50.0, 59.0, 93.0, 145.0, 186.0, 269.0, 372.0, 547.0, 832.0, 1178.0, 1696.0, 2452.0, 3394.0, 4821.0, 7015.0, 10048.0, 14711.0, 23963.0, 74384.0, 724546.0, 101644.0, 25724.0, 15959.0, 10446.0, 7107.0, 4992.0, 3537.0, 2467.0, 1698.0, 1259.0, 911.0, 585.0, 400.0, 283.0, 209.0, 138.0, 99.0, 78.0, 59.0, 49.0, 19.0, 18.0, 5.0, 11.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0], "bins": [-21.828125, -21.15771484375, -20.4873046875, -19.81689453125, -19.146484375, -18.47607421875, -17.8056640625, -17.13525390625, -16.46484375, -15.79443359375, -15.1240234375, -14.45361328125, -13.783203125, -13.11279296875, -12.4423828125, -11.77197265625, -11.1015625, -10.43115234375, -9.7607421875, -9.09033203125, -8.419921875, -7.74951171875, -7.0791015625, -6.40869140625, -5.73828125, -5.06787109375, -4.3974609375, -3.72705078125, -3.056640625, -2.38623046875, -1.7158203125, -1.04541015625, -0.375, 0.29541015625, 0.9658203125, 1.63623046875, 2.306640625, 2.97705078125, 3.6474609375, 4.31787109375, 4.98828125, 5.65869140625, 6.3291015625, 6.99951171875, 7.669921875, 8.34033203125, 9.0107421875, 9.68115234375, 10.3515625, 11.02197265625, 11.6923828125, 12.36279296875, 13.033203125, 13.70361328125, 14.3740234375, 15.04443359375, 15.71484375, 16.38525390625, 17.0556640625, 17.72607421875, 18.396484375, 19.06689453125, 19.7373046875, 20.40771484375, 21.078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 6.0, 8.0, 18.0, 14.0, 17.0, 20.0, 8.0, 17.0, 25.0, 12.0, 21.0, 29.0, 31.0, 36.0, 27.0, 39.0, 37.0, 37.0, 42.0, 36.0, 35.0, 40.0, 40.0, 36.0, 32.0, 31.0, 33.0, 30.0, 14.0, 30.0, 22.0, 21.0, 16.0, 26.0, 17.0, 18.0, 14.0, 16.0, 8.0, 5.0, 7.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.71875, -47.09619140625, -45.4736328125, -43.85107421875, -42.228515625, -40.60595703125, -38.9833984375, -37.36083984375, -35.73828125, -34.11572265625, -32.4931640625, -30.87060546875, -29.248046875, -27.62548828125, -26.0029296875, -24.38037109375, -22.7578125, -21.13525390625, -19.5126953125, -17.89013671875, -16.267578125, -14.64501953125, -13.0224609375, -11.39990234375, -9.77734375, -8.15478515625, -6.5322265625, -4.90966796875, -3.287109375, -1.66455078125, -0.0419921875, 1.58056640625, 3.203125, 4.82568359375, 6.4482421875, 8.07080078125, 9.693359375, 11.31591796875, 12.9384765625, 14.56103515625, 16.18359375, 17.80615234375, 19.4287109375, 21.05126953125, 22.673828125, 24.29638671875, 25.9189453125, 27.54150390625, 29.1640625, 30.78662109375, 32.4091796875, 34.03173828125, 35.654296875, 37.27685546875, 38.8994140625, 40.52197265625, 42.14453125, 43.76708984375, 45.3896484375, 47.01220703125, 48.634765625, 50.25732421875, 51.8798828125, 53.50244140625, 55.125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 10.0, 4.0, 11.0, 14.0, 30.0, 40.0, 58.0, 80.0, 144.0, 211.0, 331.0, 531.0, 927.0, 1444.0, 2398.0, 4215.0, 6922.0, 11918.0, 20799.0, 40820.0, 817038.0, 79921.0, 25590.0, 14505.0, 8258.0, 4765.0, 2925.0, 1761.0, 1099.0, 625.0, 435.0, 255.0, 166.0, 100.0, 59.0, 42.0, 24.0, 19.0, 21.0, 9.0, 6.0, 2.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.640625, -2.5416259765625, -2.442626953125, -2.3436279296875, -2.24462890625, -2.1456298828125, -2.046630859375, -1.9476318359375, -1.8486328125, -1.7496337890625, -1.650634765625, -1.5516357421875, -1.45263671875, -1.3536376953125, -1.254638671875, -1.1556396484375, -1.056640625, -0.9576416015625, -0.858642578125, -0.7596435546875, -0.66064453125, -0.5616455078125, -0.462646484375, -0.3636474609375, -0.2646484375, -0.1656494140625, -0.066650390625, 0.0323486328125, 0.13134765625, 0.2303466796875, 0.329345703125, 0.4283447265625, 0.52734375, 0.6263427734375, 0.725341796875, 0.8243408203125, 0.92333984375, 1.0223388671875, 1.121337890625, 1.2203369140625, 1.3193359375, 1.4183349609375, 1.517333984375, 1.6163330078125, 1.71533203125, 1.8143310546875, 1.913330078125, 2.0123291015625, 2.111328125, 2.2103271484375, 2.309326171875, 2.4083251953125, 2.50732421875, 2.6063232421875, 2.705322265625, 2.8043212890625, 2.9033203125, 3.0023193359375, 3.101318359375, 3.2003173828125, 3.29931640625, 3.3983154296875, 3.497314453125, 3.5963134765625, 3.6953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 6.0, 6.0, 13.0, 17.0, 13.0, 22.0, 20.0, 21.0, 21.0, 40.0, 37.0, 42.0, 48.0, 44.0, 46.0, 52.0, 53.0, 42.0, 54.0, 45.0, 50.0, 40.0, 41.0, 22.0, 30.0, 30.0, 13.0, 26.0, 22.0, 14.0, 19.0, 10.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.185075759887695e-05, -8.923280984163284e-05, -8.661486208438873e-05, -8.399691432714462e-05, -8.137896656990051e-05, -7.87610188126564e-05, -7.614307105541229e-05, -7.352512329816818e-05, -7.090717554092407e-05, -6.828922778367996e-05, -6.567128002643585e-05, -6.305333226919174e-05, -6.043538451194763e-05, -5.781743675470352e-05, -5.519948899745941e-05, -5.25815412402153e-05, -4.996359348297119e-05, -4.734564572572708e-05, -4.472769796848297e-05, -4.210975021123886e-05, -3.949180245399475e-05, -3.687385469675064e-05, -3.425590693950653e-05, -3.163795918226242e-05, -2.902001142501831e-05, -2.64020636677742e-05, -2.378411591053009e-05, -2.116616815328598e-05, -1.854822039604187e-05, -1.593027263879776e-05, -1.331232488155365e-05, -1.069437712430954e-05, -8.07642936706543e-06, -5.45848160982132e-06, -2.8405338525772095e-06, -2.2258609533309937e-07, 2.3953616619110107e-06, 5.013309419155121e-06, 7.631257176399231e-06, 1.0249204933643341e-05, 1.2867152690887451e-05, 1.548510044813156e-05, 1.810304820537567e-05, 2.072099596261978e-05, 2.333894371986389e-05, 2.5956891477108002e-05, 2.8574839234352112e-05, 3.119278699159622e-05, 3.381073474884033e-05, 3.642868250608444e-05, 3.904663026332855e-05, 4.166457802057266e-05, 4.428252577781677e-05, 4.690047353506088e-05, 4.951842129230499e-05, 5.21363690495491e-05, 5.475431680679321e-05, 5.737226456403732e-05, 5.999021232128143e-05, 6.260816007852554e-05, 6.522610783576965e-05, 6.784405559301376e-05, 7.046200335025787e-05, 7.307995110750198e-05, 7.56978988647461e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 14.0, 12.0, 18.0, 38.0, 64.0, 119.0, 200.0, 303.0, 476.0, 866.0, 1548.0, 2549.0, 4217.0, 7221.0, 12463.0, 21180.0, 34973.0, 57077.0, 91183.0, 134474.0, 171199.0, 166988.0, 125995.0, 83971.0, 52424.0, 32261.0, 19117.0, 11356.0, 6721.0, 3987.0, 2289.0, 1353.0, 751.0, 462.0, 273.0, 144.0, 101.0, 59.0, 44.0, 23.0, 12.0, 11.0, 11.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.78515625, -2.6978759765625, -2.610595703125, -2.5233154296875, -2.43603515625, -2.3487548828125, -2.261474609375, -2.1741943359375, -2.0869140625, -1.9996337890625, -1.912353515625, -1.8250732421875, -1.73779296875, -1.6505126953125, -1.563232421875, -1.4759521484375, -1.388671875, -1.3013916015625, -1.214111328125, -1.1268310546875, -1.03955078125, -0.9522705078125, -0.864990234375, -0.7777099609375, -0.6904296875, -0.6031494140625, -0.515869140625, -0.4285888671875, -0.34130859375, -0.2540283203125, -0.166748046875, -0.0794677734375, 0.0078125, 0.0950927734375, 0.182373046875, 0.2696533203125, 0.35693359375, 0.4442138671875, 0.531494140625, 0.6187744140625, 0.7060546875, 0.7933349609375, 0.880615234375, 0.9678955078125, 1.05517578125, 1.1424560546875, 1.229736328125, 1.3170166015625, 1.404296875, 1.4915771484375, 1.578857421875, 1.6661376953125, 1.75341796875, 1.8406982421875, 1.927978515625, 2.0152587890625, 2.1025390625, 2.1898193359375, 2.277099609375, 2.3643798828125, 2.45166015625, 2.5389404296875, 2.626220703125, 2.7135009765625, 2.80078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 14.0, 10.0, 15.0, 15.0, 14.0, 16.0, 18.0, 25.0, 33.0, 30.0, 36.0, 41.0, 40.0, 57.0, 42.0, 39.0, 47.0, 56.0, 54.0, 53.0, 53.0, 34.0, 34.0, 36.0, 22.0, 25.0, 22.0, 26.0, 15.0, 14.0, 7.0, 7.0, 6.0, 3.0, 12.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3271484375, -1.2866668701171875, -1.246185302734375, -1.2057037353515625, -1.16522216796875, -1.1247406005859375, -1.084259033203125, -1.0437774658203125, -1.0032958984375, -0.9628143310546875, -0.922332763671875, -0.8818511962890625, -0.84136962890625, -0.8008880615234375, -0.760406494140625, -0.7199249267578125, -0.679443359375, -0.6389617919921875, -0.598480224609375, -0.5579986572265625, -0.51751708984375, -0.4770355224609375, -0.436553955078125, -0.3960723876953125, -0.3555908203125, -0.3151092529296875, -0.274627685546875, -0.2341461181640625, -0.19366455078125, -0.1531829833984375, -0.112701416015625, -0.0722198486328125, -0.03173828125, 0.0087432861328125, 0.049224853515625, 0.0897064208984375, 0.13018798828125, 0.1706695556640625, 0.211151123046875, 0.2516326904296875, 0.2921142578125, 0.3325958251953125, 0.373077392578125, 0.4135589599609375, 0.45404052734375, 0.4945220947265625, 0.535003662109375, 0.5754852294921875, 0.615966796875, 0.6564483642578125, 0.696929931640625, 0.7374114990234375, 0.77789306640625, 0.8183746337890625, 0.858856201171875, 0.8993377685546875, 0.9398193359375, 0.9803009033203125, 1.020782470703125, 1.0612640380859375, 1.10174560546875, 1.1422271728515625, 1.182708740234375, 1.2231903076171875, 1.263671875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 11.0, 5.0, 9.0, 5.0, 5.0, 13.0, 9.0, 17.0, 16.0, 27.0, 21.0, 21.0, 18.0, 32.0, 24.0, 35.0, 30.0, 37.0, 53.0, 46.0, 36.0, 43.0, 54.0, 34.0, 47.0, 35.0, 41.0, 38.0, 35.0, 29.0, 34.0, 22.0, 23.0, 16.0, 13.0, 13.0, 11.0, 8.0, 12.0, 9.0, 3.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.83599090576172, -68.6427001953125, -66.44940948486328, -64.25611114501953, -62.06282043457031, -59.869529724121094, -57.676239013671875, -55.482948303222656, -53.28965377807617, -51.09636306762695, -48.90306854248047, -46.70977783203125, -44.51648712158203, -42.32319259643555, -40.12990188598633, -37.936607360839844, -35.743316650390625, -33.550025939941406, -31.356731414794922, -29.163440704345703, -26.97014808654785, -24.77685546875, -22.58356475830078, -20.39027214050293, -18.196979522705078, -16.003686904907227, -13.810395240783691, -11.617103576660156, -9.423810958862305, -7.230518341064453, -5.037226676940918, -2.843935012817383, -0.6506423950195312, 1.542649745941162, 3.7359418869018555, 5.929234027862549, 8.122526168823242, 10.315818786621094, 12.509110450744629, 14.702402114868164, 16.895694732666016, 19.088987350463867, 21.28227996826172, 23.475570678710938, 25.66886329650879, 27.86215591430664, 30.05544662475586, 32.248741149902344, 34.44203186035156, 36.63532257080078, 38.828617095947266, 41.021907806396484, 43.21520233154297, 45.40849304199219, 47.601783752441406, 49.795074462890625, 51.98836898803711, 54.18165969848633, 56.37495422363281, 58.56824493408203, 60.76153564453125, 62.954830169677734, 65.14812469482422, 67.34141540527344, 69.53470611572266]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 10.0, 11.0, 18.0, 12.0, 11.0, 25.0, 21.0, 17.0, 29.0, 29.0, 29.0, 32.0, 45.0, 24.0, 38.0, 37.0, 41.0, 44.0, 41.0, 43.0, 60.0, 34.0, 40.0, 33.0, 32.0, 38.0, 31.0, 21.0, 26.0, 17.0, 18.0, 12.0, 10.0, 12.0, 9.0, 10.0, 7.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-93.45228576660156, -90.76252746582031, -88.07276916503906, -85.38300323486328, -82.69324493408203, -80.00348663330078, -77.313720703125, -74.62396240234375, -71.9342041015625, -69.24444580078125, -66.5546875, -63.86492156982422, -61.17516326904297, -58.48540496826172, -55.7956428527832, -53.10588073730469, -50.41612243652344, -47.72636413574219, -45.03660202026367, -42.346839904785156, -39.657081604003906, -36.967323303222656, -34.27756118774414, -31.587800979614258, -28.898040771484375, -26.208280563354492, -23.51852035522461, -20.828760147094727, -18.138999938964844, -15.449239730834961, -12.759479522705078, -10.069719314575195, -7.3799591064453125, -4.69019889831543, -2.000438690185547, 0.6893215179443359, 3.3790817260742188, 6.068841934204102, 8.758602142333984, 11.448362350463867, 14.13812255859375, 16.827882766723633, 19.517642974853516, 22.2074031829834, 24.89716339111328, 27.586923599243164, 30.276683807373047, 32.96644592285156, 35.65620422363281, 38.34596252441406, 41.03572463989258, 43.725486755371094, 46.415245056152344, 49.105003356933594, 51.79476547241211, 54.484527587890625, 57.174285888671875, 59.864044189453125, 62.55380630493164, 65.24356842041016, 67.9333267211914, 70.62308502197266, 73.31285095214844, 76.00260925292969, 78.69236755371094]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 12.0, 20.0, 34.0, 47.0, 111.0, 140.0, 215.0, 443.0, 662.0, 1145.0, 1737.0, 2901.0, 4831.0, 7677.0, 11948.0, 18496.0, 27974.0, 39692.0, 54878.0, 70863.0, 86648.0, 99660.0, 106413.0, 105433.0, 97258.0, 83167.0, 67487.0, 50953.0, 36527.0, 25468.0, 16766.0, 11006.0, 6938.0, 4235.0, 2617.0, 1585.0, 1020.0, 631.0, 376.0, 207.0, 148.0, 87.0, 39.0, 31.0, 13.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.625, -42.11474609375, -40.6044921875, -39.09423828125, -37.583984375, -36.07373046875, -34.5634765625, -33.05322265625, -31.54296875, -30.03271484375, -28.5224609375, -27.01220703125, -25.501953125, -23.99169921875, -22.4814453125, -20.97119140625, -19.4609375, -17.95068359375, -16.4404296875, -14.93017578125, -13.419921875, -11.90966796875, -10.3994140625, -8.88916015625, -7.37890625, -5.86865234375, -4.3583984375, -2.84814453125, -1.337890625, 0.17236328125, 1.6826171875, 3.19287109375, 4.703125, 6.21337890625, 7.7236328125, 9.23388671875, 10.744140625, 12.25439453125, 13.7646484375, 15.27490234375, 16.78515625, 18.29541015625, 19.8056640625, 21.31591796875, 22.826171875, 24.33642578125, 25.8466796875, 27.35693359375, 28.8671875, 30.37744140625, 31.8876953125, 33.39794921875, 34.908203125, 36.41845703125, 37.9287109375, 39.43896484375, 40.94921875, 42.45947265625, 43.9697265625, 45.47998046875, 46.990234375, 48.50048828125, 50.0107421875, 51.52099609375, 53.03125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 9.0, 13.0, 16.0, 13.0, 10.0, 25.0, 20.0, 20.0, 28.0, 25.0, 31.0, 32.0, 47.0, 23.0, 38.0, 38.0, 40.0, 43.0, 46.0, 43.0, 57.0, 36.0, 37.0, 34.0, 31.0, 43.0, 27.0, 23.0, 24.0, 19.0, 15.0, 15.0, 7.0, 13.0, 9.0, 11.0, 8.0, 2.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-92.6875, -90.01953125, -87.3515625, -84.68359375, -82.015625, -79.34765625, -76.6796875, -74.01171875, -71.34375, -68.67578125, -66.0078125, -63.33984375, -60.671875, -58.00390625, -55.3359375, -52.66796875, -50.0, -47.33203125, -44.6640625, -41.99609375, -39.328125, -36.66015625, -33.9921875, -31.32421875, -28.65625, -25.98828125, -23.3203125, -20.65234375, -17.984375, -15.31640625, -12.6484375, -9.98046875, -7.3125, -4.64453125, -1.9765625, 0.69140625, 3.359375, 6.02734375, 8.6953125, 11.36328125, 14.03125, 16.69921875, 19.3671875, 22.03515625, 24.703125, 27.37109375, 30.0390625, 32.70703125, 35.375, 38.04296875, 40.7109375, 43.37890625, 46.046875, 48.71484375, 51.3828125, 54.05078125, 56.71875, 59.38671875, 62.0546875, 64.72265625, 67.390625, 70.05859375, 72.7265625, 75.39453125, 78.0625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 6.0, 3.0, 9.0, 9.0, 22.0, 32.0, 68.0, 71.0, 103.0, 153.0, 271.0, 414.0, 631.0, 995.0, 1500.0, 2304.0, 3505.0, 5185.0, 7791.0, 11432.0, 16503.0, 23059.0, 31627.0, 42442.0, 54730.0, 66771.0, 78688.0, 88135.0, 91781.0, 91967.0, 86992.0, 77478.0, 66007.0, 53362.0, 41624.0, 31005.0, 22592.0, 15928.0, 11040.0, 7514.0, 5101.0, 3404.0, 2209.0, 1364.0, 961.0, 616.0, 423.0, 274.0, 183.0, 111.0, 58.0, 43.0, 35.0, 15.0, 11.0, 6.0, 3.0, 1.0, 4.0, 2.0], "bins": [-47.28125, -45.8466796875, -44.412109375, -42.9775390625, -41.54296875, -40.1083984375, -38.673828125, -37.2392578125, -35.8046875, -34.3701171875, -32.935546875, -31.5009765625, -30.06640625, -28.6318359375, -27.197265625, -25.7626953125, -24.328125, -22.8935546875, -21.458984375, -20.0244140625, -18.58984375, -17.1552734375, -15.720703125, -14.2861328125, -12.8515625, -11.4169921875, -9.982421875, -8.5478515625, -7.11328125, -5.6787109375, -4.244140625, -2.8095703125, -1.375, 0.0595703125, 1.494140625, 2.9287109375, 4.36328125, 5.7978515625, 7.232421875, 8.6669921875, 10.1015625, 11.5361328125, 12.970703125, 14.4052734375, 15.83984375, 17.2744140625, 18.708984375, 20.1435546875, 21.578125, 23.0126953125, 24.447265625, 25.8818359375, 27.31640625, 28.7509765625, 30.185546875, 31.6201171875, 33.0546875, 34.4892578125, 35.923828125, 37.3583984375, 38.79296875, 40.2275390625, 41.662109375, 43.0966796875, 44.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 8.0, 14.0, 12.0, 15.0, 19.0, 25.0, 20.0, 16.0, 28.0, 28.0, 36.0, 39.0, 36.0, 40.0, 42.0, 37.0, 49.0, 43.0, 38.0, 37.0, 29.0, 35.0, 49.0, 32.0, 34.0, 30.0, 23.0, 17.0, 24.0, 26.0, 16.0, 18.0, 15.0, 10.0, 8.0, 8.0, 9.0, 10.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.03125, -50.24755859375, -48.4638671875, -46.68017578125, -44.896484375, -43.11279296875, -41.3291015625, -39.54541015625, -37.76171875, -35.97802734375, -34.1943359375, -32.41064453125, -30.626953125, -28.84326171875, -27.0595703125, -25.27587890625, -23.4921875, -21.70849609375, -19.9248046875, -18.14111328125, -16.357421875, -14.57373046875, -12.7900390625, -11.00634765625, -9.22265625, -7.43896484375, -5.6552734375, -3.87158203125, -2.087890625, -0.30419921875, 1.4794921875, 3.26318359375, 5.046875, 6.83056640625, 8.6142578125, 10.39794921875, 12.181640625, 13.96533203125, 15.7490234375, 17.53271484375, 19.31640625, 21.10009765625, 22.8837890625, 24.66748046875, 26.451171875, 28.23486328125, 30.0185546875, 31.80224609375, 33.5859375, 35.36962890625, 37.1533203125, 38.93701171875, 40.720703125, 42.50439453125, 44.2880859375, 46.07177734375, 47.85546875, 49.63916015625, 51.4228515625, 53.20654296875, 54.990234375, 56.77392578125, 58.5576171875, 60.34130859375, 62.125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 11.0, 7.0, 18.0, 13.0, 38.0, 61.0, 100.0, 161.0, 280.0, 485.0, 790.0, 1352.0, 2301.0, 4096.0, 6875.0, 11507.0, 19034.0, 30302.0, 45594.0, 65563.0, 87105.0, 107075.0, 119980.0, 122091.0, 112278.0, 94523.0, 72608.0, 52559.0, 35335.0, 22484.0, 13991.0, 8297.0, 4948.0, 2803.0, 1631.0, 925.0, 538.0, 310.0, 186.0, 116.0, 67.0, 43.0, 31.0, 20.0, 11.0, 6.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-23.578125, -22.867431640625, -22.15673828125, -21.446044921875, -20.7353515625, -20.024658203125, -19.31396484375, -18.603271484375, -17.892578125, -17.181884765625, -16.47119140625, -15.760498046875, -15.0498046875, -14.339111328125, -13.62841796875, -12.917724609375, -12.20703125, -11.496337890625, -10.78564453125, -10.074951171875, -9.3642578125, -8.653564453125, -7.94287109375, -7.232177734375, -6.521484375, -5.810791015625, -5.10009765625, -4.389404296875, -3.6787109375, -2.968017578125, -2.25732421875, -1.546630859375, -0.8359375, -0.125244140625, 0.58544921875, 1.296142578125, 2.0068359375, 2.717529296875, 3.42822265625, 4.138916015625, 4.849609375, 5.560302734375, 6.27099609375, 6.981689453125, 7.6923828125, 8.403076171875, 9.11376953125, 9.824462890625, 10.53515625, 11.245849609375, 11.95654296875, 12.667236328125, 13.3779296875, 14.088623046875, 14.79931640625, 15.510009765625, 16.220703125, 16.931396484375, 17.64208984375, 18.352783203125, 19.0634765625, 19.774169921875, 20.48486328125, 21.195556640625, 21.90625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 8.0, 8.0, 11.0, 14.0, 25.0, 19.0, 26.0, 18.0, 38.0, 49.0, 30.0, 46.0, 49.0, 39.0, 47.0, 57.0, 49.0, 48.0, 47.0, 42.0, 45.0, 37.0, 31.0, 34.0, 32.0, 23.0, 21.0, 16.0, 14.0, 18.0, 11.0, 8.0, 8.0, 7.0, 9.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0028400421142578125, -0.0027502477169036865, -0.0026604533195495605, -0.0025706589221954346, -0.0024808645248413086, -0.0023910701274871826, -0.0023012757301330566, -0.0022114813327789307, -0.0021216869354248047, -0.0020318925380706787, -0.0019420981407165527, -0.0018523037433624268, -0.0017625093460083008, -0.0016727149486541748, -0.0015829205513000488, -0.0014931261539459229, -0.0014033317565917969, -0.001313537359237671, -0.001223742961883545, -0.001133948564529419, -0.001044154167175293, -0.000954359769821167, -0.000864565372467041, -0.000774770975112915, -0.0006849765777587891, -0.0005951821804046631, -0.0005053877830505371, -0.00041559338569641113, -0.00032579898834228516, -0.00023600459098815918, -0.0001462101936340332, -5.6415796279907227e-05, 3.337860107421875e-05, 0.00012317299842834473, 0.0002129673957824707, 0.0003027617931365967, 0.00039255619049072266, 0.00048235058784484863, 0.0005721449851989746, 0.0006619393825531006, 0.0007517337799072266, 0.0008415281772613525, 0.0009313225746154785, 0.0010211169719696045, 0.0011109113693237305, 0.0012007057666778564, 0.0012905001640319824, 0.0013802945613861084, 0.0014700889587402344, 0.0015598833560943604, 0.0016496777534484863, 0.0017394721508026123, 0.0018292665481567383, 0.0019190609455108643, 0.0020088553428649902, 0.002098649740219116, 0.002188444137573242, 0.002278238534927368, 0.002368032932281494, 0.00245782732963562, 0.002547621726989746, 0.002637416124343872, 0.002727210521697998, 0.002817004919052124, 0.00290679931640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 10.0, 14.0, 18.0, 31.0, 34.0, 63.0, 101.0, 174.0, 277.0, 415.0, 652.0, 1083.0, 1661.0, 2605.0, 4134.0, 6115.0, 9402.0, 13553.0, 19606.0, 27198.0, 37052.0, 47712.0, 59921.0, 71899.0, 82279.0, 89032.0, 91428.0, 89238.0, 82608.0, 73386.0, 61071.0, 48568.0, 37712.0, 27819.0, 20028.0, 13964.0, 9401.0, 6433.0, 4274.0, 2799.0, 1804.0, 1067.0, 768.0, 412.0, 262.0, 173.0, 110.0, 82.0, 47.0, 30.0, 11.0, 10.0, 7.0, 5.0, 4.0, 0.0, 1.0, 2.0], "bins": [-17.953125, -17.4013671875, -16.849609375, -16.2978515625, -15.74609375, -15.1943359375, -14.642578125, -14.0908203125, -13.5390625, -12.9873046875, -12.435546875, -11.8837890625, -11.33203125, -10.7802734375, -10.228515625, -9.6767578125, -9.125, -8.5732421875, -8.021484375, -7.4697265625, -6.91796875, -6.3662109375, -5.814453125, -5.2626953125, -4.7109375, -4.1591796875, -3.607421875, -3.0556640625, -2.50390625, -1.9521484375, -1.400390625, -0.8486328125, -0.296875, 0.2548828125, 0.806640625, 1.3583984375, 1.91015625, 2.4619140625, 3.013671875, 3.5654296875, 4.1171875, 4.6689453125, 5.220703125, 5.7724609375, 6.32421875, 6.8759765625, 7.427734375, 7.9794921875, 8.53125, 9.0830078125, 9.634765625, 10.1865234375, 10.73828125, 11.2900390625, 11.841796875, 12.3935546875, 12.9453125, 13.4970703125, 14.048828125, 14.6005859375, 15.15234375, 15.7041015625, 16.255859375, 16.8076171875, 17.359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 11.0, 4.0, 12.0, 18.0, 22.0, 18.0, 24.0, 35.0, 36.0, 31.0, 38.0, 39.0, 38.0, 47.0, 41.0, 36.0, 56.0, 44.0, 41.0, 47.0, 33.0, 51.0, 37.0, 34.0, 32.0, 28.0, 27.0, 21.0, 18.0, 13.0, 9.0, 9.0, 8.0, 7.0, 7.0, 8.0, 4.0, 4.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.8963623046875, -9.573974609375, -9.2515869140625, -8.92919921875, -8.6068115234375, -8.284423828125, -7.9620361328125, -7.6396484375, -7.3172607421875, -6.994873046875, -6.6724853515625, -6.35009765625, -6.0277099609375, -5.705322265625, -5.3829345703125, -5.060546875, -4.7381591796875, -4.415771484375, -4.0933837890625, -3.77099609375, -3.4486083984375, -3.126220703125, -2.8038330078125, -2.4814453125, -2.1590576171875, -1.836669921875, -1.5142822265625, -1.19189453125, -0.8695068359375, -0.547119140625, -0.2247314453125, 0.09765625, 0.4200439453125, 0.742431640625, 1.0648193359375, 1.38720703125, 1.7095947265625, 2.031982421875, 2.3543701171875, 2.6767578125, 2.9991455078125, 3.321533203125, 3.6439208984375, 3.96630859375, 4.2886962890625, 4.611083984375, 4.9334716796875, 5.255859375, 5.5782470703125, 5.900634765625, 6.2230224609375, 6.54541015625, 6.8677978515625, 7.190185546875, 7.5125732421875, 7.8349609375, 8.1573486328125, 8.479736328125, 8.8021240234375, 9.12451171875, 9.4468994140625, 9.769287109375, 10.0916748046875, 10.4140625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 7.0, 2.0, 12.0, 6.0, 11.0, 14.0, 16.0, 17.0, 24.0, 17.0, 21.0, 22.0, 29.0, 26.0, 27.0, 29.0, 33.0, 36.0, 51.0, 37.0, 33.0, 45.0, 40.0, 43.0, 39.0, 36.0, 42.0, 36.0, 36.0, 28.0, 23.0, 15.0, 19.0, 18.0, 12.0, 12.0, 19.0, 10.0, 9.0, 11.0, 10.0, 2.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-73.91032409667969, -71.82327270507812, -69.73622131347656, -67.64917755126953, -65.56212615966797, -63.475074768066406, -61.38802719116211, -59.30097961425781, -57.21392822265625, -55.12687683105469, -53.03982925415039, -50.952781677246094, -48.86573028564453, -46.77867889404297, -44.69163131713867, -42.604583740234375, -40.51753234863281, -38.43048095703125, -36.34343338012695, -34.256385803222656, -32.169334411621094, -30.082284927368164, -27.995235443115234, -25.908185958862305, -23.821136474609375, -21.734086990356445, -19.647037506103516, -17.559988021850586, -15.472938537597656, -13.385889053344727, -11.298839569091797, -9.211790084838867, -7.124744415283203, -5.037694931030273, -2.9506454467773438, -0.8635959625244141, 1.2234535217285156, 3.3105030059814453, 5.397552490234375, 7.484601974487305, 9.571651458740234, 11.658700942993164, 13.745750427246094, 15.832799911499023, 17.919849395751953, 20.006898880004883, 22.093948364257812, 24.180997848510742, 26.268047332763672, 28.3550968170166, 30.44214630126953, 32.529197692871094, 34.61624526977539, 36.70329284667969, 38.79034423828125, 40.87739562988281, 42.96444320678711, 45.051490783691406, 47.13854217529297, 49.22559356689453, 51.31264114379883, 53.399688720703125, 55.48674011230469, 57.57379150390625, 59.66083908081055]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 5.0, 2.0, 9.0, 4.0, 15.0, 9.0, 13.0, 21.0, 20.0, 16.0, 19.0, 27.0, 32.0, 30.0, 32.0, 31.0, 45.0, 42.0, 39.0, 36.0, 51.0, 45.0, 48.0, 36.0, 47.0, 42.0, 53.0, 36.0, 23.0, 24.0, 16.0, 13.0, 10.0, 21.0, 16.0, 12.0, 9.0, 9.0, 4.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-97.46207427978516, -94.4552993774414, -91.44853210449219, -88.44175720214844, -85.43498229980469, -82.42821502685547, -79.42144012451172, -76.4146728515625, -73.40789794921875, -70.401123046875, -67.39435577392578, -64.38758087158203, -61.38080978393555, -58.37403869628906, -55.36726379394531, -52.36049270629883, -49.353721618652344, -46.34695053100586, -43.340179443359375, -40.333404541015625, -37.32663345336914, -34.319862365722656, -31.31308937072754, -28.306316375732422, -25.299545288085938, -22.292774200439453, -19.286001205444336, -16.27922821044922, -13.272457122802734, -10.265685081481934, -7.258913040161133, -4.252140045166016, -1.245361328125, 1.7614107131958008, 4.768182754516602, 7.774954795837402, 10.781726837158203, 13.788498878479004, 16.795270919799805, 19.802043914794922, 22.808815002441406, 25.81558609008789, 28.822359085083008, 31.829132080078125, 34.83590316772461, 37.842674255371094, 40.849449157714844, 43.85622024536133, 46.86299133300781, 49.8697624206543, 52.87653350830078, 55.88330841064453, 58.890079498291016, 61.8968505859375, 64.90362548828125, 67.910400390625, 70.91716766357422, 73.92394256591797, 76.93070983886719, 79.93748474121094, 82.94425964355469, 85.9510269165039, 88.95780181884766, 91.96456909179688, 94.97134399414062]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 1.0, 5.0, 9.0, 8.0, 12.0, 18.0, 30.0, 46.0, 45.0, 61.0, 86.0, 133.0, 173.0, 212.0, 318.0, 467.0, 525.0, 647.0, 858.0, 1179.0, 1432.0, 1762.0, 2116.0, 2523.0, 2869.0, 3354.0, 1009523.0, 4180.0, 3228.0, 2842.0, 2398.0, 1986.0, 1670.0, 1310.0, 1052.0, 854.0, 652.0, 509.0, 365.0, 290.0, 251.0, 180.0, 122.0, 89.0, 62.0, 44.0, 26.0, 19.0, 23.0, 15.0, 7.0, 6.0, 6.0, 2.0, 8.0, 3.0], "bins": [-596.8502197265625, -579.7380981445312, -562.6259155273438, -545.5137939453125, -528.4016723632812, -511.2895202636719, -494.1773681640625, -477.06524658203125, -459.9530944824219, -442.8409423828125, -425.72882080078125, -408.6166687011719, -391.5045166015625, -374.39239501953125, -357.2802429199219, -340.1680908203125, -323.05596923828125, -305.9438171386719, -288.8316955566406, -271.71954345703125, -254.60740661621094, -237.49526977539062, -220.38311767578125, -203.27098083496094, -186.15884399414062, -169.0467071533203, -151.9345703125, -134.82241821289062, -117.71028137207031, -100.59814453125, -83.48600006103516, -66.37385559082031, -49.261688232421875, -32.1495475769043, -15.037406921386719, 2.0747337341308594, 19.186874389648438, 36.29901123046875, 53.411155700683594, 70.52330017089844, 87.63543701171875, 104.74757385253906, 121.8597183227539, 138.97186279296875, 156.08399963378906, 173.19613647460938, 190.30828857421875, 207.42042541503906, 224.53256225585938, 241.6446990966797, 258.7568359375, 275.8689880371094, 292.98114013671875, 310.09326171875, 327.2054138183594, 344.31756591796875, 361.4296875, 378.5418395996094, 395.6539611816406, 412.76611328125, 429.87823486328125, 446.9903869628906, 464.1025390625, 481.21466064453125, 498.3268127441406]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 13.0, 16.0, 18.0, 32.0, 47.0, 70.0, 116.0, 170.0, 250.0, 357.0, 509.0, 735.0, 1129.0, 1613.0, 2294.0, 3526.0, 5220.0, 8417.0, 15285.0, 33200.0, 51317824.0, 37883.0, 16696.0, 8907.0, 5475.0, 3691.0, 2394.0, 1714.0, 1191.0, 830.0, 555.0, 411.0, 232.0, 171.0, 119.0, 66.0, 60.0, 37.0, 28.0, 13.0, 9.0, 10.0, 8.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-682.1965942382812, -659.1227416992188, -636.0489501953125, -612.97509765625, -589.9012451171875, -566.8274536132812, -543.7536010742188, -520.6798095703125, -497.60595703125, -474.5321350097656, -451.4582824707031, -428.38446044921875, -405.3106384277344, -382.23681640625, -359.1629638671875, -336.0891418457031, -313.0152893066406, -289.94146728515625, -266.86761474609375, -243.79379272460938, -220.719970703125, -197.64613342285156, -174.57229614257812, -151.49847412109375, -128.4246368408203, -105.3508071899414, -82.2769775390625, -59.20314025878906, -36.129310607910156, -13.05548095703125, 10.018356323242188, 33.09217834472656, 56.166015625, 79.2398452758789, 102.31367492675781, 125.38751220703125, 148.46133422851562, 171.53517150878906, 194.6090087890625, 217.68283081054688, 240.7566680908203, 263.83050537109375, 286.9043273925781, 309.9781494140625, 333.052001953125, 356.1258239746094, 379.19964599609375, 402.27349853515625, 425.3473205566406, 448.421142578125, 471.4949951171875, 494.5688171386719, 517.6426391601562, 540.7164916992188, 563.790283203125, 586.8641357421875, 609.93798828125, 633.0118408203125, 656.0856323242188, 679.1594848632812, 702.2333374023438, 725.30712890625, 748.3809814453125, 771.454833984375, 794.5286254882812]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 5.0, 12.0, 11.0, 12.0, 9.0, 21.0, 29.0, 28.0, 45.0, 47.0, 64.0, 63.0, 89.0, 82.0, 74.0, 84.0, 62.0, 47.0, 51.0, 34.0, 29.0, 23.0, 17.0, 14.0, 11.0, 9.0, 6.0, 4.0, 6.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-522.4603271484375, -500.36871337890625, -478.277099609375, -456.18548583984375, -434.0938720703125, -412.00225830078125, -389.9106140136719, -367.8190002441406, -345.7273864746094, -323.6357727050781, -301.5441589355469, -279.4525146484375, -257.36090087890625, -235.26930236816406, -213.17767333984375, -191.0860595703125, -168.99444580078125, -146.90283203125, -124.81121063232422, -102.71958923339844, -80.62797546386719, -58.53636169433594, -36.444732666015625, -14.353118896484375, 7.738494873046875, 29.83011245727539, 51.921730041503906, 74.01335144042969, 96.10496520996094, 118.19657897949219, 140.2882080078125, 162.37982177734375, 184.471435546875, 206.56304931640625, 228.6546630859375, 250.7462921142578, 272.837890625, 294.92950439453125, 317.0211486816406, 339.1127624511719, 361.2043762207031, 383.2959899902344, 405.3876037597656, 427.479248046875, 449.57086181640625, 471.6624755859375, 493.75408935546875, 515.845703125, 537.9373168945312, 560.0289306640625, 582.1205444335938, 604.212158203125, 626.3037719726562, 648.3953857421875, 670.487060546875, 692.57861328125, 714.6702880859375, 736.7619018554688, 758.853515625, 780.9451293945312, 803.0367431640625, 825.1283569335938, 847.219970703125, 869.3116455078125, 891.4031982421875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 6.0, 10.0, 15.0, 13.0, 17.0, 23.0, 23.0, 30.0, 24.0, 31.0, 36.0, 47.0, 29.0, 55.0, 64.0, 65.0, 56.0, 51.0, 53.0, 43.0, 38.0, 45.0, 32.0, 23.0, 29.0, 15.0, 15.0, 13.0, 19.0, 11.0, 11.0, 4.0, 9.0, 5.0, 13.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-685.2730712890625, -664.1161499023438, -642.959228515625, -621.80224609375, -600.6453247070312, -579.4884033203125, -558.3314208984375, -537.1744995117188, -516.017578125, -494.86065673828125, -473.7037048339844, -452.5467529296875, -431.38983154296875, -410.23291015625, -389.0759582519531, -367.91900634765625, -346.7620849609375, -325.60516357421875, -304.4482116699219, -283.291259765625, -262.13433837890625, -240.97740173339844, -219.82046508789062, -198.6635284423828, -177.506591796875, -156.3496551513672, -135.19271850585938, -114.03578186035156, -92.87884521484375, -71.72190856933594, -50.564971923828125, -29.408035278320312, -8.25115966796875, 12.905776977539062, 34.062713623046875, 55.21965026855469, 76.3765869140625, 97.53352355957031, 118.69046020507812, 139.84739685058594, 161.00433349609375, 182.16127014160156, 203.31820678710938, 224.4751434326172, 245.632080078125, 266.78900146484375, 287.9459533691406, 309.1029052734375, 330.25982666015625, 351.416748046875, 372.5736999511719, 393.73065185546875, 414.8875732421875, 436.04449462890625, 457.2014465332031, 478.3583984375, 499.51531982421875, 520.6722412109375, 541.8292236328125, 562.9861450195312, 584.14306640625, 605.2999877929688, 626.4569091796875, 647.6138916015625, 668.7708129882812]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 3.0, 6.0, 10.0, 9.0, 19.0, 15.0, 26.0, 43.0, 34.0, 71.0, 132.0, 210.0, 231.0, 366.0, 487.0, 806.0, 1212.0, 1887.0, 2929.0, 4771.0, 8133.0, 14753.0, 30545.0, 72491.0, 218260.0, 1744524.0, 1740637.0, 212032.0, 71431.0, 30100.0, 14913.0, 8406.0, 5041.0, 3223.0, 2068.0, 1383.0, 963.0, 647.0, 433.0, 319.0, 237.0, 139.0, 97.0, 81.0, 54.0, 38.0, 21.0, 16.0, 16.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.953125, -21.26708984375, -20.5810546875, -19.89501953125, -19.208984375, -18.52294921875, -17.8369140625, -17.15087890625, -16.46484375, -15.77880859375, -15.0927734375, -14.40673828125, -13.720703125, -13.03466796875, -12.3486328125, -11.66259765625, -10.9765625, -10.29052734375, -9.6044921875, -8.91845703125, -8.232421875, -7.54638671875, -6.8603515625, -6.17431640625, -5.48828125, -4.80224609375, -4.1162109375, -3.43017578125, -2.744140625, -2.05810546875, -1.3720703125, -0.68603515625, 0.0, 0.68603515625, 1.3720703125, 2.05810546875, 2.744140625, 3.43017578125, 4.1162109375, 4.80224609375, 5.48828125, 6.17431640625, 6.8603515625, 7.54638671875, 8.232421875, 8.91845703125, 9.6044921875, 10.29052734375, 10.9765625, 11.66259765625, 12.3486328125, 13.03466796875, 13.720703125, 14.40673828125, 15.0927734375, 15.77880859375, 16.46484375, 17.15087890625, 17.8369140625, 18.52294921875, 19.208984375, 19.89501953125, 20.5810546875, 21.26708984375, 21.953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 8.0, 15.0, 26.0, 28.0, 45.0, 56.0, 71.0, 89.0, 106.0, 103.0, 92.0, 97.0, 49.0, 49.0, 35.0, 29.0, 18.0, 12.0, 8.0, 5.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.345703125, -2.27099609375, -2.1962890625, -2.12158203125, -2.046875, -1.97216796875, -1.8974609375, -1.82275390625, -1.748046875, -1.67333984375, -1.5986328125, -1.52392578125, -1.44921875, -1.37451171875, -1.2998046875, -1.22509765625, -1.150390625, -1.07568359375, -1.0009765625, -0.92626953125, -0.8515625, -0.77685546875, -0.7021484375, -0.62744140625, -0.552734375, -0.47802734375, -0.4033203125, -0.32861328125, -0.25390625, -0.17919921875, -0.1044921875, -0.02978515625, 0.044921875, 0.11962890625, 0.1943359375, 0.26904296875, 0.34375, 0.41845703125, 0.4931640625, 0.56787109375, 0.642578125, 0.71728515625, 0.7919921875, 0.86669921875, 0.94140625, 1.01611328125, 1.0908203125, 1.16552734375, 1.240234375, 1.31494140625, 1.3896484375, 1.46435546875, 1.5390625, 1.61376953125, 1.6884765625, 1.76318359375, 1.837890625, 1.91259765625, 1.9873046875, 2.06201171875, 2.13671875, 2.21142578125, 2.2861328125, 2.36083984375, 2.435546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 7.0, 9.0, 19.0, 13.0, 19.0, 39.0, 47.0, 79.0, 96.0, 165.0, 213.0, 408.0, 640.0, 1160.0, 2180.0, 4869.0, 11423.0, 29105.0, 87300.0, 318323.0, 2193349.0, 1185279.0, 245429.0, 71245.0, 24468.0, 9447.0, 4216.0, 2025.0, 1028.0, 602.0, 369.0, 228.0, 137.0, 103.0, 54.0, 52.0, 36.0, 28.0, 12.0, 19.0, 14.0, 2.0, 4.0, 2.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.7119140625, -18.064453125, -17.4169921875, -16.76953125, -16.1220703125, -15.474609375, -14.8271484375, -14.1796875, -13.5322265625, -12.884765625, -12.2373046875, -11.58984375, -10.9423828125, -10.294921875, -9.6474609375, -9.0, -8.3525390625, -7.705078125, -7.0576171875, -6.41015625, -5.7626953125, -5.115234375, -4.4677734375, -3.8203125, -3.1728515625, -2.525390625, -1.8779296875, -1.23046875, -0.5830078125, 0.064453125, 0.7119140625, 1.359375, 2.0068359375, 2.654296875, 3.3017578125, 3.94921875, 4.5966796875, 5.244140625, 5.8916015625, 6.5390625, 7.1865234375, 7.833984375, 8.4814453125, 9.12890625, 9.7763671875, 10.423828125, 11.0712890625, 11.71875, 12.3662109375, 13.013671875, 13.6611328125, 14.30859375, 14.9560546875, 15.603515625, 16.2509765625, 16.8984375, 17.5458984375, 18.193359375, 18.8408203125, 19.48828125, 20.1357421875, 20.783203125, 21.4306640625, 22.078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 4.0, 7.0, 11.0, 12.0, 11.0, 21.0, 19.0, 38.0, 29.0, 47.0, 47.0, 53.0, 92.0, 109.0, 143.0, 186.0, 240.0, 334.0, 910.0, 463.0, 286.0, 211.0, 164.0, 132.0, 92.0, 92.0, 79.0, 44.0, 42.0, 33.0, 29.0, 19.0, 22.0, 14.0, 7.0, 10.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4765625, -5.2979736328125, -5.119384765625, -4.9407958984375, -4.76220703125, -4.5836181640625, -4.405029296875, -4.2264404296875, -4.0478515625, -3.8692626953125, -3.690673828125, -3.5120849609375, -3.33349609375, -3.1549072265625, -2.976318359375, -2.7977294921875, -2.619140625, -2.4405517578125, -2.261962890625, -2.0833740234375, -1.90478515625, -1.7261962890625, -1.547607421875, -1.3690185546875, -1.1904296875, -1.0118408203125, -0.833251953125, -0.6546630859375, -0.47607421875, -0.2974853515625, -0.118896484375, 0.0596923828125, 0.23828125, 0.4168701171875, 0.595458984375, 0.7740478515625, 0.95263671875, 1.1312255859375, 1.309814453125, 1.4884033203125, 1.6669921875, 1.8455810546875, 2.024169921875, 2.2027587890625, 2.38134765625, 2.5599365234375, 2.738525390625, 2.9171142578125, 3.095703125, 3.2742919921875, 3.452880859375, 3.6314697265625, 3.81005859375, 3.9886474609375, 4.167236328125, 4.3458251953125, 4.5244140625, 4.7030029296875, 4.881591796875, 5.0601806640625, 5.23876953125, 5.4173583984375, 5.595947265625, 5.7745361328125, 5.953125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 13.0, 14.0, 19.0, 25.0, 42.0, 74.0, 91.0, 97.0, 95.0, 106.0, 107.0, 76.0, 64.0, 48.0, 24.0, 31.0, 17.0, 18.0, 10.0, 3.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.60264587402344, -37.04033279418945, -35.4780158996582, -33.91570281982422, -32.35338592529297, -30.791072845458984, -29.228757858276367, -27.66644287109375, -26.104129791259766, -24.54181480407715, -22.97949981689453, -21.417186737060547, -19.85487174987793, -18.292556762695312, -16.730241775512695, -15.167927742004395, -13.605611801147461, -12.043296813964844, -10.480982780456543, -8.918667793273926, -7.356353282928467, -5.794038772583008, -4.231723785400391, -2.66940975189209, -1.1070947647094727, 0.4552198648452759, 2.0175344944000244, 3.5798492431640625, 5.1421637535095215, 6.7044782638549805, 8.266793251037598, 9.829107284545898, 11.391422271728516, 12.953737258911133, 14.516051292419434, 16.078365325927734, 17.64068031311035, 19.20299530029297, 20.765310287475586, 22.327625274658203, 23.889938354492188, 25.452253341674805, 27.014568328857422, 28.576881408691406, 30.139196395874023, 31.70151138305664, 33.263824462890625, 34.826141357421875, 36.388458251953125, 37.95077133178711, 39.51308822631836, 41.075401306152344, 42.637718200683594, 44.20003128051758, 45.76234436035156, 47.32466125488281, 48.8869743347168, 50.44928741455078, 52.01160430908203, 53.573917388916016, 55.136234283447266, 56.69854736328125, 58.2608642578125, 59.823177337646484, 61.38549041748047]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 7.0, 8.0, 11.0, 18.0, 23.0, 26.0, 20.0, 24.0, 23.0, 27.0, 36.0, 37.0, 40.0, 48.0, 30.0, 43.0, 45.0, 41.0, 43.0, 41.0, 36.0, 53.0, 48.0, 41.0, 25.0, 31.0, 31.0, 18.0, 15.0, 15.0, 17.0, 11.0, 9.0, 10.0, 9.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-28.839374542236328, -27.942052841186523, -27.04473114013672, -26.147411346435547, -25.250089645385742, -24.352767944335938, -23.455446243286133, -22.558124542236328, -21.660802841186523, -20.76348114013672, -19.866159439086914, -18.96883773803711, -18.071517944335938, -17.174196243286133, -16.276874542236328, -15.379552841186523, -14.482232093811035, -13.58491039276123, -12.687589645385742, -11.790267944335938, -10.892946243286133, -9.995624542236328, -9.09830379486084, -8.200982093811035, -7.303660869598389, -6.406339645385742, -5.5090179443359375, -4.611696720123291, -3.7143752574920654, -2.81705379486084, -1.9197325706481934, -1.0224108695983887, -0.1250896453857422, 0.7722317576408386, 1.6695531606674194, 2.5668745040893555, 3.464195966720581, 4.361517429351807, 5.258838653564453, 6.156160354614258, 7.053481578826904, 7.950802803039551, 8.848124504089355, 9.745445251464844, 10.642766952514648, 11.540088653564453, 12.437410354614258, 13.334732055664062, 14.23205280303955, 15.129374504089355, 16.026695251464844, 16.92401695251465, 17.821338653564453, 18.718660354614258, 19.615982055664062, 20.513301849365234, 21.41062355041504, 22.307945251464844, 23.20526695251465, 24.102588653564453, 24.999908447265625, 25.89723014831543, 26.794551849365234, 27.69187355041504, 28.589195251464844]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 14.0, 3.0, 13.0, 14.0, 21.0, 21.0, 37.0, 48.0, 74.0, 128.0, 167.0, 282.0, 450.0, 691.0, 1154.0, 2068.0, 3930.0, 8130.0, 19257.0, 51896.0, 172421.0, 447539.0, 229764.0, 66582.0, 23472.0, 9842.0, 4600.0, 2316.0, 1429.0, 795.0, 502.0, 283.0, 210.0, 129.0, 85.0, 69.0, 37.0, 27.0, 23.0, 8.0, 8.0, 6.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-28.296875, -27.42919921875, -26.5615234375, -25.69384765625, -24.826171875, -23.95849609375, -23.0908203125, -22.22314453125, -21.35546875, -20.48779296875, -19.6201171875, -18.75244140625, -17.884765625, -17.01708984375, -16.1494140625, -15.28173828125, -14.4140625, -13.54638671875, -12.6787109375, -11.81103515625, -10.943359375, -10.07568359375, -9.2080078125, -8.34033203125, -7.47265625, -6.60498046875, -5.7373046875, -4.86962890625, -4.001953125, -3.13427734375, -2.2666015625, -1.39892578125, -0.53125, 0.33642578125, 1.2041015625, 2.07177734375, 2.939453125, 3.80712890625, 4.6748046875, 5.54248046875, 6.41015625, 7.27783203125, 8.1455078125, 9.01318359375, 9.880859375, 10.74853515625, 11.6162109375, 12.48388671875, 13.3515625, 14.21923828125, 15.0869140625, 15.95458984375, 16.822265625, 17.68994140625, 18.5576171875, 19.42529296875, 20.29296875, 21.16064453125, 22.0283203125, 22.89599609375, 23.763671875, 24.63134765625, 25.4990234375, 26.36669921875, 27.234375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 6.0, 13.0, 15.0, 14.0, 24.0, 27.0, 40.0, 58.0, 72.0, 74.0, 93.0, 94.0, 90.0, 85.0, 59.0, 53.0, 33.0, 29.0, 24.0, 22.0, 17.0, 10.0, 3.0, 10.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.691131591796875, -2.60882568359375, -2.526519775390625, -2.4442138671875, -2.361907958984375, -2.27960205078125, -2.197296142578125, -2.114990234375, -2.032684326171875, -1.95037841796875, -1.868072509765625, -1.7857666015625, -1.703460693359375, -1.62115478515625, -1.538848876953125, -1.45654296875, -1.374237060546875, -1.29193115234375, -1.209625244140625, -1.1273193359375, -1.045013427734375, -0.96270751953125, -0.880401611328125, -0.798095703125, -0.715789794921875, -0.63348388671875, -0.551177978515625, -0.4688720703125, -0.386566162109375, -0.30426025390625, -0.221954345703125, -0.1396484375, -0.057342529296875, 0.02496337890625, 0.107269287109375, 0.1895751953125, 0.271881103515625, 0.35418701171875, 0.436492919921875, 0.518798828125, 0.601104736328125, 0.68341064453125, 0.765716552734375, 0.8480224609375, 0.930328369140625, 1.01263427734375, 1.094940185546875, 1.17724609375, 1.259552001953125, 1.34185791015625, 1.424163818359375, 1.5064697265625, 1.588775634765625, 1.67108154296875, 1.753387451171875, 1.835693359375, 1.917999267578125, 2.00030517578125, 2.082611083984375, 2.1649169921875, 2.247222900390625, 2.32952880859375, 2.411834716796875, 2.494140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 5.0, 19.0, 23.0, 43.0, 65.0, 110.0, 171.0, 324.0, 553.0, 1061.0, 1866.0, 3534.0, 7058.0, 15404.0, 45879.0, 257878.0, 564194.0, 103980.0, 25249.0, 10286.0, 4982.0, 2546.0, 1390.0, 818.0, 465.0, 253.0, 134.0, 75.0, 54.0, 36.0, 30.0, 14.0, 9.0, 9.0, 7.0, 7.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.296875, -29.295654296875, -28.29443359375, -27.293212890625, -26.2919921875, -25.290771484375, -24.28955078125, -23.288330078125, -22.287109375, -21.285888671875, -20.28466796875, -19.283447265625, -18.2822265625, -17.281005859375, -16.27978515625, -15.278564453125, -14.27734375, -13.276123046875, -12.27490234375, -11.273681640625, -10.2724609375, -9.271240234375, -8.27001953125, -7.268798828125, -6.267578125, -5.266357421875, -4.26513671875, -3.263916015625, -2.2626953125, -1.261474609375, -0.26025390625, 0.740966796875, 1.7421875, 2.743408203125, 3.74462890625, 4.745849609375, 5.7470703125, 6.748291015625, 7.74951171875, 8.750732421875, 9.751953125, 10.753173828125, 11.75439453125, 12.755615234375, 13.7568359375, 14.758056640625, 15.75927734375, 16.760498046875, 17.76171875, 18.762939453125, 19.76416015625, 20.765380859375, 21.7666015625, 22.767822265625, 23.76904296875, 24.770263671875, 25.771484375, 26.772705078125, 27.77392578125, 28.775146484375, 29.7763671875, 30.777587890625, 31.77880859375, 32.780029296875, 33.78125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 6.0, 5.0, 9.0, 16.0, 14.0, 16.0, 16.0, 23.0, 25.0, 41.0, 36.0, 32.0, 43.0, 36.0, 42.0, 49.0, 60.0, 50.0, 28.0, 45.0, 33.0, 48.0, 46.0, 55.0, 32.0, 27.0, 27.0, 30.0, 13.0, 16.0, 14.0, 7.0, 11.0, 7.0, 10.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.2578125, -14.7589111328125, -14.260009765625, -13.7611083984375, -13.26220703125, -12.7633056640625, -12.264404296875, -11.7655029296875, -11.2666015625, -10.7677001953125, -10.268798828125, -9.7698974609375, -9.27099609375, -8.7720947265625, -8.273193359375, -7.7742919921875, -7.275390625, -6.7764892578125, -6.277587890625, -5.7786865234375, -5.27978515625, -4.7808837890625, -4.281982421875, -3.7830810546875, -3.2841796875, -2.7852783203125, -2.286376953125, -1.7874755859375, -1.28857421875, -0.7896728515625, -0.290771484375, 0.2081298828125, 0.70703125, 1.2059326171875, 1.704833984375, 2.2037353515625, 2.70263671875, 3.2015380859375, 3.700439453125, 4.1993408203125, 4.6982421875, 5.1971435546875, 5.696044921875, 6.1949462890625, 6.69384765625, 7.1927490234375, 7.691650390625, 8.1905517578125, 8.689453125, 9.1883544921875, 9.687255859375, 10.1861572265625, 10.68505859375, 11.1839599609375, 11.682861328125, 12.1817626953125, 12.6806640625, 13.1795654296875, 13.678466796875, 14.1773681640625, 14.67626953125, 15.1751708984375, 15.674072265625, 16.1729736328125, 16.671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 6.0, 12.0, 13.0, 17.0, 33.0, 27.0, 66.0, 81.0, 172.0, 258.0, 482.0, 1001.0, 2461.0, 8422.0, 48094.0, 822744.0, 143427.0, 14410.0, 3862.0, 1460.0, 621.0, 337.0, 205.0, 119.0, 60.0, 38.0, 22.0, 25.0, 16.0, 13.0, 7.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0], "bins": [-72.9375, -70.8349609375, -68.732421875, -66.6298828125, -64.52734375, -62.4248046875, -60.322265625, -58.2197265625, -56.1171875, -54.0146484375, -51.912109375, -49.8095703125, -47.70703125, -45.6044921875, -43.501953125, -41.3994140625, -39.296875, -37.1943359375, -35.091796875, -32.9892578125, -30.88671875, -28.7841796875, -26.681640625, -24.5791015625, -22.4765625, -20.3740234375, -18.271484375, -16.1689453125, -14.06640625, -11.9638671875, -9.861328125, -7.7587890625, -5.65625, -3.5537109375, -1.451171875, 0.6513671875, 2.75390625, 4.8564453125, 6.958984375, 9.0615234375, 11.1640625, 13.2666015625, 15.369140625, 17.4716796875, 19.57421875, 21.6767578125, 23.779296875, 25.8818359375, 27.984375, 30.0869140625, 32.189453125, 34.2919921875, 36.39453125, 38.4970703125, 40.599609375, 42.7021484375, 44.8046875, 46.9072265625, 49.009765625, 51.1123046875, 53.21484375, 55.3173828125, 57.419921875, 59.5224609375, 61.625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 11.0, 14.0, 9.0, 13.0, 16.0, 32.0, 58.0, 69.0, 135.0, 192.0, 153.0, 115.0, 65.0, 41.0, 26.0, 18.0, 6.0, 8.0, 5.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00525665283203125, -0.005105137825012207, -0.004953622817993164, -0.004802107810974121, -0.004650592803955078, -0.004499077796936035, -0.004347562789916992, -0.004196047782897949, -0.004044532775878906, -0.0038930177688598633, -0.0037415027618408203, -0.0035899877548217773, -0.0034384727478027344, -0.0032869577407836914, -0.0031354427337646484, -0.0029839277267456055, -0.0028324127197265625, -0.0026808977127075195, -0.0025293827056884766, -0.0023778676986694336, -0.0022263526916503906, -0.0020748376846313477, -0.0019233226776123047, -0.0017718076705932617, -0.0016202926635742188, -0.0014687776565551758, -0.0013172626495361328, -0.0011657476425170898, -0.0010142326354980469, -0.0008627176284790039, -0.0007112026214599609, -0.000559687614440918, -0.000408172607421875, -0.00025665760040283203, -0.00010514259338378906, 4.6372413635253906e-05, 0.00019788742065429688, 0.00034940242767333984, 0.0005009174346923828, 0.0006524324417114258, 0.0008039474487304688, 0.0009554624557495117, 0.0011069774627685547, 0.0012584924697875977, 0.0014100074768066406, 0.0015615224838256836, 0.0017130374908447266, 0.0018645524978637695, 0.0020160675048828125, 0.0021675825119018555, 0.0023190975189208984, 0.0024706125259399414, 0.0026221275329589844, 0.0027736425399780273, 0.0029251575469970703, 0.0030766725540161133, 0.0032281875610351562, 0.0033797025680541992, 0.003531217575073242, 0.003682732582092285, 0.003834247589111328, 0.003985762596130371, 0.004137277603149414, 0.004288792610168457, 0.0044403076171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 8.0, 2.0, 20.0, 14.0, 29.0, 13.0, 51.0, 91.0, 182.0, 327.0, 820.0, 2665.0, 14653.0, 484495.0, 525744.0, 15086.0, 2786.0, 814.0, 351.0, 167.0, 88.0, 47.0, 36.0, 25.0, 14.0, 9.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.15625, -59.93701171875, -57.7177734375, -55.49853515625, -53.279296875, -51.06005859375, -48.8408203125, -46.62158203125, -44.40234375, -42.18310546875, -39.9638671875, -37.74462890625, -35.525390625, -33.30615234375, -31.0869140625, -28.86767578125, -26.6484375, -24.42919921875, -22.2099609375, -19.99072265625, -17.771484375, -15.55224609375, -13.3330078125, -11.11376953125, -8.89453125, -6.67529296875, -4.4560546875, -2.23681640625, -0.017578125, 2.20166015625, 4.4208984375, 6.64013671875, 8.859375, 11.07861328125, 13.2978515625, 15.51708984375, 17.736328125, 19.95556640625, 22.1748046875, 24.39404296875, 26.61328125, 28.83251953125, 31.0517578125, 33.27099609375, 35.490234375, 37.70947265625, 39.9287109375, 42.14794921875, 44.3671875, 46.58642578125, 48.8056640625, 51.02490234375, 53.244140625, 55.46337890625, 57.6826171875, 59.90185546875, 62.12109375, 64.34033203125, 66.5595703125, 68.77880859375, 70.998046875, 73.21728515625, 75.4365234375, 77.65576171875, 79.875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 16.0, 16.0, 39.0, 85.0, 148.0, 195.0, 207.0, 145.0, 75.0, 28.0, 18.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.3125, -31.1923828125, -30.072265625, -28.9521484375, -27.83203125, -26.7119140625, -25.591796875, -24.4716796875, -23.3515625, -22.2314453125, -21.111328125, -19.9912109375, -18.87109375, -17.7509765625, -16.630859375, -15.5107421875, -14.390625, -13.2705078125, -12.150390625, -11.0302734375, -9.91015625, -8.7900390625, -7.669921875, -6.5498046875, -5.4296875, -4.3095703125, -3.189453125, -2.0693359375, -0.94921875, 0.1708984375, 1.291015625, 2.4111328125, 3.53125, 4.6513671875, 5.771484375, 6.8916015625, 8.01171875, 9.1318359375, 10.251953125, 11.3720703125, 12.4921875, 13.6123046875, 14.732421875, 15.8525390625, 16.97265625, 18.0927734375, 19.212890625, 20.3330078125, 21.453125, 22.5732421875, 23.693359375, 24.8134765625, 25.93359375, 27.0537109375, 28.173828125, 29.2939453125, 30.4140625, 31.5341796875, 32.654296875, 33.7744140625, 34.89453125, 36.0146484375, 37.134765625, 38.2548828125, 39.375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 5.0, 4.0, 7.0, 11.0, 13.0, 35.0, 55.0, 103.0, 223.0, 246.0, 149.0, 59.0, 20.0, 17.0, 8.0, 12.0, 3.0, 7.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-394.4444274902344, -383.82470703125, -373.2049560546875, -362.5852355957031, -351.9654846191406, -341.34576416015625, -330.72601318359375, -320.1062927246094, -309.486572265625, -298.8668518066406, -288.2471008300781, -277.62738037109375, -267.00762939453125, -256.3879089355469, -245.76817321777344, -235.1484375, -224.52870178222656, -213.90896606445312, -203.2892303466797, -192.66949462890625, -182.04977416992188, -171.43003845214844, -160.810302734375, -150.19058227539062, -139.57083129882812, -128.9510955810547, -118.33136749267578, -107.71163177490234, -97.09190368652344, -86.47216796875, -75.85243225097656, -65.23270416259766, -54.61297607421875, -43.99324417114258, -33.373512268066406, -22.75377655029297, -12.134044647216797, -1.514312744140625, 9.105422973632812, 19.72515106201172, 30.344886779785156, 40.96461868286133, 51.5843505859375, 62.20408630371094, 72.82382202148438, 83.44355010986328, 94.06328582763672, 104.68301391601562, 115.30274963378906, 125.9224853515625, 136.54222106933594, 147.16195678710938, 157.78167724609375, 168.4014129638672, 179.02114868164062, 189.640869140625, 200.2606201171875, 210.88035583496094, 221.50009155273438, 232.11981201171875, 242.7395477294922, 253.35928344726562, 263.97900390625, 274.5987548828125, 285.2184753417969]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 2.0, 8.0, 7.0, 5.0, 11.0, 9.0, 31.0, 35.0, 59.0, 104.0, 140.0, 171.0, 135.0, 91.0, 70.0, 35.0, 18.0, 11.0, 11.0, 6.0, 9.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.5455627441406, -280.0285339355469, -270.511474609375, -260.99444580078125, -251.4774169921875, -241.96038818359375, -232.44334411621094, -222.92630004882812, -213.40927124023438, -203.89224243164062, -194.3751983642578, -184.858154296875, -175.34112548828125, -165.8240966796875, -156.3070526123047, -146.79000854492188, -137.27297973632812, -127.75594329833984, -118.23890686035156, -108.72187042236328, -99.204833984375, -89.68779754638672, -80.17076110839844, -70.65372467041016, -61.136688232421875, -51.619651794433594, -42.10261535644531, -32.58557891845703, -23.06854248046875, -13.551506042480469, -4.0344696044921875, 5.482566833496094, 14.999603271484375, 24.516639709472656, 34.03367614746094, 43.55071258544922, 53.0677490234375, 62.58478546142578, 72.10182189941406, 81.61885833740234, 91.13589477539062, 100.6529312133789, 110.16996765136719, 119.68700408935547, 129.20404052734375, 138.7210693359375, 148.2381134033203, 157.75515747070312, 167.27218627929688, 176.78921508789062, 186.30625915527344, 195.82330322265625, 205.34033203125, 214.85736083984375, 224.37440490722656, 233.89144897460938, 243.40847778320312, 252.92550659179688, 262.44256591796875, 271.9595947265625, 281.47662353515625, 290.99365234375, 300.51068115234375, 310.0277404785156, 319.5447692871094]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 9.0, 12.0, 17.0, 16.0, 27.0, 29.0, 34.0, 58.0, 66.0, 117.0, 130.0, 231.0, 312.0, 571.0, 1040.0, 1726.0, 3427.0, 7012.0, 17711.0, 55880.0, 322847.0, 3562003.0, 164426.0, 35870.0, 11529.0, 4567.0, 2101.0, 1008.0, 593.0, 333.0, 220.0, 119.0, 76.0, 44.0, 38.0, 23.0, 24.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.4375, -67.1484375, -64.859375, -62.5703125, -60.28125, -57.9921875, -55.703125, -53.4140625, -51.125, -48.8359375, -46.546875, -44.2578125, -41.96875, -39.6796875, -37.390625, -35.1015625, -32.8125, -30.5234375, -28.234375, -25.9453125, -23.65625, -21.3671875, -19.078125, -16.7890625, -14.5, -12.2109375, -9.921875, -7.6328125, -5.34375, -3.0546875, -0.765625, 1.5234375, 3.8125, 6.1015625, 8.390625, 10.6796875, 12.96875, 15.2578125, 17.546875, 19.8359375, 22.125, 24.4140625, 26.703125, 28.9921875, 31.28125, 33.5703125, 35.859375, 38.1484375, 40.4375, 42.7265625, 45.015625, 47.3046875, 49.59375, 51.8828125, 54.171875, 56.4609375, 58.75, 61.0390625, 63.328125, 65.6171875, 67.90625, 70.1953125, 72.484375, 74.7734375, 77.0625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 1.0, 4.0, 5.0, 3.0, 6.0, 7.0, 12.0, 23.0, 22.0, 28.0, 32.0, 59.0, 62.0, 69.0, 87.0, 91.0, 90.0, 68.0, 69.0, 56.0, 52.0, 38.0, 23.0, 18.0, 18.0, 8.0, 6.0, 15.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.32421875, -3.23309326171875, -3.1419677734375, -3.05084228515625, -2.959716796875, -2.86859130859375, -2.7774658203125, -2.68634033203125, -2.59521484375, -2.50408935546875, -2.4129638671875, -2.32183837890625, -2.230712890625, -2.13958740234375, -2.0484619140625, -1.95733642578125, -1.8662109375, -1.77508544921875, -1.6839599609375, -1.59283447265625, -1.501708984375, -1.41058349609375, -1.3194580078125, -1.22833251953125, -1.13720703125, -1.04608154296875, -0.9549560546875, -0.86383056640625, -0.772705078125, -0.68157958984375, -0.5904541015625, -0.49932861328125, -0.408203125, -0.31707763671875, -0.2259521484375, -0.13482666015625, -0.043701171875, 0.04742431640625, 0.1385498046875, 0.22967529296875, 0.32080078125, 0.41192626953125, 0.5030517578125, 0.59417724609375, 0.685302734375, 0.77642822265625, 0.8675537109375, 0.95867919921875, 1.0498046875, 1.14093017578125, 1.2320556640625, 1.32318115234375, 1.414306640625, 1.50543212890625, 1.5965576171875, 1.68768310546875, 1.77880859375, 1.86993408203125, 1.9610595703125, 2.05218505859375, 2.143310546875, 2.23443603515625, 2.3255615234375, 2.41668701171875, 2.5078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 10.0, 12.0, 17.0, 19.0, 44.0, 83.0, 184.0, 305.0, 738.0, 1849.0, 6324.0, 31292.0, 249216.0, 3414587.0, 429314.0, 47003.0, 9105.0, 2504.0, 845.0, 407.0, 178.0, 87.0, 57.0, 48.0, 20.0, 5.0, 11.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.9375, -46.7724609375, -44.607421875, -42.4423828125, -40.27734375, -38.1123046875, -35.947265625, -33.7822265625, -31.6171875, -29.4521484375, -27.287109375, -25.1220703125, -22.95703125, -20.7919921875, -18.626953125, -16.4619140625, -14.296875, -12.1318359375, -9.966796875, -7.8017578125, -5.63671875, -3.4716796875, -1.306640625, 0.8583984375, 3.0234375, 5.1884765625, 7.353515625, 9.5185546875, 11.68359375, 13.8486328125, 16.013671875, 18.1787109375, 20.34375, 22.5087890625, 24.673828125, 26.8388671875, 29.00390625, 31.1689453125, 33.333984375, 35.4990234375, 37.6640625, 39.8291015625, 41.994140625, 44.1591796875, 46.32421875, 48.4892578125, 50.654296875, 52.8193359375, 54.984375, 57.1494140625, 59.314453125, 61.4794921875, 63.64453125, 65.8095703125, 67.974609375, 70.1396484375, 72.3046875, 74.4697265625, 76.634765625, 78.7998046875, 80.96484375, 83.1298828125, 85.294921875, 87.4599609375, 89.625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 12.0, 10.0, 15.0, 21.0, 34.0, 27.0, 60.0, 72.0, 91.0, 169.0, 257.0, 342.0, 791.0, 977.0, 391.0, 211.0, 152.0, 110.0, 84.0, 67.0, 35.0, 27.0, 26.0, 26.0, 14.0, 12.0, 5.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.640625, -6.4266357421875, -6.212646484375, -5.9986572265625, -5.78466796875, -5.5706787109375, -5.356689453125, -5.1427001953125, -4.9287109375, -4.7147216796875, -4.500732421875, -4.2867431640625, -4.07275390625, -3.8587646484375, -3.644775390625, -3.4307861328125, -3.216796875, -3.0028076171875, -2.788818359375, -2.5748291015625, -2.36083984375, -2.1468505859375, -1.932861328125, -1.7188720703125, -1.5048828125, -1.2908935546875, -1.076904296875, -0.8629150390625, -0.64892578125, -0.4349365234375, -0.220947265625, -0.0069580078125, 0.20703125, 0.4210205078125, 0.635009765625, 0.8489990234375, 1.06298828125, 1.2769775390625, 1.490966796875, 1.7049560546875, 1.9189453125, 2.1329345703125, 2.346923828125, 2.5609130859375, 2.77490234375, 2.9888916015625, 3.202880859375, 3.4168701171875, 3.630859375, 3.8448486328125, 4.058837890625, 4.2728271484375, 4.48681640625, 4.7008056640625, 4.914794921875, 5.1287841796875, 5.3427734375, 5.5567626953125, 5.770751953125, 5.9847412109375, 6.19873046875, 6.4127197265625, 6.626708984375, 6.8406982421875, 7.0546875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 3.0, 12.0, 11.0, 20.0, 42.0, 111.0, 139.0, 193.0, 199.0, 108.0, 82.0, 38.0, 13.0, 10.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-89.86197662353516, -87.64466857910156, -85.4273681640625, -83.2100601196289, -80.99275970458984, -78.77545166015625, -76.55815124511719, -74.3408432006836, -72.12353515625, -69.9062271118164, -67.68892669677734, -65.47161865234375, -63.25431823730469, -61.037010192871094, -58.819705963134766, -56.60240173339844, -54.385101318359375, -52.16779708862305, -49.95049285888672, -47.73318862915039, -45.51588439941406, -43.29857635498047, -41.08127212524414, -38.86396789550781, -36.646663665771484, -34.429359436035156, -32.21205520629883, -29.994749069213867, -27.77744483947754, -25.56014060974121, -23.34283447265625, -21.125530242919922, -18.90822982788086, -16.69092559814453, -14.473620414733887, -12.256315231323242, -10.039011001586914, -7.821706771850586, -5.604401588439941, -3.387096405029297, -1.1697921752929688, 1.0475125312805176, 3.264817237854004, 5.48212194442749, 7.699426651000977, 9.916730880737305, 12.13403606414795, 14.351341247558594, 16.568645477294922, 18.78594970703125, 21.003253936767578, 23.22056007385254, 25.437864303588867, 27.655168533325195, 29.872474670410156, 32.089778900146484, 34.30708312988281, 36.52438735961914, 38.74169158935547, 40.9589958190918, 43.176300048828125, 45.39360809326172, 47.61091232299805, 49.828216552734375, 52.0455207824707]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 11.0, 14.0, 18.0, 21.0, 21.0, 35.0, 45.0, 52.0, 47.0, 63.0, 64.0, 70.0, 72.0, 71.0, 68.0, 52.0, 58.0, 39.0, 30.0, 30.0, 13.0, 21.0, 18.0, 12.0, 11.0, 8.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.05409240722656, -38.81858444213867, -37.583072662353516, -36.347564697265625, -35.112056732177734, -33.87654495239258, -32.64103698730469, -31.405527114868164, -30.17001724243164, -28.934507369995117, -27.698999404907227, -26.463489532470703, -25.22797966003418, -23.992469787597656, -22.756961822509766, -21.521451950073242, -20.28594398498535, -19.050434112548828, -17.814926147460938, -16.579416275024414, -15.34390640258789, -14.108397483825684, -12.872888565063477, -11.637378692626953, -10.401869773864746, -9.166360855102539, -7.930850982666016, -6.695342063903809, -5.459832668304443, -4.224323272705078, -2.988814353942871, -1.7533044815063477, -0.5177955627441406, 0.7177137136459351, 1.9532229900360107, 3.188732147216797, 4.424241542816162, 5.659750938415527, 6.895259857177734, 8.130769729614258, 9.366278648376465, 10.601787567138672, 11.837297439575195, 13.072806358337402, 14.30831527709961, 15.543825149536133, 16.779335021972656, 18.014842987060547, 19.25035285949707, 20.485862731933594, 21.721370697021484, 22.956880569458008, 24.19239044189453, 25.427898406982422, 26.663408279418945, 27.89891815185547, 29.13442611694336, 30.369935989379883, 31.605443954467773, 32.8409538269043, 34.07646179199219, 35.311973571777344, 36.547481536865234, 37.782989501953125, 39.01850128173828]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 5.0, 25.0, 40.0, 46.0, 90.0, 120.0, 238.0, 444.0, 757.0, 1428.0, 2633.0, 5027.0, 10306.0, 21847.0, 49668.0, 119740.0, 280112.0, 309627.0, 140089.0, 57074.0, 25276.0, 11755.0, 5737.0, 2960.0, 1543.0, 847.0, 442.0, 294.0, 151.0, 94.0, 46.0, 34.0, 27.0, 6.0, 8.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.359375, -22.693603515625, -22.02783203125, -21.362060546875, -20.6962890625, -20.030517578125, -19.36474609375, -18.698974609375, -18.033203125, -17.367431640625, -16.70166015625, -16.035888671875, -15.3701171875, -14.704345703125, -14.03857421875, -13.372802734375, -12.70703125, -12.041259765625, -11.37548828125, -10.709716796875, -10.0439453125, -9.378173828125, -8.71240234375, -8.046630859375, -7.380859375, -6.715087890625, -6.04931640625, -5.383544921875, -4.7177734375, -4.052001953125, -3.38623046875, -2.720458984375, -2.0546875, -1.388916015625, -0.72314453125, -0.057373046875, 0.6083984375, 1.274169921875, 1.93994140625, 2.605712890625, 3.271484375, 3.937255859375, 4.60302734375, 5.268798828125, 5.9345703125, 6.600341796875, 7.26611328125, 7.931884765625, 8.59765625, 9.263427734375, 9.92919921875, 10.594970703125, 11.2607421875, 11.926513671875, 12.59228515625, 13.258056640625, 13.923828125, 14.589599609375, 15.25537109375, 15.921142578125, 16.5869140625, 17.252685546875, 17.91845703125, 18.584228515625, 19.25]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 2.0, 8.0, 5.0, 11.0, 12.0, 15.0, 21.0, 16.0, 14.0, 18.0, 36.0, 25.0, 41.0, 40.0, 44.0, 46.0, 54.0, 50.0, 42.0, 50.0, 64.0, 45.0, 40.0, 44.0, 37.0, 37.0, 25.0, 17.0, 23.0, 25.0, 13.0, 17.0, 12.0, 10.0, 7.0, 7.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.9013671875, -1.8409271240234375, -1.780487060546875, -1.7200469970703125, -1.65960693359375, -1.5991668701171875, -1.538726806640625, -1.4782867431640625, -1.4178466796875, -1.3574066162109375, -1.296966552734375, -1.2365264892578125, -1.17608642578125, -1.1156463623046875, -1.055206298828125, -0.9947662353515625, -0.934326171875, -0.8738861083984375, -0.813446044921875, -0.7530059814453125, -0.69256591796875, -0.6321258544921875, -0.571685791015625, -0.5112457275390625, -0.4508056640625, -0.3903656005859375, -0.329925537109375, -0.2694854736328125, -0.20904541015625, -0.1486053466796875, -0.088165283203125, -0.0277252197265625, 0.03271484375, 0.0931549072265625, 0.153594970703125, 0.2140350341796875, 0.27447509765625, 0.3349151611328125, 0.395355224609375, 0.4557952880859375, 0.5162353515625, 0.5766754150390625, 0.637115478515625, 0.6975555419921875, 0.75799560546875, 0.8184356689453125, 0.878875732421875, 0.9393157958984375, 0.999755859375, 1.0601959228515625, 1.120635986328125, 1.1810760498046875, 1.24151611328125, 1.3019561767578125, 1.362396240234375, 1.4228363037109375, 1.4832763671875, 1.5437164306640625, 1.604156494140625, 1.6645965576171875, 1.72503662109375, 1.7854766845703125, 1.845916748046875, 1.9063568115234375, 1.966796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 11.0, 15.0, 28.0, 75.0, 157.0, 430.0, 1347.0, 5086.0, 24362.0, 160063.0, 662916.0, 161562.0, 25059.0, 5258.0, 1374.0, 454.0, 164.0, 90.0, 40.0, 22.0, 14.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.03125, -29.90283203125, -28.7744140625, -27.64599609375, -26.517578125, -25.38916015625, -24.2607421875, -23.13232421875, -22.00390625, -20.87548828125, -19.7470703125, -18.61865234375, -17.490234375, -16.36181640625, -15.2333984375, -14.10498046875, -12.9765625, -11.84814453125, -10.7197265625, -9.59130859375, -8.462890625, -7.33447265625, -6.2060546875, -5.07763671875, -3.94921875, -2.82080078125, -1.6923828125, -0.56396484375, 0.564453125, 1.69287109375, 2.8212890625, 3.94970703125, 5.078125, 6.20654296875, 7.3349609375, 8.46337890625, 9.591796875, 10.72021484375, 11.8486328125, 12.97705078125, 14.10546875, 15.23388671875, 16.3623046875, 17.49072265625, 18.619140625, 19.74755859375, 20.8759765625, 22.00439453125, 23.1328125, 24.26123046875, 25.3896484375, 26.51806640625, 27.646484375, 28.77490234375, 29.9033203125, 31.03173828125, 32.16015625, 33.28857421875, 34.4169921875, 35.54541015625, 36.673828125, 37.80224609375, 38.9306640625, 40.05908203125, 41.1875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 9.0, 13.0, 12.0, 13.0, 15.0, 25.0, 18.0, 16.0, 20.0, 29.0, 30.0, 28.0, 27.0, 37.0, 26.0, 34.0, 37.0, 41.0, 54.0, 47.0, 39.0, 44.0, 37.0, 37.0, 38.0, 26.0, 29.0, 24.0, 23.0, 22.0, 23.0, 14.0, 15.0, 18.0, 11.0, 11.0, 8.0, 6.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-10.625, -10.297119140625, -9.96923828125, -9.641357421875, -9.3134765625, -8.985595703125, -8.65771484375, -8.329833984375, -8.001953125, -7.674072265625, -7.34619140625, -7.018310546875, -6.6904296875, -6.362548828125, -6.03466796875, -5.706787109375, -5.37890625, -5.051025390625, -4.72314453125, -4.395263671875, -4.0673828125, -3.739501953125, -3.41162109375, -3.083740234375, -2.755859375, -2.427978515625, -2.10009765625, -1.772216796875, -1.4443359375, -1.116455078125, -0.78857421875, -0.460693359375, -0.1328125, 0.195068359375, 0.52294921875, 0.850830078125, 1.1787109375, 1.506591796875, 1.83447265625, 2.162353515625, 2.490234375, 2.818115234375, 3.14599609375, 3.473876953125, 3.8017578125, 4.129638671875, 4.45751953125, 4.785400390625, 5.11328125, 5.441162109375, 5.76904296875, 6.096923828125, 6.4248046875, 6.752685546875, 7.08056640625, 7.408447265625, 7.736328125, 8.064208984375, 8.39208984375, 8.719970703125, 9.0478515625, 9.375732421875, 9.70361328125, 10.031494140625, 10.359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 11.0, 14.0, 23.0, 32.0, 63.0, 167.0, 395.0, 1006.0, 2956.0, 12642.0, 105324.0, 820626.0, 89522.0, 11428.0, 2785.0, 895.0, 353.0, 138.0, 73.0, 38.0, 22.0, 21.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-87.8125, -85.9228515625, -84.033203125, -82.1435546875, -80.25390625, -78.3642578125, -76.474609375, -74.5849609375, -72.6953125, -70.8056640625, -68.916015625, -67.0263671875, -65.13671875, -63.2470703125, -61.357421875, -59.4677734375, -57.578125, -55.6884765625, -53.798828125, -51.9091796875, -50.01953125, -48.1298828125, -46.240234375, -44.3505859375, -42.4609375, -40.5712890625, -38.681640625, -36.7919921875, -34.90234375, -33.0126953125, -31.123046875, -29.2333984375, -27.34375, -25.4541015625, -23.564453125, -21.6748046875, -19.78515625, -17.8955078125, -16.005859375, -14.1162109375, -12.2265625, -10.3369140625, -8.447265625, -6.5576171875, -4.66796875, -2.7783203125, -0.888671875, 1.0009765625, 2.890625, 4.7802734375, 6.669921875, 8.5595703125, 10.44921875, 12.3388671875, 14.228515625, 16.1181640625, 18.0078125, 19.8974609375, 21.787109375, 23.6767578125, 25.56640625, 27.4560546875, 29.345703125, 31.2353515625, 33.125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 10.0, 11.0, 13.0, 17.0, 36.0, 49.0, 75.0, 124.0, 195.0, 156.0, 123.0, 67.0, 49.0, 26.0, 16.0, 5.0, 4.0, 9.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002899169921875, -0.002813190221786499, -0.002727210521697998, -0.002641230821609497, -0.002555251121520996, -0.002469271421432495, -0.002383291721343994, -0.002297312021255493, -0.002211332321166992, -0.002125352621078491, -0.0020393729209899902, -0.0019533932209014893, -0.0018674135208129883, -0.0017814338207244873, -0.0016954541206359863, -0.0016094744205474854, -0.0015234947204589844, -0.0014375150203704834, -0.0013515353202819824, -0.0012655556201934814, -0.0011795759201049805, -0.0010935962200164795, -0.0010076165199279785, -0.0009216368198394775, -0.0008356571197509766, -0.0007496774196624756, -0.0006636977195739746, -0.0005777180194854736, -0.0004917383193969727, -0.0004057586193084717, -0.0003197789192199707, -0.00023379921913146973, -0.00014781951904296875, -6.183981895446777e-05, 2.4139881134033203e-05, 0.00011011958122253418, 0.00019609928131103516, 0.00028207898139953613, 0.0003680586814880371, 0.0004540383815765381, 0.0005400180816650391, 0.00062599778175354, 0.000711977481842041, 0.000797957181930542, 0.000883936882019043, 0.0009699165821075439, 0.001055896282196045, 0.001141875982284546, 0.0012278556823730469, 0.0013138353824615479, 0.0013998150825500488, 0.0014857947826385498, 0.0015717744827270508, 0.0016577541828155518, 0.0017437338829040527, 0.0018297135829925537, 0.0019156932830810547, 0.0020016729831695557, 0.0020876526832580566, 0.0021736323833465576, 0.0022596120834350586, 0.0023455917835235596, 0.0024315714836120605, 0.0025175511837005615, 0.0026035308837890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 16.0, 14.0, 29.0, 29.0, 44.0, 64.0, 100.0, 145.0, 209.0, 330.0, 489.0, 830.0, 1295.0, 2275.0, 3955.0, 7536.0, 15347.0, 36089.0, 107575.0, 355980.0, 344240.0, 103677.0, 35351.0, 15104.0, 7298.0, 4146.0, 2367.0, 1434.0, 831.0, 552.0, 361.0, 242.0, 171.0, 121.0, 80.0, 59.0, 50.0, 28.0, 22.0, 17.0, 15.0, 11.0, 4.0, 5.0, 6.0, 0.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.015625, -17.347900390625, -16.68017578125, -16.012451171875, -15.3447265625, -14.677001953125, -14.00927734375, -13.341552734375, -12.673828125, -12.006103515625, -11.33837890625, -10.670654296875, -10.0029296875, -9.335205078125, -8.66748046875, -7.999755859375, -7.33203125, -6.664306640625, -5.99658203125, -5.328857421875, -4.6611328125, -3.993408203125, -3.32568359375, -2.657958984375, -1.990234375, -1.322509765625, -0.65478515625, 0.012939453125, 0.6806640625, 1.348388671875, 2.01611328125, 2.683837890625, 3.3515625, 4.019287109375, 4.68701171875, 5.354736328125, 6.0224609375, 6.690185546875, 7.35791015625, 8.025634765625, 8.693359375, 9.361083984375, 10.02880859375, 10.696533203125, 11.3642578125, 12.031982421875, 12.69970703125, 13.367431640625, 14.03515625, 14.702880859375, 15.37060546875, 16.038330078125, 16.7060546875, 17.373779296875, 18.04150390625, 18.709228515625, 19.376953125, 20.044677734375, 20.71240234375, 21.380126953125, 22.0478515625, 22.715576171875, 23.38330078125, 24.051025390625, 24.71875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 4.0, 10.0, 12.0, 13.0, 18.0, 18.0, 27.0, 30.0, 55.0, 76.0, 84.0, 101.0, 106.0, 95.0, 75.0, 68.0, 43.0, 34.0, 30.0, 20.0, 11.0, 8.0, 12.0, 7.0, 6.0, 5.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2109375, -11.6593017578125, -11.107666015625, -10.5560302734375, -10.00439453125, -9.4527587890625, -8.901123046875, -8.3494873046875, -7.7978515625, -7.2462158203125, -6.694580078125, -6.1429443359375, -5.59130859375, -5.0396728515625, -4.488037109375, -3.9364013671875, -3.384765625, -2.8331298828125, -2.281494140625, -1.7298583984375, -1.17822265625, -0.6265869140625, -0.074951171875, 0.4766845703125, 1.0283203125, 1.5799560546875, 2.131591796875, 2.6832275390625, 3.23486328125, 3.7864990234375, 4.338134765625, 4.8897705078125, 5.44140625, 5.9930419921875, 6.544677734375, 7.0963134765625, 7.64794921875, 8.1995849609375, 8.751220703125, 9.3028564453125, 9.8544921875, 10.4061279296875, 10.957763671875, 11.5093994140625, 12.06103515625, 12.6126708984375, 13.164306640625, 13.7159423828125, 14.267578125, 14.8192138671875, 15.370849609375, 15.9224853515625, 16.47412109375, 17.0257568359375, 17.577392578125, 18.1290283203125, 18.6806640625, 19.2322998046875, 19.783935546875, 20.3355712890625, 20.88720703125, 21.4388427734375, 21.990478515625, 22.5421142578125, 23.09375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 14.0, 29.0, 45.0, 88.0, 159.0, 206.0, 191.0, 115.0, 67.0, 33.0, 14.0, 5.0, 7.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.4331817626953, -153.01084899902344, -146.58851623535156, -140.1661834716797, -133.74383544921875, -127.3215103149414, -120.899169921875, -114.47683715820312, -108.05450439453125, -101.63217163085938, -95.2098388671875, -88.7874984741211, -82.36516571044922, -75.94283294677734, -69.52049255371094, -63.09815979003906, -56.67582702636719, -50.25349426269531, -43.83115768432617, -37.40882110595703, -30.986488342285156, -24.56415557861328, -18.14181900024414, -11.719482421875, -5.297149658203125, 1.1251850128173828, 7.547519683837891, 13.969854354858398, 20.392189025878906, 26.81452178955078, 33.23685836791992, 39.65919494628906, 46.081512451171875, 52.50384521484375, 58.92618179321289, 65.34851837158203, 71.7708511352539, 78.19318389892578, 84.61552429199219, 91.03785705566406, 97.46018981933594, 103.88252258300781, 110.30485534667969, 116.7271957397461, 123.14952850341797, 129.57186889648438, 135.99420166015625, 142.41653442382812, 148.8388671875, 155.26119995117188, 161.68353271484375, 168.10586547851562, 174.5281982421875, 180.95053100585938, 187.3728790283203, 193.7952117919922, 200.21754455566406, 206.63987731933594, 213.0622100830078, 219.4845428466797, 225.90689086914062, 232.3292236328125, 238.75155639648438, 245.17388916015625, 251.59622192382812]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 14.0, 13.0, 15.0, 19.0, 29.0, 41.0, 37.0, 50.0, 52.0, 70.0, 77.0, 100.0, 73.0, 82.0, 76.0, 52.0, 41.0, 30.0, 27.0, 19.0, 13.0, 9.0, 10.0, 5.0, 5.0, 4.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-132.16354370117188, -127.71258544921875, -123.26162719726562, -118.8106689453125, -114.35971069335938, -109.90875244140625, -105.45779418945312, -101.0068359375, -96.55587768554688, -92.10491943359375, -87.65396118164062, -83.2030029296875, -78.75204467773438, -74.30108642578125, -69.85012817382812, -65.399169921875, -60.948211669921875, -56.49725341796875, -52.046295166015625, -47.5953369140625, -43.144378662109375, -38.69342041015625, -34.242462158203125, -29.79150390625, -25.340545654296875, -20.88958740234375, -16.438629150390625, -11.9876708984375, -7.536712646484375, -3.08575439453125, 1.365203857421875, 5.816162109375, 10.267135620117188, 14.718093872070312, 19.169052124023438, 23.620010375976562, 28.070968627929688, 32.52192687988281, 36.97288513183594, 41.42384338378906, 45.87480163574219, 50.32575988769531, 54.77671813964844, 59.22767639160156, 63.67863464355469, 68.12959289550781, 72.58055114746094, 77.03150939941406, 81.48246765136719, 85.93342590332031, 90.38438415527344, 94.83534240722656, 99.28630065917969, 103.73725891113281, 108.18821716308594, 112.63917541503906, 117.09013366699219, 121.54109191894531, 125.99205017089844, 130.44300842285156, 134.8939666748047, 139.3449249267578, 143.79588317871094, 148.24684143066406, 152.6977996826172]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 8.0, 21.0, 23.0, 37.0, 66.0, 126.0, 153.0, 316.0, 530.0, 876.0, 1579.0, 2877.0, 5908.0, 12889.0, 34024.0, 137679.0, 3551778.0, 358117.0, 53731.0, 17676.0, 7413.0, 3760.0, 1967.0, 1104.0, 647.0, 368.0, 218.0, 131.0, 72.0, 56.0, 27.0, 25.0, 24.0, 19.0, 14.0, 12.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.125, -54.2353515625, -52.345703125, -50.4560546875, -48.56640625, -46.6767578125, -44.787109375, -42.8974609375, -41.0078125, -39.1181640625, -37.228515625, -35.3388671875, -33.44921875, -31.5595703125, -29.669921875, -27.7802734375, -25.890625, -24.0009765625, -22.111328125, -20.2216796875, -18.33203125, -16.4423828125, -14.552734375, -12.6630859375, -10.7734375, -8.8837890625, -6.994140625, -5.1044921875, -3.21484375, -1.3251953125, 0.564453125, 2.4541015625, 4.34375, 6.2333984375, 8.123046875, 10.0126953125, 11.90234375, 13.7919921875, 15.681640625, 17.5712890625, 19.4609375, 21.3505859375, 23.240234375, 25.1298828125, 27.01953125, 28.9091796875, 30.798828125, 32.6884765625, 34.578125, 36.4677734375, 38.357421875, 40.2470703125, 42.13671875, 44.0263671875, 45.916015625, 47.8056640625, 49.6953125, 51.5849609375, 53.474609375, 55.3642578125, 57.25390625, 59.1435546875, 61.033203125, 62.9228515625, 64.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 7.0, 5.0, 12.0, 12.0, 13.0, 18.0, 22.0, 42.0, 38.0, 34.0, 56.0, 56.0, 59.0, 78.0, 61.0, 84.0, 76.0, 72.0, 55.0, 43.0, 35.0, 27.0, 17.0, 19.0, 17.0, 9.0, 13.0, 4.0, 8.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.640625, -2.550994873046875, -2.46136474609375, -2.371734619140625, -2.2821044921875, -2.192474365234375, -2.10284423828125, -2.013214111328125, -1.923583984375, -1.833953857421875, -1.74432373046875, -1.654693603515625, -1.5650634765625, -1.475433349609375, -1.38580322265625, -1.296173095703125, -1.20654296875, -1.116912841796875, -1.02728271484375, -0.937652587890625, -0.8480224609375, -0.758392333984375, -0.66876220703125, -0.579132080078125, -0.489501953125, -0.399871826171875, -0.31024169921875, -0.220611572265625, -0.1309814453125, -0.041351318359375, 0.04827880859375, 0.137908935546875, 0.2275390625, 0.317169189453125, 0.40679931640625, 0.496429443359375, 0.5860595703125, 0.675689697265625, 0.76531982421875, 0.854949951171875, 0.944580078125, 1.034210205078125, 1.12384033203125, 1.213470458984375, 1.3031005859375, 1.392730712890625, 1.48236083984375, 1.571990966796875, 1.66162109375, 1.751251220703125, 1.84088134765625, 1.930511474609375, 2.0201416015625, 2.109771728515625, 2.19940185546875, 2.289031982421875, 2.378662109375, 2.468292236328125, 2.55792236328125, 2.647552490234375, 2.7371826171875, 2.826812744140625, 2.91644287109375, 3.006072998046875, 3.095703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 5.0, 11.0, 14.0, 26.0, 37.0, 52.0, 74.0, 168.0, 277.0, 624.0, 1575.0, 5280.0, 22629.0, 170816.0, 3611610.0, 335762.0, 34657.0, 7112.0, 2023.0, 774.0, 343.0, 170.0, 88.0, 49.0, 30.0, 27.0, 6.0, 7.0, 7.0, 6.0, 2.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.625, -67.2744140625, -64.923828125, -62.5732421875, -60.22265625, -57.8720703125, -55.521484375, -53.1708984375, -50.8203125, -48.4697265625, -46.119140625, -43.7685546875, -41.41796875, -39.0673828125, -36.716796875, -34.3662109375, -32.015625, -29.6650390625, -27.314453125, -24.9638671875, -22.61328125, -20.2626953125, -17.912109375, -15.5615234375, -13.2109375, -10.8603515625, -8.509765625, -6.1591796875, -3.80859375, -1.4580078125, 0.892578125, 3.2431640625, 5.59375, 7.9443359375, 10.294921875, 12.6455078125, 14.99609375, 17.3466796875, 19.697265625, 22.0478515625, 24.3984375, 26.7490234375, 29.099609375, 31.4501953125, 33.80078125, 36.1513671875, 38.501953125, 40.8525390625, 43.203125, 45.5537109375, 47.904296875, 50.2548828125, 52.60546875, 54.9560546875, 57.306640625, 59.6572265625, 62.0078125, 64.3583984375, 66.708984375, 69.0595703125, 71.41015625, 73.7607421875, 76.111328125, 78.4619140625, 80.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 11.0, 14.0, 31.0, 30.0, 57.0, 82.0, 158.0, 262.0, 650.0, 1669.0, 490.0, 231.0, 135.0, 86.0, 51.0, 23.0, 24.0, 12.0, 17.0, 6.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9820556640625, -9.682861328125, -9.3836669921875, -9.08447265625, -8.7852783203125, -8.486083984375, -8.1868896484375, -7.8876953125, -7.5885009765625, -7.289306640625, -6.9901123046875, -6.69091796875, -6.3917236328125, -6.092529296875, -5.7933349609375, -5.494140625, -5.1949462890625, -4.895751953125, -4.5965576171875, -4.29736328125, -3.9981689453125, -3.698974609375, -3.3997802734375, -3.1005859375, -2.8013916015625, -2.502197265625, -2.2030029296875, -1.90380859375, -1.6046142578125, -1.305419921875, -1.0062255859375, -0.70703125, -0.4078369140625, -0.108642578125, 0.1905517578125, 0.48974609375, 0.7889404296875, 1.088134765625, 1.3873291015625, 1.6865234375, 1.9857177734375, 2.284912109375, 2.5841064453125, 2.88330078125, 3.1824951171875, 3.481689453125, 3.7808837890625, 4.080078125, 4.3792724609375, 4.678466796875, 4.9776611328125, 5.27685546875, 5.5760498046875, 5.875244140625, 6.1744384765625, 6.4736328125, 6.7728271484375, 7.072021484375, 7.3712158203125, 7.67041015625, 7.9696044921875, 8.268798828125, 8.5679931640625, 8.8671875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 10.0, 16.0, 21.0, 31.0, 69.0, 120.0, 176.0, 182.0, 172.0, 93.0, 48.0, 33.0, 18.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.056697845458984, -34.79891586303711, -32.5411376953125, -30.283355712890625, -28.025575637817383, -25.76779556274414, -23.510013580322266, -21.252233505249023, -18.99445343017578, -16.73667335510254, -14.47889232635498, -12.221111297607422, -9.96333122253418, -7.7055511474609375, -5.447770118713379, -3.1899890899658203, -0.9322090148925781, 1.3255715370178223, 3.5833520889282227, 5.841132640838623, 8.098913192749023, 10.356693267822266, 12.614474296569824, 14.872255325317383, 17.130035400390625, 19.387815475463867, 21.64559555053711, 23.903377532958984, 26.161157608032227, 28.41893768310547, 30.676719665527344, 32.93450164794922, 35.192283630371094, 37.45006561279297, 39.70784378051758, 41.96562576293945, 44.22340393066406, 46.48118591308594, 48.73896789550781, 50.99674987792969, 53.2545280456543, 55.51231002807617, 57.77008819580078, 60.027870178222656, 62.28565216064453, 64.54342651367188, 66.80120849609375, 69.05899047851562, 71.3167724609375, 73.57455444335938, 75.83233642578125, 78.0901107788086, 80.34789276123047, 82.60567474365234, 84.86345672607422, 87.1212387084961, 89.37901306152344, 91.63679504394531, 93.89457702636719, 96.15235137939453, 98.4101333618164, 100.66791534423828, 102.92569732666016, 105.18347930908203, 107.4412612915039]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 13.0, 10.0, 13.0, 15.0, 25.0, 20.0, 22.0, 30.0, 41.0, 35.0, 51.0, 47.0, 56.0, 56.0, 46.0, 52.0, 42.0, 46.0, 46.0, 40.0, 38.0, 44.0, 32.0, 38.0, 21.0, 19.0, 24.0, 14.0, 14.0, 10.0, 4.0, 10.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-32.26142120361328, -31.34774398803711, -30.434066772460938, -29.520389556884766, -28.606712341308594, -27.693035125732422, -26.77935791015625, -25.86568260192871, -24.95200538635254, -24.038328170776367, -23.124650955200195, -22.210973739624023, -21.29729652404785, -20.383621215820312, -19.46994400024414, -18.55626678466797, -17.642589569091797, -16.728912353515625, -15.815235137939453, -14.901557922363281, -13.987881660461426, -13.074204444885254, -12.160527229309082, -11.246850967407227, -10.333171844482422, -9.41949462890625, -8.505817413330078, -7.5921406745910645, -6.678463935852051, -5.764786720275879, -4.851109504699707, -3.9374327659606934, -3.0237560272216797, -2.110079050064087, -1.1964019536972046, -0.28272485733032227, 0.6309521198272705, 1.5446290969848633, 2.458306312561035, 3.371983051300049, 4.285660266876221, 5.199337482452393, 6.113014221191406, 7.026691436767578, 7.94036865234375, 8.854045867919922, 9.767723083496094, 10.68139934539795, 11.595076560974121, 12.508753776550293, 13.422430992126465, 14.33610725402832, 15.249784469604492, 16.163461685180664, 17.077138900756836, 17.990816116333008, 18.90449333190918, 19.81817054748535, 20.731847763061523, 21.645524978637695, 22.559202194213867, 23.472877502441406, 24.386554718017578, 25.30023193359375, 26.213909149169922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 6.0, 6.0, 10.0, 17.0, 15.0, 20.0, 38.0, 42.0, 67.0, 109.0, 308.0, 1199.0, 6348.0, 43488.0, 359241.0, 545880.0, 78401.0, 10594.0, 1960.0, 405.0, 143.0, 65.0, 30.0, 32.0, 29.0, 23.0, 13.0, 12.0, 9.0, 7.0, 6.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.5625, -54.90576171875, -53.2490234375, -51.59228515625, -49.935546875, -48.27880859375, -46.6220703125, -44.96533203125, -43.30859375, -41.65185546875, -39.9951171875, -38.33837890625, -36.681640625, -35.02490234375, -33.3681640625, -31.71142578125, -30.0546875, -28.39794921875, -26.7412109375, -25.08447265625, -23.427734375, -21.77099609375, -20.1142578125, -18.45751953125, -16.80078125, -15.14404296875, -13.4873046875, -11.83056640625, -10.173828125, -8.51708984375, -6.8603515625, -5.20361328125, -3.546875, -1.89013671875, -0.2333984375, 1.42333984375, 3.080078125, 4.73681640625, 6.3935546875, 8.05029296875, 9.70703125, 11.36376953125, 13.0205078125, 14.67724609375, 16.333984375, 17.99072265625, 19.6474609375, 21.30419921875, 22.9609375, 24.61767578125, 26.2744140625, 27.93115234375, 29.587890625, 31.24462890625, 32.9013671875, 34.55810546875, 36.21484375, 37.87158203125, 39.5283203125, 41.18505859375, 42.841796875, 44.49853515625, 46.1552734375, 47.81201171875, 49.46875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 11.0, 19.0, 33.0, 52.0, 45.0, 69.0, 75.0, 92.0, 99.0, 97.0, 99.0, 78.0, 65.0, 38.0, 42.0, 26.0, 17.0, 17.0, 5.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6025543212890625, -1.487335205078125, -1.3721160888671875, -1.25689697265625, -1.1416778564453125, -1.026458740234375, -0.9112396240234375, -0.7960205078125, -0.6808013916015625, -0.565582275390625, -0.4503631591796875, -0.33514404296875, -0.2199249267578125, -0.104705810546875, 0.0105133056640625, 0.125732421875, 0.2409515380859375, 0.356170654296875, 0.4713897705078125, 0.58660888671875, 0.7018280029296875, 0.817047119140625, 0.9322662353515625, 1.0474853515625, 1.1627044677734375, 1.277923583984375, 1.3931427001953125, 1.50836181640625, 1.6235809326171875, 1.738800048828125, 1.8540191650390625, 1.96923828125, 2.0844573974609375, 2.199676513671875, 2.3148956298828125, 2.43011474609375, 2.5453338623046875, 2.660552978515625, 2.7757720947265625, 2.8909912109375, 3.0062103271484375, 3.121429443359375, 3.2366485595703125, 3.35186767578125, 3.4670867919921875, 3.582305908203125, 3.6975250244140625, 3.812744140625, 3.9279632568359375, 4.043182373046875, 4.1584014892578125, 4.27362060546875, 4.3888397216796875, 4.504058837890625, 4.6192779541015625, 4.7344970703125, 4.8497161865234375, 4.964935302734375, 5.0801544189453125, 5.19537353515625, 5.3105926513671875, 5.425811767578125, 5.5410308837890625, 5.65625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 14.0, 11.0, 14.0, 17.0, 16.0, 28.0, 31.0, 43.0, 62.0, 99.0, 107.0, 169.0, 249.0, 298.0, 458.0, 718.0, 1270.0, 2468.0, 5914.0, 16521.0, 55698.0, 189123.0, 405187.0, 252774.0, 78923.0, 23462.0, 7773.0, 2993.0, 1467.0, 776.0, 527.0, 368.0, 275.0, 178.0, 137.0, 103.0, 75.0, 57.0, 31.0, 28.0, 36.0, 18.0, 14.0, 4.0, 9.0, 0.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.25, -25.420166015625, -24.59033203125, -23.760498046875, -22.9306640625, -22.100830078125, -21.27099609375, -20.441162109375, -19.611328125, -18.781494140625, -17.95166015625, -17.121826171875, -16.2919921875, -15.462158203125, -14.63232421875, -13.802490234375, -12.97265625, -12.142822265625, -11.31298828125, -10.483154296875, -9.6533203125, -8.823486328125, -7.99365234375, -7.163818359375, -6.333984375, -5.504150390625, -4.67431640625, -3.844482421875, -3.0146484375, -2.184814453125, -1.35498046875, -0.525146484375, 0.3046875, 1.134521484375, 1.96435546875, 2.794189453125, 3.6240234375, 4.453857421875, 5.28369140625, 6.113525390625, 6.943359375, 7.773193359375, 8.60302734375, 9.432861328125, 10.2626953125, 11.092529296875, 11.92236328125, 12.752197265625, 13.58203125, 14.411865234375, 15.24169921875, 16.071533203125, 16.9013671875, 17.731201171875, 18.56103515625, 19.390869140625, 20.220703125, 21.050537109375, 21.88037109375, 22.710205078125, 23.5400390625, 24.369873046875, 25.19970703125, 26.029541015625, 26.859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 5.0, 5.0, 12.0, 11.0, 18.0, 16.0, 17.0, 28.0, 18.0, 31.0, 28.0, 37.0, 40.0, 41.0, 31.0, 58.0, 45.0, 49.0, 40.0, 50.0, 56.0, 46.0, 27.0, 37.0, 37.0, 38.0, 16.0, 23.0, 15.0, 21.0, 21.0, 15.0, 17.0, 10.0, 6.0, 11.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.1953125, -12.8140869140625, -12.432861328125, -12.0516357421875, -11.67041015625, -11.2891845703125, -10.907958984375, -10.5267333984375, -10.1455078125, -9.7642822265625, -9.383056640625, -9.0018310546875, -8.62060546875, -8.2393798828125, -7.858154296875, -7.4769287109375, -7.095703125, -6.7144775390625, -6.333251953125, -5.9520263671875, -5.57080078125, -5.1895751953125, -4.808349609375, -4.4271240234375, -4.0458984375, -3.6646728515625, -3.283447265625, -2.9022216796875, -2.52099609375, -2.1397705078125, -1.758544921875, -1.3773193359375, -0.99609375, -0.6148681640625, -0.233642578125, 0.1475830078125, 0.52880859375, 0.9100341796875, 1.291259765625, 1.6724853515625, 2.0537109375, 2.4349365234375, 2.816162109375, 3.1973876953125, 3.57861328125, 3.9598388671875, 4.341064453125, 4.7222900390625, 5.103515625, 5.4847412109375, 5.865966796875, 6.2471923828125, 6.62841796875, 7.0096435546875, 7.390869140625, 7.7720947265625, 8.1533203125, 8.5345458984375, 8.915771484375, 9.2969970703125, 9.67822265625, 10.0594482421875, 10.440673828125, 10.8218994140625, 11.203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 6.0, 12.0, 16.0, 20.0, 29.0, 49.0, 90.0, 127.0, 225.0, 407.0, 753.0, 1362.0, 3100.0, 7549.0, 21899.0, 73770.0, 258416.0, 424315.0, 179603.0, 50872.0, 15546.0, 5460.0, 2395.0, 1128.0, 569.0, 303.0, 196.0, 132.0, 63.0, 42.0, 26.0, 21.0, 18.0, 18.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.453125, -19.613037109375, -18.77294921875, -17.932861328125, -17.0927734375, -16.252685546875, -15.41259765625, -14.572509765625, -13.732421875, -12.892333984375, -12.05224609375, -11.212158203125, -10.3720703125, -9.531982421875, -8.69189453125, -7.851806640625, -7.01171875, -6.171630859375, -5.33154296875, -4.491455078125, -3.6513671875, -2.811279296875, -1.97119140625, -1.131103515625, -0.291015625, 0.549072265625, 1.38916015625, 2.229248046875, 3.0693359375, 3.909423828125, 4.74951171875, 5.589599609375, 6.4296875, 7.269775390625, 8.10986328125, 8.949951171875, 9.7900390625, 10.630126953125, 11.47021484375, 12.310302734375, 13.150390625, 13.990478515625, 14.83056640625, 15.670654296875, 16.5107421875, 17.350830078125, 18.19091796875, 19.031005859375, 19.87109375, 20.711181640625, 21.55126953125, 22.391357421875, 23.2314453125, 24.071533203125, 24.91162109375, 25.751708984375, 26.591796875, 27.431884765625, 28.27197265625, 29.112060546875, 29.9521484375, 30.792236328125, 31.63232421875, 32.472412109375, 33.3125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 11.0, 11.0, 22.0, 28.0, 32.0, 33.0, 40.0, 47.0, 54.0, 83.0, 90.0, 88.0, 107.0, 66.0, 57.0, 44.0, 44.0, 30.0, 30.0, 16.0, 10.0, 10.0, 4.0, 12.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00262451171875, -0.0025433599948883057, -0.0024622082710266113, -0.002381056547164917, -0.0022999048233032227, -0.0022187530994415283, -0.002137601375579834, -0.0020564496517181396, -0.0019752979278564453, -0.001894146203994751, -0.0018129944801330566, -0.0017318427562713623, -0.001650691032409668, -0.0015695393085479736, -0.0014883875846862793, -0.001407235860824585, -0.0013260841369628906, -0.0012449324131011963, -0.001163780689239502, -0.0010826289653778076, -0.0010014772415161133, -0.0009203255176544189, -0.0008391737937927246, -0.0007580220699310303, -0.0006768703460693359, -0.0005957186222076416, -0.0005145668983459473, -0.00043341517448425293, -0.0003522634506225586, -0.00027111172676086426, -0.00018996000289916992, -0.00010880827903747559, -2.765655517578125e-05, 5.3495168685913086e-05, 0.00013464689254760742, 0.00021579861640930176, 0.0002969503402709961, 0.00037810206413269043, 0.00045925378799438477, 0.0005404055118560791, 0.0006215572357177734, 0.0007027089595794678, 0.0007838606834411621, 0.0008650124073028564, 0.0009461641311645508, 0.0010273158550262451, 0.0011084675788879395, 0.0011896193027496338, 0.0012707710266113281, 0.0013519227504730225, 0.0014330744743347168, 0.0015142261981964111, 0.0015953779220581055, 0.0016765296459197998, 0.0017576813697814941, 0.0018388330936431885, 0.0019199848175048828, 0.002001136541366577, 0.0020822882652282715, 0.002163439989089966, 0.00224459171295166, 0.0023257434368133545, 0.002406895160675049, 0.002488046884536743, 0.0025691986083984375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 2.0, 1.0, 1.0, 7.0, 13.0, 13.0, 20.0, 18.0, 21.0, 31.0, 53.0, 65.0, 103.0, 144.0, 173.0, 336.0, 589.0, 1171.0, 2268.0, 5334.0, 14274.0, 43287.0, 153118.0, 416964.0, 286311.0, 82616.0, 25123.0, 9000.0, 3647.0, 1604.0, 879.0, 443.0, 279.0, 190.0, 125.0, 97.0, 74.0, 37.0, 29.0, 22.0, 19.0, 10.0, 8.0, 6.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.1875, -26.33154296875, -25.4755859375, -24.61962890625, -23.763671875, -22.90771484375, -22.0517578125, -21.19580078125, -20.33984375, -19.48388671875, -18.6279296875, -17.77197265625, -16.916015625, -16.06005859375, -15.2041015625, -14.34814453125, -13.4921875, -12.63623046875, -11.7802734375, -10.92431640625, -10.068359375, -9.21240234375, -8.3564453125, -7.50048828125, -6.64453125, -5.78857421875, -4.9326171875, -4.07666015625, -3.220703125, -2.36474609375, -1.5087890625, -0.65283203125, 0.203125, 1.05908203125, 1.9150390625, 2.77099609375, 3.626953125, 4.48291015625, 5.3388671875, 6.19482421875, 7.05078125, 7.90673828125, 8.7626953125, 9.61865234375, 10.474609375, 11.33056640625, 12.1865234375, 13.04248046875, 13.8984375, 14.75439453125, 15.6103515625, 16.46630859375, 17.322265625, 18.17822265625, 19.0341796875, 19.89013671875, 20.74609375, 21.60205078125, 22.4580078125, 23.31396484375, 24.169921875, 25.02587890625, 25.8818359375, 26.73779296875, 27.59375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 4.0, 8.0, 13.0, 8.0, 16.0, 18.0, 22.0, 37.0, 48.0, 35.0, 66.0, 56.0, 63.0, 81.0, 70.0, 78.0, 59.0, 60.0, 44.0, 36.0, 30.0, 27.0, 26.0, 22.0, 15.0, 3.0, 12.0, 8.0, 8.0, 8.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.265625, -12.8812255859375, -12.496826171875, -12.1124267578125, -11.72802734375, -11.3436279296875, -10.959228515625, -10.5748291015625, -10.1904296875, -9.8060302734375, -9.421630859375, -9.0372314453125, -8.65283203125, -8.2684326171875, -7.884033203125, -7.4996337890625, -7.115234375, -6.7308349609375, -6.346435546875, -5.9620361328125, -5.57763671875, -5.1932373046875, -4.808837890625, -4.4244384765625, -4.0400390625, -3.6556396484375, -3.271240234375, -2.8868408203125, -2.50244140625, -2.1180419921875, -1.733642578125, -1.3492431640625, -0.96484375, -0.5804443359375, -0.196044921875, 0.1883544921875, 0.57275390625, 0.9571533203125, 1.341552734375, 1.7259521484375, 2.1103515625, 2.4947509765625, 2.879150390625, 3.2635498046875, 3.64794921875, 4.0323486328125, 4.416748046875, 4.8011474609375, 5.185546875, 5.5699462890625, 5.954345703125, 6.3387451171875, 6.72314453125, 7.1075439453125, 7.491943359375, 7.8763427734375, 8.2607421875, 8.6451416015625, 9.029541015625, 9.4139404296875, 9.79833984375, 10.1827392578125, 10.567138671875, 10.9515380859375, 11.3359375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 11.0, 29.0, 49.0, 84.0, 164.0, 191.0, 172.0, 127.0, 75.0, 39.0, 23.0, 12.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.6391296386719, -249.26834106445312, -241.89755249023438, -234.52676391601562, -227.1559600830078, -219.78517150878906, -212.4143829345703, -205.04359436035156, -197.67279052734375, -190.302001953125, -182.93121337890625, -175.5604248046875, -168.1896209716797, -160.81883239746094, -153.4480438232422, -146.07725524902344, -138.7064666748047, -131.33567810058594, -123.96488189697266, -116.5940933227539, -109.22329711914062, -101.85250854492188, -94.48171997070312, -87.11093139648438, -79.7401351928711, -72.36934661865234, -64.99855041503906, -57.62776184082031, -50.2569694519043, -42.88617706298828, -35.51538848876953, -28.144596099853516, -20.7738037109375, -13.4030122756958, -6.032220840454102, 1.3385696411132812, 8.709362030029297, 16.080154418945312, 23.450942993164062, 30.821735382080078, 38.192527770996094, 45.56332015991211, 52.934112548828125, 60.304901123046875, 67.67568969726562, 75.0464859008789, 82.41727447509766, 89.78807067871094, 97.15885925292969, 104.52964782714844, 111.90044403076172, 119.27123260498047, 126.64202880859375, 134.0128173828125, 141.38360595703125, 148.75439453125, 156.12518310546875, 163.4959716796875, 170.86676025390625, 178.237548828125, 185.6083526611328, 192.97914123535156, 200.3499298095703, 207.72071838378906, 215.09152221679688]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 11.0, 7.0, 12.0, 22.0, 18.0, 28.0, 33.0, 31.0, 46.0, 40.0, 47.0, 51.0, 63.0, 50.0, 64.0, 47.0, 44.0, 60.0, 49.0, 49.0, 37.0, 35.0, 30.0, 26.0, 19.0, 19.0, 15.0, 13.0, 7.0, 15.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-142.22293090820312, -138.83920288085938, -135.45547485351562, -132.07174682617188, -128.6880340576172, -125.30430603027344, -121.92057800292969, -118.53684997558594, -115.15312957763672, -111.76940155029297, -108.38568115234375, -105.001953125, -101.61822509765625, -98.23450469970703, -94.85077667236328, -91.46705627441406, -88.08332824707031, -84.69960021972656, -81.31587982177734, -77.9321517944336, -74.54842376708984, -71.16470336914062, -67.78097534179688, -64.39724731445312, -61.013519287109375, -57.62979507446289, -54.24606704711914, -50.862342834472656, -47.47861862182617, -44.09489440917969, -40.71116638183594, -37.32744216918945, -33.94371795654297, -30.55999183654785, -27.176267623901367, -23.79254150390625, -20.408817291259766, -17.02509117126465, -13.641365051269531, -10.257640838623047, -6.87391471862793, -3.49018931388855, -0.10646390914916992, 3.277261734008789, 6.66098690032959, 10.04471206665039, 13.428438186645508, 16.812162399291992, 20.19588851928711, 23.579614639282227, 26.96333885192871, 30.347064971923828, 33.73078918457031, 37.11451721191406, 40.49824142456055, 43.88196563720703, 47.26569366455078, 50.649417877197266, 54.033145904541016, 57.4168701171875, 60.800594329833984, 64.18431854248047, 67.56804656982422, 70.95176696777344, 74.33549499511719]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 4.0, 10.0, 13.0, 21.0, 35.0, 57.0, 97.0, 235.0, 1787.0, 42350.0, 4097835.0, 49331.0, 1845.0, 302.0, 132.0, 93.0, 42.0, 34.0, 28.0, 13.0, 12.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.75, -140.25390625, -134.7578125, -129.26171875, -123.765625, -118.26953125, -112.7734375, -107.27734375, -101.78125, -96.28515625, -90.7890625, -85.29296875, -79.796875, -74.30078125, -68.8046875, -63.30859375, -57.8125, -52.31640625, -46.8203125, -41.32421875, -35.828125, -30.33203125, -24.8359375, -19.33984375, -13.84375, -8.34765625, -2.8515625, 2.64453125, 8.140625, 13.63671875, 19.1328125, 24.62890625, 30.125, 35.62109375, 41.1171875, 46.61328125, 52.109375, 57.60546875, 63.1015625, 68.59765625, 74.09375, 79.58984375, 85.0859375, 90.58203125, 96.078125, 101.57421875, 107.0703125, 112.56640625, 118.0625, 123.55859375, 129.0546875, 134.55078125, 140.046875, 145.54296875, 151.0390625, 156.53515625, 162.03125, 167.52734375, 173.0234375, 178.51953125, 184.015625, 189.51171875, 195.0078125, 200.50390625, 206.0]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 10.0, 8.0, 15.0, 19.0, 34.0, 42.0, 66.0, 70.0, 94.0, 103.0, 104.0, 89.0, 95.0, 76.0, 65.0, 40.0, 23.0, 20.0, 17.0, 6.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.072021484375, -3.91748046875, -3.762939453125, -3.6083984375, -3.453857421875, -3.29931640625, -3.144775390625, -2.990234375, -2.835693359375, -2.68115234375, -2.526611328125, -2.3720703125, -2.217529296875, -2.06298828125, -1.908447265625, -1.75390625, -1.599365234375, -1.44482421875, -1.290283203125, -1.1357421875, -0.981201171875, -0.82666015625, -0.672119140625, -0.517578125, -0.363037109375, -0.20849609375, -0.053955078125, 0.1005859375, 0.255126953125, 0.40966796875, 0.564208984375, 0.71875, 0.873291015625, 1.02783203125, 1.182373046875, 1.3369140625, 1.491455078125, 1.64599609375, 1.800537109375, 1.955078125, 2.109619140625, 2.26416015625, 2.418701171875, 2.5732421875, 2.727783203125, 2.88232421875, 3.036865234375, 3.19140625, 3.345947265625, 3.50048828125, 3.655029296875, 3.8095703125, 3.964111328125, 4.11865234375, 4.273193359375, 4.427734375, 4.582275390625, 4.73681640625, 4.891357421875, 5.0458984375, 5.200439453125, 5.35498046875, 5.509521484375, 5.6640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 12.0, 7.0, 11.0, 15.0, 16.0, 21.0, 24.0, 26.0, 45.0, 60.0, 94.0, 121.0, 191.0, 313.0, 585.0, 1165.0, 2797.0, 7862.0, 26771.0, 120375.0, 1201273.0, 2622468.0, 160235.0, 34006.0, 9535.0, 3259.0, 1391.0, 655.0, 321.0, 205.0, 140.0, 76.0, 45.0, 41.0, 24.0, 24.0, 18.0, 13.0, 11.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-53.78125, -52.248046875, -50.71484375, -49.181640625, -47.6484375, -46.115234375, -44.58203125, -43.048828125, -41.515625, -39.982421875, -38.44921875, -36.916015625, -35.3828125, -33.849609375, -32.31640625, -30.783203125, -29.25, -27.716796875, -26.18359375, -24.650390625, -23.1171875, -21.583984375, -20.05078125, -18.517578125, -16.984375, -15.451171875, -13.91796875, -12.384765625, -10.8515625, -9.318359375, -7.78515625, -6.251953125, -4.71875, -3.185546875, -1.65234375, -0.119140625, 1.4140625, 2.947265625, 4.48046875, 6.013671875, 7.546875, 9.080078125, 10.61328125, 12.146484375, 13.6796875, 15.212890625, 16.74609375, 18.279296875, 19.8125, 21.345703125, 22.87890625, 24.412109375, 25.9453125, 27.478515625, 29.01171875, 30.544921875, 32.078125, 33.611328125, 35.14453125, 36.677734375, 38.2109375, 39.744140625, 41.27734375, 42.810546875, 44.34375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 12.0, 9.0, 33.0, 23.0, 49.0, 79.0, 141.0, 281.0, 725.0, 1656.0, 511.0, 203.0, 130.0, 63.0, 60.0, 35.0, 18.0, 11.0, 10.0, 6.0, 7.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.015625, -15.645751953125, -15.27587890625, -14.906005859375, -14.5361328125, -14.166259765625, -13.79638671875, -13.426513671875, -13.056640625, -12.686767578125, -12.31689453125, -11.947021484375, -11.5771484375, -11.207275390625, -10.83740234375, -10.467529296875, -10.09765625, -9.727783203125, -9.35791015625, -8.988037109375, -8.6181640625, -8.248291015625, -7.87841796875, -7.508544921875, -7.138671875, -6.768798828125, -6.39892578125, -6.029052734375, -5.6591796875, -5.289306640625, -4.91943359375, -4.549560546875, -4.1796875, -3.809814453125, -3.43994140625, -3.070068359375, -2.7001953125, -2.330322265625, -1.96044921875, -1.590576171875, -1.220703125, -0.850830078125, -0.48095703125, -0.111083984375, 0.2587890625, 0.628662109375, 0.99853515625, 1.368408203125, 1.73828125, 2.108154296875, 2.47802734375, 2.847900390625, 3.2177734375, 3.587646484375, 3.95751953125, 4.327392578125, 4.697265625, 5.067138671875, 5.43701171875, 5.806884765625, 6.1767578125, 6.546630859375, 6.91650390625, 7.286376953125, 7.65625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 14.0, 50.0, 118.0, 200.0, 263.0, 172.0, 107.0, 42.0, 11.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.45655822753906, -179.21998596191406, -174.9833984375, -170.746826171875, -166.51025390625, -162.273681640625, -158.037109375, -153.80052185058594, -149.56394958496094, -145.32737731933594, -141.09078979492188, -136.85421752929688, -132.61764526367188, -128.38107299804688, -124.14449310302734, -119.90791320800781, -115.67134094238281, -111.43476867675781, -107.19818878173828, -102.96160888671875, -98.72503662109375, -94.48846435546875, -90.25188446044922, -86.01530456542969, -81.77873229980469, -77.54216003417969, -73.30558013916016, -69.06900024414062, -64.83242797851562, -60.59585189819336, -56.359275817871094, -52.12269973754883, -47.88611602783203, -43.649539947509766, -39.4129638671875, -35.176387786865234, -30.93981170654297, -26.703235626220703, -22.466659545898438, -18.230083465576172, -13.993507385253906, -9.75693130493164, -5.520355224609375, -1.2837791442871094, 2.9527969360351562, 7.189373016357422, 11.425949096679688, 15.662525177001953, 19.89910125732422, 24.135677337646484, 28.37225341796875, 32.608829498291016, 36.84540557861328, 41.08198165893555, 45.31855773925781, 49.55513381958008, 53.791709899902344, 58.02828598022461, 62.264862060546875, 66.50143432617188, 70.7380142211914, 74.97459411621094, 79.21116638183594, 83.44773864746094, 87.68431854248047]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 5.0, 8.0, 10.0, 12.0, 20.0, 13.0, 31.0, 18.0, 29.0, 20.0, 33.0, 36.0, 45.0, 42.0, 43.0, 34.0, 40.0, 41.0, 35.0, 35.0, 51.0, 41.0, 41.0, 36.0, 32.0, 26.0, 31.0, 25.0, 18.0, 20.0, 17.0, 21.0, 9.0, 17.0, 8.0, 14.0, 7.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.88884735107422, -30.899494171142578, -29.91014289855957, -28.92078971862793, -27.931438446044922, -26.94208526611328, -25.95273208618164, -24.963380813598633, -23.974027633666992, -22.98467445373535, -21.995323181152344, -21.005970001220703, -20.016618728637695, -19.027265548706055, -18.037914276123047, -17.048561096191406, -16.059207916259766, -15.069855690002441, -14.080503463745117, -13.091150283813477, -12.101798057556152, -11.112445831298828, -10.123093605041504, -9.13374137878418, -8.144390106201172, -7.155037879943848, -6.165685176849365, -5.176332950592041, -4.186980247497559, -3.1976280212402344, -2.20827579498291, -1.2189230918884277, -0.2295703887939453, 0.7597820162773132, 1.7491344213485718, 2.7384867668151855, 3.727839231491089, 4.717191696166992, 5.706543922424316, 6.695896625518799, 7.685248851776123, 8.674601554870605, 9.66395378112793, 10.653306007385254, 11.642658233642578, 12.632011413574219, 13.621362686157227, 14.610715866088867, 15.600068092346191, 16.589420318603516, 17.578773498535156, 18.568124771118164, 19.557477951049805, 20.546829223632812, 21.536182403564453, 22.525535583496094, 23.5148868560791, 24.504240036010742, 25.49359130859375, 26.48294448852539, 27.4722957611084, 28.46164894104004, 29.451000213623047, 30.440353393554688, 31.429706573486328]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 13.0, 12.0, 8.0, 19.0, 17.0, 34.0, 28.0, 32.0, 55.0, 75.0, 125.0, 234.0, 442.0, 1133.0, 3194.0, 10380.0, 36794.0, 135507.0, 388350.0, 328191.0, 103536.0, 27934.0, 8031.0, 2475.0, 947.0, 379.0, 191.0, 107.0, 83.0, 46.0, 33.0, 32.0, 17.0, 17.0, 18.0, 8.0, 10.0, 4.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-30.203125, -29.284912109375, -28.36669921875, -27.448486328125, -26.5302734375, -25.612060546875, -24.69384765625, -23.775634765625, -22.857421875, -21.939208984375, -21.02099609375, -20.102783203125, -19.1845703125, -18.266357421875, -17.34814453125, -16.429931640625, -15.51171875, -14.593505859375, -13.67529296875, -12.757080078125, -11.8388671875, -10.920654296875, -10.00244140625, -9.084228515625, -8.166015625, -7.247802734375, -6.32958984375, -5.411376953125, -4.4931640625, -3.574951171875, -2.65673828125, -1.738525390625, -0.8203125, 0.097900390625, 1.01611328125, 1.934326171875, 2.8525390625, 3.770751953125, 4.68896484375, 5.607177734375, 6.525390625, 7.443603515625, 8.36181640625, 9.280029296875, 10.1982421875, 11.116455078125, 12.03466796875, 12.952880859375, 13.87109375, 14.789306640625, 15.70751953125, 16.625732421875, 17.5439453125, 18.462158203125, 19.38037109375, 20.298583984375, 21.216796875, 22.135009765625, 23.05322265625, 23.971435546875, 24.8896484375, 25.807861328125, 26.72607421875, 27.644287109375, 28.5625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 8.0, 26.0, 18.0, 35.0, 40.0, 60.0, 61.0, 75.0, 100.0, 91.0, 93.0, 84.0, 80.0, 62.0, 53.0, 39.0, 30.0, 16.0, 14.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.03277587890625, -3.8819580078125, -3.73114013671875, -3.580322265625, -3.42950439453125, -3.2786865234375, -3.12786865234375, -2.97705078125, -2.82623291015625, -2.6754150390625, -2.52459716796875, -2.373779296875, -2.22296142578125, -2.0721435546875, -1.92132568359375, -1.7705078125, -1.61968994140625, -1.4688720703125, -1.31805419921875, -1.167236328125, -1.01641845703125, -0.8656005859375, -0.71478271484375, -0.56396484375, -0.41314697265625, -0.2623291015625, -0.11151123046875, 0.039306640625, 0.19012451171875, 0.3409423828125, 0.49176025390625, 0.642578125, 0.79339599609375, 0.9442138671875, 1.09503173828125, 1.245849609375, 1.39666748046875, 1.5474853515625, 1.69830322265625, 1.84912109375, 1.99993896484375, 2.1507568359375, 2.30157470703125, 2.452392578125, 2.60321044921875, 2.7540283203125, 2.90484619140625, 3.0556640625, 3.20648193359375, 3.3572998046875, 3.50811767578125, 3.658935546875, 3.80975341796875, 3.9605712890625, 4.11138916015625, 4.26220703125, 4.41302490234375, 4.5638427734375, 4.71466064453125, 4.865478515625, 5.01629638671875, 5.1671142578125, 5.31793212890625, 5.46875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 3.0, 4.0, 9.0, 7.0, 14.0, 23.0, 22.0, 44.0, 53.0, 67.0, 88.0, 120.0, 190.0, 306.0, 418.0, 626.0, 1136.0, 2296.0, 6296.0, 23377.0, 108402.0, 439809.0, 358500.0, 79307.0, 17573.0, 5044.0, 1984.0, 1025.0, 561.0, 373.0, 251.0, 178.0, 116.0, 94.0, 69.0, 40.0, 37.0, 29.0, 12.0, 15.0, 7.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.75, -30.72265625, -29.6953125, -28.66796875, -27.640625, -26.61328125, -25.5859375, -24.55859375, -23.53125, -22.50390625, -21.4765625, -20.44921875, -19.421875, -18.39453125, -17.3671875, -16.33984375, -15.3125, -14.28515625, -13.2578125, -12.23046875, -11.203125, -10.17578125, -9.1484375, -8.12109375, -7.09375, -6.06640625, -5.0390625, -4.01171875, -2.984375, -1.95703125, -0.9296875, 0.09765625, 1.125, 2.15234375, 3.1796875, 4.20703125, 5.234375, 6.26171875, 7.2890625, 8.31640625, 9.34375, 10.37109375, 11.3984375, 12.42578125, 13.453125, 14.48046875, 15.5078125, 16.53515625, 17.5625, 18.58984375, 19.6171875, 20.64453125, 21.671875, 22.69921875, 23.7265625, 24.75390625, 25.78125, 26.80859375, 27.8359375, 28.86328125, 29.890625, 30.91796875, 31.9453125, 32.97265625, 34.0]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 8.0, 7.0, 12.0, 17.0, 23.0, 17.0, 33.0, 27.0, 25.0, 37.0, 34.0, 40.0, 42.0, 44.0, 49.0, 46.0, 51.0, 44.0, 50.0, 40.0, 46.0, 31.0, 39.0, 38.0, 23.0, 26.0, 17.0, 19.0, 19.0, 14.0, 8.0, 8.0, 9.0, 7.0, 10.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5234375, -14.0626220703125, -13.601806640625, -13.1409912109375, -12.68017578125, -12.2193603515625, -11.758544921875, -11.2977294921875, -10.8369140625, -10.3760986328125, -9.915283203125, -9.4544677734375, -8.99365234375, -8.5328369140625, -8.072021484375, -7.6112060546875, -7.150390625, -6.6895751953125, -6.228759765625, -5.7679443359375, -5.30712890625, -4.8463134765625, -4.385498046875, -3.9246826171875, -3.4638671875, -3.0030517578125, -2.542236328125, -2.0814208984375, -1.62060546875, -1.1597900390625, -0.698974609375, -0.2381591796875, 0.22265625, 0.6834716796875, 1.144287109375, 1.6051025390625, 2.06591796875, 2.5267333984375, 2.987548828125, 3.4483642578125, 3.9091796875, 4.3699951171875, 4.830810546875, 5.2916259765625, 5.75244140625, 6.2132568359375, 6.674072265625, 7.1348876953125, 7.595703125, 8.0565185546875, 8.517333984375, 8.9781494140625, 9.43896484375, 9.8997802734375, 10.360595703125, 10.8214111328125, 11.2822265625, 11.7430419921875, 12.203857421875, 12.6646728515625, 13.12548828125, 13.5863037109375, 14.047119140625, 14.5079345703125, 14.96875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 8.0, 16.0, 19.0, 35.0, 54.0, 74.0, 152.0, 214.0, 420.0, 741.0, 1674.0, 4044.0, 11536.0, 41975.0, 210372.0, 545070.0, 178645.0, 36264.0, 10246.0, 3722.0, 1567.0, 773.0, 353.0, 240.0, 116.0, 80.0, 39.0, 26.0, 19.0, 17.0, 7.0, 6.0, 3.0, 7.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.578125, -21.755615234375, -20.93310546875, -20.110595703125, -19.2880859375, -18.465576171875, -17.64306640625, -16.820556640625, -15.998046875, -15.175537109375, -14.35302734375, -13.530517578125, -12.7080078125, -11.885498046875, -11.06298828125, -10.240478515625, -9.41796875, -8.595458984375, -7.77294921875, -6.950439453125, -6.1279296875, -5.305419921875, -4.48291015625, -3.660400390625, -2.837890625, -2.015380859375, -1.19287109375, -0.370361328125, 0.4521484375, 1.274658203125, 2.09716796875, 2.919677734375, 3.7421875, 4.564697265625, 5.38720703125, 6.209716796875, 7.0322265625, 7.854736328125, 8.67724609375, 9.499755859375, 10.322265625, 11.144775390625, 11.96728515625, 12.789794921875, 13.6123046875, 14.434814453125, 15.25732421875, 16.079833984375, 16.90234375, 17.724853515625, 18.54736328125, 19.369873046875, 20.1923828125, 21.014892578125, 21.83740234375, 22.659912109375, 23.482421875, 24.304931640625, 25.12744140625, 25.949951171875, 26.7724609375, 27.594970703125, 28.41748046875, 29.239990234375, 30.0625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 12.0, 10.0, 24.0, 34.0, 40.0, 39.0, 47.0, 72.0, 74.0, 77.0, 89.0, 75.0, 69.0, 65.0, 62.0, 42.0, 41.0, 21.0, 20.0, 15.0, 16.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017547607421875, -0.0016904175281524658, -0.0016260743141174316, -0.0015617311000823975, -0.0014973878860473633, -0.001433044672012329, -0.001368701457977295, -0.0013043582439422607, -0.0012400150299072266, -0.0011756718158721924, -0.0011113286018371582, -0.001046985387802124, -0.0009826421737670898, -0.0009182989597320557, -0.0008539557456970215, -0.0007896125316619873, -0.0007252693176269531, -0.0006609261035919189, -0.0005965828895568848, -0.0005322396755218506, -0.0004678964614868164, -0.0004035532474517822, -0.00033921003341674805, -0.00027486681938171387, -0.0002105236053466797, -0.0001461803913116455, -8.183717727661133e-05, -1.749396324157715e-05, 4.684925079345703e-05, 0.00011119246482849121, 0.0001755356788635254, 0.00023987889289855957, 0.00030422210693359375, 0.00036856532096862793, 0.0004329085350036621, 0.0004972517490386963, 0.0005615949630737305, 0.0006259381771087646, 0.0006902813911437988, 0.000754624605178833, 0.0008189678192138672, 0.0008833110332489014, 0.0009476542472839355, 0.0010119974613189697, 0.001076340675354004, 0.001140683889389038, 0.0012050271034240723, 0.0012693703174591064, 0.0013337135314941406, 0.0013980567455291748, 0.001462399959564209, 0.0015267431735992432, 0.0015910863876342773, 0.0016554296016693115, 0.0017197728157043457, 0.0017841160297393799, 0.001848459243774414, 0.0019128024578094482, 0.0019771456718444824, 0.0020414888858795166, 0.0021058320999145508, 0.002170175313949585, 0.002234518527984619, 0.0022988617420196533, 0.0023632049560546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 2.0, 6.0, 9.0, 14.0, 18.0, 34.0, 46.0, 71.0, 132.0, 232.0, 393.0, 780.0, 1727.0, 4260.0, 16191.0, 121039.0, 637198.0, 229432.0, 26747.0, 5893.0, 2169.0, 948.0, 506.0, 296.0, 138.0, 104.0, 64.0, 26.0, 17.0, 15.0, 4.0, 8.0, 5.0, 10.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.59375, -44.382568359375, -43.17138671875, -41.960205078125, -40.7490234375, -39.537841796875, -38.32666015625, -37.115478515625, -35.904296875, -34.693115234375, -33.48193359375, -32.270751953125, -31.0595703125, -29.848388671875, -28.63720703125, -27.426025390625, -26.21484375, -25.003662109375, -23.79248046875, -22.581298828125, -21.3701171875, -20.158935546875, -18.94775390625, -17.736572265625, -16.525390625, -15.314208984375, -14.10302734375, -12.891845703125, -11.6806640625, -10.469482421875, -9.25830078125, -8.047119140625, -6.8359375, -5.624755859375, -4.41357421875, -3.202392578125, -1.9912109375, -0.780029296875, 0.43115234375, 1.642333984375, 2.853515625, 4.064697265625, 5.27587890625, 6.487060546875, 7.6982421875, 8.909423828125, 10.12060546875, 11.331787109375, 12.54296875, 13.754150390625, 14.96533203125, 16.176513671875, 17.3876953125, 18.598876953125, 19.81005859375, 21.021240234375, 22.232421875, 23.443603515625, 24.65478515625, 25.865966796875, 27.0771484375, 28.288330078125, 29.49951171875, 30.710693359375, 31.921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 12.0, 10.0, 23.0, 34.0, 51.0, 66.0, 78.0, 79.0, 88.0, 95.0, 95.0, 76.0, 68.0, 58.0, 46.0, 33.0, 19.0, 19.0, 13.0, 7.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.4141845703125, -13.804931640625, -13.1956787109375, -12.58642578125, -11.9771728515625, -11.367919921875, -10.7586669921875, -10.1494140625, -9.5401611328125, -8.930908203125, -8.3216552734375, -7.71240234375, -7.1031494140625, -6.493896484375, -5.8846435546875, -5.275390625, -4.6661376953125, -4.056884765625, -3.4476318359375, -2.83837890625, -2.2291259765625, -1.619873046875, -1.0106201171875, -0.4013671875, 0.2078857421875, 0.817138671875, 1.4263916015625, 2.03564453125, 2.6448974609375, 3.254150390625, 3.8634033203125, 4.47265625, 5.0819091796875, 5.691162109375, 6.3004150390625, 6.90966796875, 7.5189208984375, 8.128173828125, 8.7374267578125, 9.3466796875, 9.9559326171875, 10.565185546875, 11.1744384765625, 11.78369140625, 12.3929443359375, 13.002197265625, 13.6114501953125, 14.220703125, 14.8299560546875, 15.439208984375, 16.0484619140625, 16.65771484375, 17.2669677734375, 17.876220703125, 18.4854736328125, 19.0947265625, 19.7039794921875, 20.313232421875, 20.9224853515625, 21.53173828125, 22.1409912109375, 22.750244140625, 23.3594970703125, 23.96875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 11.0, 34.0, 112.0, 229.0, 309.0, 192.0, 83.0, 20.0, 8.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-598.8878173828125, -586.2535400390625, -573.6192626953125, -560.9849853515625, -548.3506469726562, -535.7163696289062, -523.0820922851562, -510.44781494140625, -497.81353759765625, -485.17926025390625, -472.5449523925781, -459.9106750488281, -447.2763977050781, -434.6421203613281, -422.0078125, -409.37353515625, -396.7392578125, -384.10498046875, -371.4706726074219, -358.8363952636719, -346.2021179199219, -333.5678405761719, -320.93353271484375, -308.29925537109375, -295.6649475097656, -283.0306701660156, -270.3963623046875, -257.7620849609375, -245.1278076171875, -232.49351501464844, -219.85922241210938, -207.22494506835938, -194.59066772460938, -181.9563751220703, -169.3220977783203, -156.68780517578125, -144.05352783203125, -131.4192352294922, -118.78495025634766, -106.15066528320312, -93.5163803100586, -80.88209533691406, -68.24781036376953, -55.613521575927734, -42.9792366027832, -30.344951629638672, -17.710662841796875, -5.076377868652344, 7.5579071044921875, 20.19219207763672, 32.82647705078125, 45.46076583862305, 58.09505081176758, 70.72933959960938, 83.3636245727539, 95.99790954589844, 108.63219451904297, 121.2664794921875, 133.90077209472656, 146.53504943847656, 159.16934204101562, 171.80361938476562, 184.4379119873047, 197.07220458984375, 209.70648193359375]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 8.0, 11.0, 12.0, 19.0, 19.0, 27.0, 39.0, 40.0, 33.0, 51.0, 47.0, 49.0, 41.0, 49.0, 62.0, 44.0, 41.0, 57.0, 49.0, 47.0, 44.0, 37.0, 30.0, 37.0, 16.0, 20.0, 9.0, 14.0, 8.0, 9.0, 9.0, 3.0, 4.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.0939483642578, -127.42398071289062, -123.75401306152344, -120.08403778076172, -116.41407012939453, -112.74410247802734, -109.07412719726562, -105.40415954589844, -101.73419189453125, -98.06422424316406, -94.39425659179688, -90.72428131103516, -87.05431365966797, -83.38434600830078, -79.71437072753906, -76.04440307617188, -72.37443542480469, -68.7044677734375, -65.03450012207031, -61.364524841308594, -57.694557189941406, -54.02458953857422, -50.354618072509766, -46.68464660644531, -43.014678955078125, -39.34471130371094, -35.674739837646484, -32.00476837158203, -28.334800720214844, -24.664831161499023, -20.994861602783203, -17.324892044067383, -13.654922485351562, -9.984952926635742, -6.314983367919922, -2.6450138092041016, 1.0249557495117188, 4.694925308227539, 8.36489486694336, 12.03486442565918, 15.704833984375, 19.37480354309082, 23.04477310180664, 26.71474266052246, 30.38471221923828, 34.05467987060547, 37.72465133666992, 41.394622802734375, 45.06459045410156, 48.73455810546875, 52.4045295715332, 56.074501037597656, 59.744468688964844, 63.41443634033203, 67.08441162109375, 70.75437927246094, 74.42434692382812, 78.09431457519531, 81.7642822265625, 85.43425750732422, 89.1042251586914, 92.7741928100586, 96.44416809082031, 100.1141357421875, 103.78410339355469]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 7.0, 6.0, 3.0, 7.0, 12.0, 11.0, 18.0, 28.0, 37.0, 36.0, 52.0, 89.0, 139.0, 272.0, 449.0, 924.0, 1971.0, 4639.0, 13197.0, 45641.0, 272647.0, 3532624.0, 255167.0, 44081.0, 13010.0, 4775.0, 2015.0, 1013.0, 478.0, 274.0, 211.0, 119.0, 81.0, 55.0, 48.0, 30.0, 23.0, 23.0, 19.0, 9.0, 11.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-37.78125, -36.455078125, -35.12890625, -33.802734375, -32.4765625, -31.150390625, -29.82421875, -28.498046875, -27.171875, -25.845703125, -24.51953125, -23.193359375, -21.8671875, -20.541015625, -19.21484375, -17.888671875, -16.5625, -15.236328125, -13.91015625, -12.583984375, -11.2578125, -9.931640625, -8.60546875, -7.279296875, -5.953125, -4.626953125, -3.30078125, -1.974609375, -0.6484375, 0.677734375, 2.00390625, 3.330078125, 4.65625, 5.982421875, 7.30859375, 8.634765625, 9.9609375, 11.287109375, 12.61328125, 13.939453125, 15.265625, 16.591796875, 17.91796875, 19.244140625, 20.5703125, 21.896484375, 23.22265625, 24.548828125, 25.875, 27.201171875, 28.52734375, 29.853515625, 31.1796875, 32.505859375, 33.83203125, 35.158203125, 36.484375, 37.810546875, 39.13671875, 40.462890625, 41.7890625, 43.115234375, 44.44140625, 45.767578125, 47.09375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 4.0, 7.0, 15.0, 19.0, 24.0, 34.0, 23.0, 32.0, 54.0, 50.0, 64.0, 79.0, 78.0, 68.0, 57.0, 48.0, 51.0, 68.0, 50.0, 44.0, 20.0, 24.0, 32.0, 14.0, 15.0, 11.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.595703125, -3.469329833984375, -3.34295654296875, -3.216583251953125, -3.0902099609375, -2.963836669921875, -2.83746337890625, -2.711090087890625, -2.584716796875, -2.458343505859375, -2.33197021484375, -2.205596923828125, -2.0792236328125, -1.952850341796875, -1.82647705078125, -1.700103759765625, -1.57373046875, -1.447357177734375, -1.32098388671875, -1.194610595703125, -1.0682373046875, -0.941864013671875, -0.81549072265625, -0.689117431640625, -0.562744140625, -0.436370849609375, -0.30999755859375, -0.183624267578125, -0.0572509765625, 0.069122314453125, 0.19549560546875, 0.321868896484375, 0.4482421875, 0.574615478515625, 0.70098876953125, 0.827362060546875, 0.9537353515625, 1.080108642578125, 1.20648193359375, 1.332855224609375, 1.459228515625, 1.585601806640625, 1.71197509765625, 1.838348388671875, 1.9647216796875, 2.091094970703125, 2.21746826171875, 2.343841552734375, 2.47021484375, 2.596588134765625, 2.72296142578125, 2.849334716796875, 2.9757080078125, 3.102081298828125, 3.22845458984375, 3.354827880859375, 3.481201171875, 3.607574462890625, 3.73394775390625, 3.860321044921875, 3.9866943359375, 4.113067626953125, 4.23944091796875, 4.365814208984375, 4.4921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 6.0, 10.0, 9.0, 10.0, 11.0, 21.0, 16.0, 29.0, 21.0, 34.0, 44.0, 61.0, 107.0, 238.0, 588.0, 1898.0, 11325.0, 149555.0, 3819637.0, 194009.0, 13147.0, 2219.0, 590.0, 202.0, 117.0, 74.0, 58.0, 47.0, 23.0, 26.0, 20.0, 20.0, 19.0, 15.0, 10.0, 12.0, 11.0, 14.0, 3.0, 1.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-71.8125, -69.4609375, -67.109375, -64.7578125, -62.40625, -60.0546875, -57.703125, -55.3515625, -53.0, -50.6484375, -48.296875, -45.9453125, -43.59375, -41.2421875, -38.890625, -36.5390625, -34.1875, -31.8359375, -29.484375, -27.1328125, -24.78125, -22.4296875, -20.078125, -17.7265625, -15.375, -13.0234375, -10.671875, -8.3203125, -5.96875, -3.6171875, -1.265625, 1.0859375, 3.4375, 5.7890625, 8.140625, 10.4921875, 12.84375, 15.1953125, 17.546875, 19.8984375, 22.25, 24.6015625, 26.953125, 29.3046875, 31.65625, 34.0078125, 36.359375, 38.7109375, 41.0625, 43.4140625, 45.765625, 48.1171875, 50.46875, 52.8203125, 55.171875, 57.5234375, 59.875, 62.2265625, 64.578125, 66.9296875, 69.28125, 71.6328125, 73.984375, 76.3359375, 78.6875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 15.0, 28.0, 55.0, 155.0, 496.0, 2310.0, 697.0, 186.0, 75.0, 27.0, 16.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7890625, -9.0706787109375, -8.352294921875, -7.6339111328125, -6.91552734375, -6.1971435546875, -5.478759765625, -4.7603759765625, -4.0419921875, -3.3236083984375, -2.605224609375, -1.8868408203125, -1.16845703125, -0.4500732421875, 0.268310546875, 0.9866943359375, 1.705078125, 2.4234619140625, 3.141845703125, 3.8602294921875, 4.57861328125, 5.2969970703125, 6.015380859375, 6.7337646484375, 7.4521484375, 8.1705322265625, 8.888916015625, 9.6072998046875, 10.32568359375, 11.0440673828125, 11.762451171875, 12.4808349609375, 13.19921875, 13.9176025390625, 14.635986328125, 15.3543701171875, 16.07275390625, 16.7911376953125, 17.509521484375, 18.2279052734375, 18.9462890625, 19.6646728515625, 20.383056640625, 21.1014404296875, 21.81982421875, 22.5382080078125, 23.256591796875, 23.9749755859375, 24.693359375, 25.4117431640625, 26.130126953125, 26.8485107421875, 27.56689453125, 28.2852783203125, 29.003662109375, 29.7220458984375, 30.4404296875, 31.1588134765625, 31.877197265625, 32.5955810546875, 33.31396484375, 34.0323486328125, 34.750732421875, 35.4691162109375, 36.1875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 13.0, 15.0, 19.0, 36.0, 72.0, 115.0, 165.0, 184.0, 123.0, 105.0, 76.0, 27.0, 23.0, 12.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.16114807128906, -78.63786315917969, -76.11457824707031, -73.59130096435547, -71.0680160522461, -68.54473114013672, -66.02144622802734, -63.49816131591797, -60.97488021850586, -58.451595306396484, -55.928314208984375, -53.405029296875, -50.881744384765625, -48.358463287353516, -45.83517837524414, -43.31189727783203, -40.788612365722656, -38.26532745361328, -35.74204635620117, -33.2187614440918, -30.695478439331055, -28.172195434570312, -25.648910522460938, -23.125627517700195, -20.602344512939453, -18.07906150817871, -15.555777549743652, -13.032493591308594, -10.509210586547852, -7.985927581787109, -5.462643623352051, -2.939359664916992, -0.41606903076171875, 2.1072144508361816, 4.630497932434082, 7.153781414031982, 9.677064895629883, 12.200347900390625, 14.723631858825684, 17.246915817260742, 19.770198822021484, 22.293481826782227, 24.81676483154297, 27.340049743652344, 29.863332748413086, 32.38661575317383, 34.9099006652832, 37.43318176269531, 39.95646667480469, 42.47975158691406, 45.00303268432617, 47.52631759643555, 50.049598693847656, 52.57288360595703, 55.096168518066406, 57.61945343017578, 60.14273452758789, 62.666019439697266, 65.18930053710938, 67.71258544921875, 70.23587036132812, 72.7591552734375, 75.28243255615234, 77.80571746826172, 80.3290023803711]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 11.0, 10.0, 7.0, 19.0, 28.0, 18.0, 35.0, 44.0, 47.0, 55.0, 63.0, 74.0, 61.0, 69.0, 61.0, 60.0, 51.0, 51.0, 53.0, 37.0, 37.0, 25.0, 18.0, 13.0, 18.0, 11.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-57.13761901855469, -55.70052719116211, -54.26343536376953, -52.82634353637695, -51.389251708984375, -49.9521598815918, -48.51506805419922, -47.07797622680664, -45.64088439941406, -44.203792572021484, -42.766700744628906, -41.32960891723633, -39.89251708984375, -38.45542526245117, -37.018333435058594, -35.581241607666016, -34.14414978027344, -32.70705795288086, -31.26996612548828, -29.832874298095703, -28.395782470703125, -26.958690643310547, -25.52159881591797, -24.08450698852539, -22.647415161132812, -21.210323333740234, -19.773231506347656, -18.336139678955078, -16.8990478515625, -15.461956024169922, -14.024864196777344, -12.587772369384766, -11.150680541992188, -9.71358871459961, -8.276496887207031, -6.839405059814453, -5.402313232421875, -3.965221405029297, -2.5281295776367188, -1.0910377502441406, 0.3460540771484375, 1.7831459045410156, 3.2202377319335938, 4.657329559326172, 6.09442138671875, 7.531513214111328, 8.968605041503906, 10.405696868896484, 11.842788696289062, 13.27988052368164, 14.716972351074219, 16.154064178466797, 17.591156005859375, 19.028247833251953, 20.46533966064453, 21.90243148803711, 23.339523315429688, 24.776615142822266, 26.213706970214844, 27.650798797607422, 29.087890625, 30.524982452392578, 31.962074279785156, 33.399166107177734, 34.83625793457031]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 5.0, 11.0, 12.0, 15.0, 33.0, 32.0, 64.0, 78.0, 139.0, 226.0, 408.0, 813.0, 1567.0, 3395.0, 7340.0, 18487.0, 47728.0, 120080.0, 252779.0, 306068.0, 170344.0, 71385.0, 27563.0, 10951.0, 4665.0, 2077.0, 1055.0, 524.0, 269.0, 157.0, 104.0, 55.0, 37.0, 20.0, 14.0, 14.0, 10.0, 7.0, 9.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-20.71875, -20.1466064453125, -19.574462890625, -19.0023193359375, -18.43017578125, -17.8580322265625, -17.285888671875, -16.7137451171875, -16.1416015625, -15.5694580078125, -14.997314453125, -14.4251708984375, -13.85302734375, -13.2808837890625, -12.708740234375, -12.1365966796875, -11.564453125, -10.9923095703125, -10.420166015625, -9.8480224609375, -9.27587890625, -8.7037353515625, -8.131591796875, -7.5594482421875, -6.9873046875, -6.4151611328125, -5.843017578125, -5.2708740234375, -4.69873046875, -4.1265869140625, -3.554443359375, -2.9822998046875, -2.41015625, -1.8380126953125, -1.265869140625, -0.6937255859375, -0.12158203125, 0.4505615234375, 1.022705078125, 1.5948486328125, 2.1669921875, 2.7391357421875, 3.311279296875, 3.8834228515625, 4.45556640625, 5.0277099609375, 5.599853515625, 6.1719970703125, 6.744140625, 7.3162841796875, 7.888427734375, 8.4605712890625, 9.03271484375, 9.6048583984375, 10.177001953125, 10.7491455078125, 11.3212890625, 11.8934326171875, 12.465576171875, 13.0377197265625, 13.60986328125, 14.1820068359375, 14.754150390625, 15.3262939453125, 15.8984375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 0.0, 3.0, 9.0, 9.0, 12.0, 9.0, 19.0, 19.0, 17.0, 27.0, 22.0, 24.0, 30.0, 32.0, 38.0, 38.0, 53.0, 56.0, 46.0, 45.0, 42.0, 32.0, 42.0, 33.0, 42.0, 36.0, 42.0, 28.0, 38.0, 29.0, 23.0, 9.0, 20.0, 13.0, 18.0, 13.0, 5.0, 6.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.345703125, -2.2625732421875, -2.179443359375, -2.0963134765625, -2.01318359375, -1.9300537109375, -1.846923828125, -1.7637939453125, -1.6806640625, -1.5975341796875, -1.514404296875, -1.4312744140625, -1.34814453125, -1.2650146484375, -1.181884765625, -1.0987548828125, -1.015625, -0.9324951171875, -0.849365234375, -0.7662353515625, -0.68310546875, -0.5999755859375, -0.516845703125, -0.4337158203125, -0.3505859375, -0.2674560546875, -0.184326171875, -0.1011962890625, -0.01806640625, 0.0650634765625, 0.148193359375, 0.2313232421875, 0.314453125, 0.3975830078125, 0.480712890625, 0.5638427734375, 0.64697265625, 0.7301025390625, 0.813232421875, 0.8963623046875, 0.9794921875, 1.0626220703125, 1.145751953125, 1.2288818359375, 1.31201171875, 1.3951416015625, 1.478271484375, 1.5614013671875, 1.64453125, 1.7276611328125, 1.810791015625, 1.8939208984375, 1.97705078125, 2.0601806640625, 2.143310546875, 2.2264404296875, 2.3095703125, 2.3927001953125, 2.475830078125, 2.5589599609375, 2.64208984375, 2.7252197265625, 2.808349609375, 2.8914794921875, 2.974609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 11.0, 9.0, 8.0, 19.0, 27.0, 31.0, 44.0, 69.0, 75.0, 136.0, 172.0, 193.0, 304.0, 455.0, 631.0, 1106.0, 2261.0, 5325.0, 16657.0, 58467.0, 196333.0, 409294.0, 246134.0, 76359.0, 21660.0, 6691.0, 2625.0, 1192.0, 696.0, 453.0, 299.0, 231.0, 169.0, 119.0, 84.0, 69.0, 41.0, 32.0, 21.0, 17.0, 15.0, 5.0, 5.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.703125, -19.059326171875, -18.41552734375, -17.771728515625, -17.1279296875, -16.484130859375, -15.84033203125, -15.196533203125, -14.552734375, -13.908935546875, -13.26513671875, -12.621337890625, -11.9775390625, -11.333740234375, -10.68994140625, -10.046142578125, -9.40234375, -8.758544921875, -8.11474609375, -7.470947265625, -6.8271484375, -6.183349609375, -5.53955078125, -4.895751953125, -4.251953125, -3.608154296875, -2.96435546875, -2.320556640625, -1.6767578125, -1.032958984375, -0.38916015625, 0.254638671875, 0.8984375, 1.542236328125, 2.18603515625, 2.829833984375, 3.4736328125, 4.117431640625, 4.76123046875, 5.405029296875, 6.048828125, 6.692626953125, 7.33642578125, 7.980224609375, 8.6240234375, 9.267822265625, 9.91162109375, 10.555419921875, 11.19921875, 11.843017578125, 12.48681640625, 13.130615234375, 13.7744140625, 14.418212890625, 15.06201171875, 15.705810546875, 16.349609375, 16.993408203125, 17.63720703125, 18.281005859375, 18.9248046875, 19.568603515625, 20.21240234375, 20.856201171875, 21.5]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 6.0, 10.0, 11.0, 8.0, 11.0, 13.0, 19.0, 29.0, 19.0, 18.0, 42.0, 40.0, 28.0, 45.0, 40.0, 40.0, 40.0, 42.0, 46.0, 41.0, 55.0, 51.0, 50.0, 39.0, 32.0, 28.0, 27.0, 27.0, 18.0, 23.0, 16.0, 18.0, 14.0, 8.0, 6.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5, -12.0701904296875, -11.640380859375, -11.2105712890625, -10.78076171875, -10.3509521484375, -9.921142578125, -9.4913330078125, -9.0615234375, -8.6317138671875, -8.201904296875, -7.7720947265625, -7.34228515625, -6.9124755859375, -6.482666015625, -6.0528564453125, -5.623046875, -5.1932373046875, -4.763427734375, -4.3336181640625, -3.90380859375, -3.4739990234375, -3.044189453125, -2.6143798828125, -2.1845703125, -1.7547607421875, -1.324951171875, -0.8951416015625, -0.46533203125, -0.0355224609375, 0.394287109375, 0.8240966796875, 1.25390625, 1.6837158203125, 2.113525390625, 2.5433349609375, 2.97314453125, 3.4029541015625, 3.832763671875, 4.2625732421875, 4.6923828125, 5.1221923828125, 5.552001953125, 5.9818115234375, 6.41162109375, 6.8414306640625, 7.271240234375, 7.7010498046875, 8.130859375, 8.5606689453125, 8.990478515625, 9.4202880859375, 9.85009765625, 10.2799072265625, 10.709716796875, 11.1395263671875, 11.5693359375, 11.9991455078125, 12.428955078125, 12.8587646484375, 13.28857421875, 13.7183837890625, 14.148193359375, 14.5780029296875, 15.0078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 7.0, 7.0, 12.0, 11.0, 25.0, 37.0, 73.0, 93.0, 159.0, 329.0, 593.0, 1502.0, 4325.0, 17947.0, 172213.0, 725797.0, 106006.0, 13367.0, 3493.0, 1255.0, 577.0, 313.0, 173.0, 97.0, 58.0, 36.0, 19.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.4375, -21.618896484375, -20.80029296875, -19.981689453125, -19.1630859375, -18.344482421875, -17.52587890625, -16.707275390625, -15.888671875, -15.070068359375, -14.25146484375, -13.432861328125, -12.6142578125, -11.795654296875, -10.97705078125, -10.158447265625, -9.33984375, -8.521240234375, -7.70263671875, -6.884033203125, -6.0654296875, -5.246826171875, -4.42822265625, -3.609619140625, -2.791015625, -1.972412109375, -1.15380859375, -0.335205078125, 0.4833984375, 1.302001953125, 2.12060546875, 2.939208984375, 3.7578125, 4.576416015625, 5.39501953125, 6.213623046875, 7.0322265625, 7.850830078125, 8.66943359375, 9.488037109375, 10.306640625, 11.125244140625, 11.94384765625, 12.762451171875, 13.5810546875, 14.399658203125, 15.21826171875, 16.036865234375, 16.85546875, 17.674072265625, 18.49267578125, 19.311279296875, 20.1298828125, 20.948486328125, 21.76708984375, 22.585693359375, 23.404296875, 24.222900390625, 25.04150390625, 25.860107421875, 26.6787109375, 27.497314453125, 28.31591796875, 29.134521484375, 29.953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 9.0, 8.0, 9.0, 17.0, 17.0, 29.0, 25.0, 33.0, 42.0, 43.0, 84.0, 85.0, 95.0, 114.0, 82.0, 61.0, 46.0, 48.0, 32.0, 20.0, 25.0, 19.0, 11.0, 5.0, 1.0, 11.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014190673828125, -0.0013680458068847656, -0.0013170242309570312, -0.0012660026550292969, -0.0012149810791015625, -0.0011639595031738281, -0.0011129379272460938, -0.0010619163513183594, -0.001010894775390625, -0.0009598731994628906, -0.0009088516235351562, -0.0008578300476074219, -0.0008068084716796875, -0.0007557868957519531, -0.0007047653198242188, -0.0006537437438964844, -0.00060272216796875, -0.0005517005920410156, -0.0005006790161132812, -0.0004496574401855469, -0.0003986358642578125, -0.0003476142883300781, -0.00029659271240234375, -0.0002455711364746094, -0.000194549560546875, -0.00014352798461914062, -9.250640869140625e-05, -4.1484832763671875e-05, 9.5367431640625e-06, 6.0558319091796875e-05, 0.00011157989501953125, 0.00016260147094726562, 0.000213623046875, 0.0002646446228027344, 0.00031566619873046875, 0.0003666877746582031, 0.0004177093505859375, 0.0004687309265136719, 0.0005197525024414062, 0.0005707740783691406, 0.000621795654296875, 0.0006728172302246094, 0.0007238388061523438, 0.0007748603820800781, 0.0008258819580078125, 0.0008769035339355469, 0.0009279251098632812, 0.0009789466857910156, 0.00102996826171875, 0.0010809898376464844, 0.0011320114135742188, 0.0011830329895019531, 0.0012340545654296875, 0.0012850761413574219, 0.0013360977172851562, 0.0013871192932128906, 0.001438140869140625, 0.0014891624450683594, 0.0015401840209960938, 0.0015912055969238281, 0.0016422271728515625, 0.0016932487487792969, 0.0017442703247070312, 0.0017952919006347656, 0.0018463134765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 3.0, 5.0, 8.0, 6.0, 5.0, 16.0, 22.0, 32.0, 58.0, 103.0, 184.0, 378.0, 855.0, 2815.0, 14848.0, 222504.0, 751103.0, 46721.0, 6180.0, 1504.0, 600.0, 275.0, 125.0, 74.0, 52.0, 29.0, 16.0, 9.0, 8.0, 2.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-48.40625, -47.260498046875, -46.11474609375, -44.968994140625, -43.8232421875, -42.677490234375, -41.53173828125, -40.385986328125, -39.240234375, -38.094482421875, -36.94873046875, -35.802978515625, -34.6572265625, -33.511474609375, -32.36572265625, -31.219970703125, -30.07421875, -28.928466796875, -27.78271484375, -26.636962890625, -25.4912109375, -24.345458984375, -23.19970703125, -22.053955078125, -20.908203125, -19.762451171875, -18.61669921875, -17.470947265625, -16.3251953125, -15.179443359375, -14.03369140625, -12.887939453125, -11.7421875, -10.596435546875, -9.45068359375, -8.304931640625, -7.1591796875, -6.013427734375, -4.86767578125, -3.721923828125, -2.576171875, -1.430419921875, -0.28466796875, 0.861083984375, 2.0068359375, 3.152587890625, 4.29833984375, 5.444091796875, 6.58984375, 7.735595703125, 8.88134765625, 10.027099609375, 11.1728515625, 12.318603515625, 13.46435546875, 14.610107421875, 15.755859375, 16.901611328125, 18.04736328125, 19.193115234375, 20.3388671875, 21.484619140625, 22.63037109375, 23.776123046875, 24.921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 12.0, 11.0, 11.0, 12.0, 33.0, 43.0, 61.0, 75.0, 81.0, 113.0, 101.0, 105.0, 91.0, 62.0, 53.0, 37.0, 20.0, 18.0, 17.0, 15.0, 5.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -8.874267578125, -8.43603515625, -7.997802734375, -7.5595703125, -7.121337890625, -6.68310546875, -6.244873046875, -5.806640625, -5.368408203125, -4.93017578125, -4.491943359375, -4.0537109375, -3.615478515625, -3.17724609375, -2.739013671875, -2.30078125, -1.862548828125, -1.42431640625, -0.986083984375, -0.5478515625, -0.109619140625, 0.32861328125, 0.766845703125, 1.205078125, 1.643310546875, 2.08154296875, 2.519775390625, 2.9580078125, 3.396240234375, 3.83447265625, 4.272705078125, 4.7109375, 5.149169921875, 5.58740234375, 6.025634765625, 6.4638671875, 6.902099609375, 7.34033203125, 7.778564453125, 8.216796875, 8.655029296875, 9.09326171875, 9.531494140625, 9.9697265625, 10.407958984375, 10.84619140625, 11.284423828125, 11.72265625, 12.160888671875, 12.59912109375, 13.037353515625, 13.4755859375, 13.913818359375, 14.35205078125, 14.790283203125, 15.228515625, 15.666748046875, 16.10498046875, 16.543212890625, 16.9814453125, 17.419677734375, 17.85791015625, 18.296142578125, 18.734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 11.0, 22.0, 32.0, 64.0, 99.0, 142.0, 158.0, 159.0, 120.0, 84.0, 47.0, 30.0, 17.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.94647216796875, -160.3875274658203, -154.82859802246094, -149.2696533203125, -143.71072387695312, -138.1517791748047, -132.59283447265625, -127.03389739990234, -121.47496032714844, -115.91602325439453, -110.35708618164062, -104.79814147949219, -99.23920440673828, -93.68026733398438, -88.12132263183594, -82.56238555908203, -77.00344848632812, -71.44451141357422, -65.88557434082031, -60.326629638671875, -54.76769256591797, -49.20875549316406, -43.64981460571289, -38.09087371826172, -32.53193664550781, -26.972997665405273, -21.414058685302734, -15.855119705200195, -10.296180725097656, -4.737241744995117, 0.8216972351074219, 6.380638122558594, 11.9395751953125, 17.49851417541504, 23.057453155517578, 28.616392135620117, 34.175331115722656, 39.73426818847656, 45.293209075927734, 50.852149963378906, 56.41108703613281, 61.97002410888672, 67.52896118164062, 73.08790588378906, 78.64684295654297, 84.20578002929688, 89.76472473144531, 95.32366180419922, 100.88259887695312, 106.44153594970703, 112.00047302246094, 117.55941772460938, 123.11835479736328, 128.6772918701172, 134.23623657226562, 139.795166015625, 145.35411071777344, 150.91305541992188, 156.47198486328125, 162.0309295654297, 167.58987426757812, 173.1488037109375, 178.70774841308594, 184.26669311523438, 189.82562255859375]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 7.0, 4.0, 9.0, 9.0, 11.0, 17.0, 18.0, 27.0, 35.0, 30.0, 27.0, 45.0, 38.0, 41.0, 34.0, 38.0, 52.0, 44.0, 41.0, 53.0, 51.0, 40.0, 40.0, 38.0, 45.0, 22.0, 20.0, 28.0, 31.0, 17.0, 14.0, 11.0, 13.0, 5.0, 7.0, 4.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.92521667480469, -88.2435302734375, -85.56185150146484, -82.88017272949219, -80.198486328125, -77.51679992675781, -74.83512115478516, -72.1534423828125, -69.47175598144531, -66.79006958007812, -64.10839080810547, -61.42670822143555, -58.745025634765625, -56.0633430480957, -53.38166046142578, -50.69997787475586, -48.01829528808594, -45.336612701416016, -42.654930114746094, -39.97324752807617, -37.29156494140625, -34.60988235473633, -31.928199768066406, -29.246517181396484, -26.564834594726562, -23.88315200805664, -21.20146942138672, -18.519786834716797, -15.838104248046875, -13.156421661376953, -10.474739074707031, -7.793056488037109, -5.111366271972656, -2.4296836853027344, 0.2519989013671875, 2.9336814880371094, 5.615364074707031, 8.297046661376953, 10.978729248046875, 13.660411834716797, 16.34209442138672, 19.02377700805664, 21.705459594726562, 24.387142181396484, 27.068824768066406, 29.750507354736328, 32.43218994140625, 35.11387252807617, 37.795555114746094, 40.477237701416016, 43.15892028808594, 45.84060287475586, 48.52228546142578, 51.2039680480957, 53.885650634765625, 56.56733322143555, 59.24901580810547, 61.93069839477539, 64.61238098144531, 67.2940673828125, 69.97574615478516, 72.65742492675781, 75.339111328125, 78.02079772949219, 80.70247650146484]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 10.0, 15.0, 20.0, 32.0, 67.0, 103.0, 200.0, 504.0, 1018.0, 2261.0, 5891.0, 17608.0, 70589.0, 730587.0, 3214596.0, 111527.0, 25110.0, 8064.0, 3359.0, 1385.0, 665.0, 330.0, 159.0, 77.0, 44.0, 22.0, 15.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.03125, -38.033935546875, -37.03662109375, -36.039306640625, -35.0419921875, -34.044677734375, -33.04736328125, -32.050048828125, -31.052734375, -30.055419921875, -29.05810546875, -28.060791015625, -27.0634765625, -26.066162109375, -25.06884765625, -24.071533203125, -23.07421875, -22.076904296875, -21.07958984375, -20.082275390625, -19.0849609375, -18.087646484375, -17.09033203125, -16.093017578125, -15.095703125, -14.098388671875, -13.10107421875, -12.103759765625, -11.1064453125, -10.109130859375, -9.11181640625, -8.114501953125, -7.1171875, -6.119873046875, -5.12255859375, -4.125244140625, -3.1279296875, -2.130615234375, -1.13330078125, -0.135986328125, 0.861328125, 1.858642578125, 2.85595703125, 3.853271484375, 4.8505859375, 5.847900390625, 6.84521484375, 7.842529296875, 8.83984375, 9.837158203125, 10.83447265625, 11.831787109375, 12.8291015625, 13.826416015625, 14.82373046875, 15.821044921875, 16.818359375, 17.815673828125, 18.81298828125, 19.810302734375, 20.8076171875, 21.804931640625, 22.80224609375, 23.799560546875, 24.796875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 10.0, 4.0, 15.0, 16.0, 25.0, 31.0, 28.0, 36.0, 31.0, 44.0, 51.0, 46.0, 60.0, 42.0, 47.0, 48.0, 58.0, 55.0, 46.0, 42.0, 35.0, 43.0, 26.0, 26.0, 27.0, 20.0, 13.0, 9.0, 10.0, 13.0, 4.0, 8.0, 8.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.177734375, -3.081695556640625, -2.98565673828125, -2.889617919921875, -2.7935791015625, -2.697540283203125, -2.60150146484375, -2.505462646484375, -2.409423828125, -2.313385009765625, -2.21734619140625, -2.121307373046875, -2.0252685546875, -1.929229736328125, -1.83319091796875, -1.737152099609375, -1.64111328125, -1.545074462890625, -1.44903564453125, -1.352996826171875, -1.2569580078125, -1.160919189453125, -1.06488037109375, -0.968841552734375, -0.872802734375, -0.776763916015625, -0.68072509765625, -0.584686279296875, -0.4886474609375, -0.392608642578125, -0.29656982421875, -0.200531005859375, -0.1044921875, -0.008453369140625, 0.08758544921875, 0.183624267578125, 0.2796630859375, 0.375701904296875, 0.47174072265625, 0.567779541015625, 0.663818359375, 0.759857177734375, 0.85589599609375, 0.951934814453125, 1.0479736328125, 1.144012451171875, 1.24005126953125, 1.336090087890625, 1.43212890625, 1.528167724609375, 1.62420654296875, 1.720245361328125, 1.8162841796875, 1.912322998046875, 2.00836181640625, 2.104400634765625, 2.200439453125, 2.296478271484375, 2.39251708984375, 2.488555908203125, 2.5845947265625, 2.680633544921875, 2.77667236328125, 2.872711181640625, 2.96875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 6.0, 2.0, 6.0, 10.0, 8.0, 12.0, 15.0, 15.0, 26.0, 33.0, 55.0, 86.0, 132.0, 215.0, 365.0, 592.0, 1204.0, 2277.0, 4653.0, 10766.0, 27214.0, 77887.0, 277390.0, 2438005.0, 1068519.0, 190012.0, 57828.0, 20613.0, 8569.0, 3807.0, 1781.0, 940.0, 501.0, 319.0, 150.0, 92.0, 65.0, 38.0, 27.0, 20.0, 16.0, 4.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.171875, -15.591552734375, -15.01123046875, -14.430908203125, -13.8505859375, -13.270263671875, -12.68994140625, -12.109619140625, -11.529296875, -10.948974609375, -10.36865234375, -9.788330078125, -9.2080078125, -8.627685546875, -8.04736328125, -7.467041015625, -6.88671875, -6.306396484375, -5.72607421875, -5.145751953125, -4.5654296875, -3.985107421875, -3.40478515625, -2.824462890625, -2.244140625, -1.663818359375, -1.08349609375, -0.503173828125, 0.0771484375, 0.657470703125, 1.23779296875, 1.818115234375, 2.3984375, 2.978759765625, 3.55908203125, 4.139404296875, 4.7197265625, 5.300048828125, 5.88037109375, 6.460693359375, 7.041015625, 7.621337890625, 8.20166015625, 8.781982421875, 9.3623046875, 9.942626953125, 10.52294921875, 11.103271484375, 11.68359375, 12.263916015625, 12.84423828125, 13.424560546875, 14.0048828125, 14.585205078125, 15.16552734375, 15.745849609375, 16.326171875, 16.906494140625, 17.48681640625, 18.067138671875, 18.6474609375, 19.227783203125, 19.80810546875, 20.388427734375, 20.96875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 5.0, 11.0, 3.0, 11.0, 12.0, 17.0, 27.0, 47.0, 70.0, 75.0, 86.0, 110.0, 162.0, 274.0, 438.0, 1137.0, 580.0, 307.0, 185.0, 129.0, 81.0, 80.0, 58.0, 40.0, 28.0, 19.0, 19.0, 10.0, 13.0, 6.0, 7.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.4921875, -5.32904052734375, -5.1658935546875, -5.00274658203125, -4.839599609375, -4.67645263671875, -4.5133056640625, -4.35015869140625, -4.18701171875, -4.02386474609375, -3.8607177734375, -3.69757080078125, -3.534423828125, -3.37127685546875, -3.2081298828125, -3.04498291015625, -2.8818359375, -2.71868896484375, -2.5555419921875, -2.39239501953125, -2.229248046875, -2.06610107421875, -1.9029541015625, -1.73980712890625, -1.57666015625, -1.41351318359375, -1.2503662109375, -1.08721923828125, -0.924072265625, -0.76092529296875, -0.5977783203125, -0.43463134765625, -0.271484375, -0.10833740234375, 0.0548095703125, 0.21795654296875, 0.381103515625, 0.54425048828125, 0.7073974609375, 0.87054443359375, 1.03369140625, 1.19683837890625, 1.3599853515625, 1.52313232421875, 1.686279296875, 1.84942626953125, 2.0125732421875, 2.17572021484375, 2.3388671875, 2.50201416015625, 2.6651611328125, 2.82830810546875, 2.991455078125, 3.15460205078125, 3.3177490234375, 3.48089599609375, 3.64404296875, 3.80718994140625, 3.9703369140625, 4.13348388671875, 4.296630859375, 4.45977783203125, 4.6229248046875, 4.78607177734375, 4.94921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 9.0, 21.0, 30.0, 48.0, 100.0, 111.0, 145.0, 165.0, 158.0, 84.0, 59.0, 34.0, 21.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-92.56082153320312, -90.71758270263672, -88.87434387207031, -87.03111267089844, -85.18787384033203, -83.34463500976562, -81.50139617919922, -79.65815734863281, -77.8149185180664, -75.9716796875, -74.1284408569336, -72.28520202636719, -70.44197082519531, -68.5987319946289, -66.7554931640625, -64.9122543334961, -63.06901931762695, -61.22578048706055, -59.382545471191406, -57.539306640625, -55.696067810058594, -53.85282897949219, -52.00959396362305, -50.16635513305664, -48.3231201171875, -46.479881286621094, -44.63664627075195, -42.79340744018555, -40.95016860961914, -39.10693359375, -37.263694763183594, -35.42045593261719, -33.57721710205078, -31.733980178833008, -29.8907413482666, -28.047504425048828, -26.204265594482422, -24.36102867126465, -22.517791748046875, -20.67455291748047, -18.831315994262695, -16.988079071044922, -15.144840240478516, -13.301603317260742, -11.458365440368652, -9.615127563476562, -7.771890640258789, -5.928652763366699, -4.085414886474609, -2.2421772480010986, -0.3989396095275879, 1.4442977905273438, 3.2875356674194336, 5.130773544311523, 6.974010467529297, 8.817248344421387, 10.660486221313477, 12.503724098205566, 14.346961975097656, 16.19019889831543, 18.033435821533203, 19.87667465209961, 21.719911575317383, 23.563148498535156, 25.406387329101562]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 5.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 13.0, 17.0, 14.0, 16.0, 11.0, 23.0, 28.0, 29.0, 28.0, 35.0, 35.0, 29.0, 37.0, 54.0, 38.0, 43.0, 43.0, 46.0, 38.0, 36.0, 32.0, 40.0, 40.0, 48.0, 32.0, 26.0, 39.0, 20.0, 12.0, 16.0, 11.0, 8.0, 4.0, 11.0, 8.0, 5.0, 7.0, 4.0, 0.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.20660400390625, -21.53872299194336, -20.870840072631836, -20.202959060668945, -19.535078048706055, -18.86719512939453, -18.19931411743164, -17.53143310546875, -16.863550186157227, -16.195669174194336, -15.527787208557129, -14.859905242919922, -14.192023277282715, -13.524141311645508, -12.856260299682617, -12.18837833404541, -11.52049732208252, -10.852615356445312, -10.184734344482422, -9.516852378845215, -8.848970413208008, -8.181089401245117, -7.51320743560791, -6.845325469970703, -6.177443981170654, -5.5095624923706055, -4.841680526733398, -4.17379903793335, -3.5059173107147217, -2.8380355834960938, -2.170154094696045, -1.502272129058838, -0.8343906402587891, -0.1665089726448059, 0.5013726949691772, 1.1692543029785156, 1.8371360301971436, 2.5050177574157715, 3.1728992462158203, 3.8407812118530273, 4.508662700653076, 5.176544189453125, 5.844426155090332, 6.512307643890381, 7.18018913269043, 7.848071098327637, 8.515953063964844, 9.183834075927734, 9.851716041564941, 10.519598007202148, 11.187479019165039, 11.855360984802246, 12.523242950439453, 13.191123962402344, 13.85900592803955, 14.526887893676758, 15.194768905639648, 15.862650871276855, 16.530532836914062, 17.198413848876953, 17.866294860839844, 18.534177780151367, 19.202058792114258, 19.86994171142578, 20.537822723388672]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 12.0, 19.0, 26.0, 33.0, 52.0, 109.0, 151.0, 276.0, 467.0, 844.0, 1494.0, 2945.0, 5712.0, 12337.0, 27901.0, 63312.0, 138802.0, 252186.0, 261544.0, 152215.0, 70477.0, 30570.0, 13598.0, 6409.0, 3223.0, 1620.0, 880.0, 507.0, 317.0, 171.0, 132.0, 73.0, 40.0, 25.0, 18.0, 23.0, 3.0, 6.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-16.40625, -15.9752197265625, -15.544189453125, -15.1131591796875, -14.68212890625, -14.2510986328125, -13.820068359375, -13.3890380859375, -12.9580078125, -12.5269775390625, -12.095947265625, -11.6649169921875, -11.23388671875, -10.8028564453125, -10.371826171875, -9.9407958984375, -9.509765625, -9.0787353515625, -8.647705078125, -8.2166748046875, -7.78564453125, -7.3546142578125, -6.923583984375, -6.4925537109375, -6.0615234375, -5.6304931640625, -5.199462890625, -4.7684326171875, -4.33740234375, -3.9063720703125, -3.475341796875, -3.0443115234375, -2.61328125, -2.1822509765625, -1.751220703125, -1.3201904296875, -0.88916015625, -0.4581298828125, -0.027099609375, 0.4039306640625, 0.8349609375, 1.2659912109375, 1.697021484375, 2.1280517578125, 2.55908203125, 2.9901123046875, 3.421142578125, 3.8521728515625, 4.283203125, 4.7142333984375, 5.145263671875, 5.5762939453125, 6.00732421875, 6.4383544921875, 6.869384765625, 7.3004150390625, 7.7314453125, 8.1624755859375, 8.593505859375, 9.0245361328125, 9.45556640625, 9.8865966796875, 10.317626953125, 10.7486572265625, 11.1796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 6.0, 7.0, 7.0, 16.0, 13.0, 20.0, 33.0, 25.0, 24.0, 31.0, 35.0, 46.0, 39.0, 48.0, 59.0, 48.0, 47.0, 53.0, 51.0, 38.0, 46.0, 45.0, 37.0, 35.0, 30.0, 26.0, 20.0, 15.0, 17.0, 18.0, 21.0, 8.0, 8.0, 2.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.62109375, -2.52734375, -2.43359375, -2.33984375, -2.24609375, -2.15234375, -2.05859375, -1.96484375, -1.87109375, -1.77734375, -1.68359375, -1.58984375, -1.49609375, -1.40234375, -1.30859375, -1.21484375, -1.12109375, -1.02734375, -0.93359375, -0.83984375, -0.74609375, -0.65234375, -0.55859375, -0.46484375, -0.37109375, -0.27734375, -0.18359375, -0.08984375, 0.00390625, 0.09765625, 0.19140625, 0.28515625, 0.37890625, 0.47265625, 0.56640625, 0.66015625, 0.75390625, 0.84765625, 0.94140625, 1.03515625, 1.12890625, 1.22265625, 1.31640625, 1.41015625, 1.50390625, 1.59765625, 1.69140625, 1.78515625, 1.87890625, 1.97265625, 2.06640625, 2.16015625, 2.25390625, 2.34765625, 2.44140625, 2.53515625, 2.62890625, 2.72265625, 2.81640625, 2.91015625, 3.00390625, 3.09765625, 3.19140625, 3.28515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 11.0, 7.0, 17.0, 11.0, 16.0, 36.0, 40.0, 60.0, 76.0, 118.0, 131.0, 181.0, 247.0, 351.0, 517.0, 817.0, 1472.0, 3274.0, 8241.0, 24338.0, 79119.0, 240144.0, 387550.0, 202691.0, 65343.0, 20237.0, 6950.0, 2751.0, 1350.0, 754.0, 484.0, 328.0, 227.0, 165.0, 134.0, 103.0, 62.0, 52.0, 40.0, 26.0, 17.0, 19.0, 12.0, 10.0, 5.0, 11.0, 2.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.03125, -16.505859375, -15.98046875, -15.455078125, -14.9296875, -14.404296875, -13.87890625, -13.353515625, -12.828125, -12.302734375, -11.77734375, -11.251953125, -10.7265625, -10.201171875, -9.67578125, -9.150390625, -8.625, -8.099609375, -7.57421875, -7.048828125, -6.5234375, -5.998046875, -5.47265625, -4.947265625, -4.421875, -3.896484375, -3.37109375, -2.845703125, -2.3203125, -1.794921875, -1.26953125, -0.744140625, -0.21875, 0.306640625, 0.83203125, 1.357421875, 1.8828125, 2.408203125, 2.93359375, 3.458984375, 3.984375, 4.509765625, 5.03515625, 5.560546875, 6.0859375, 6.611328125, 7.13671875, 7.662109375, 8.1875, 8.712890625, 9.23828125, 9.763671875, 10.2890625, 10.814453125, 11.33984375, 11.865234375, 12.390625, 12.916015625, 13.44140625, 13.966796875, 14.4921875, 15.017578125, 15.54296875, 16.068359375, 16.59375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 9.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 9.0, 21.0, 11.0, 18.0, 13.0, 26.0, 23.0, 19.0, 27.0, 24.0, 30.0, 46.0, 39.0, 32.0, 43.0, 36.0, 32.0, 44.0, 38.0, 33.0, 54.0, 39.0, 36.0, 39.0, 26.0, 32.0, 26.0, 33.0, 24.0, 14.0, 15.0, 13.0, 14.0, 13.0, 9.0, 9.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.6328125, -13.2420654296875, -12.851318359375, -12.4605712890625, -12.06982421875, -11.6790771484375, -11.288330078125, -10.8975830078125, -10.5068359375, -10.1160888671875, -9.725341796875, -9.3345947265625, -8.94384765625, -8.5531005859375, -8.162353515625, -7.7716064453125, -7.380859375, -6.9901123046875, -6.599365234375, -6.2086181640625, -5.81787109375, -5.4271240234375, -5.036376953125, -4.6456298828125, -4.2548828125, -3.8641357421875, -3.473388671875, -3.0826416015625, -2.69189453125, -2.3011474609375, -1.910400390625, -1.5196533203125, -1.12890625, -0.7381591796875, -0.347412109375, 0.0433349609375, 0.43408203125, 0.8248291015625, 1.215576171875, 1.6063232421875, 1.9970703125, 2.3878173828125, 2.778564453125, 3.1693115234375, 3.56005859375, 3.9508056640625, 4.341552734375, 4.7322998046875, 5.123046875, 5.5137939453125, 5.904541015625, 6.2952880859375, 6.68603515625, 7.0767822265625, 7.467529296875, 7.8582763671875, 8.2490234375, 8.6397705078125, 9.030517578125, 9.4212646484375, 9.81201171875, 10.2027587890625, 10.593505859375, 10.9842529296875, 11.375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 5.0, 3.0, 8.0, 16.0, 11.0, 11.0, 34.0, 47.0, 63.0, 84.0, 147.0, 229.0, 408.0, 704.0, 1397.0, 2943.0, 6942.0, 19973.0, 75340.0, 313443.0, 443586.0, 132638.0, 32367.0, 10162.0, 4029.0, 1762.0, 929.0, 494.0, 279.0, 169.0, 95.0, 66.0, 59.0, 37.0, 23.0, 18.0, 8.0, 10.0, 6.0, 2.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5, -10.173828125, -9.84765625, -9.521484375, -9.1953125, -8.869140625, -8.54296875, -8.216796875, -7.890625, -7.564453125, -7.23828125, -6.912109375, -6.5859375, -6.259765625, -5.93359375, -5.607421875, -5.28125, -4.955078125, -4.62890625, -4.302734375, -3.9765625, -3.650390625, -3.32421875, -2.998046875, -2.671875, -2.345703125, -2.01953125, -1.693359375, -1.3671875, -1.041015625, -0.71484375, -0.388671875, -0.0625, 0.263671875, 0.58984375, 0.916015625, 1.2421875, 1.568359375, 1.89453125, 2.220703125, 2.546875, 2.873046875, 3.19921875, 3.525390625, 3.8515625, 4.177734375, 4.50390625, 4.830078125, 5.15625, 5.482421875, 5.80859375, 6.134765625, 6.4609375, 6.787109375, 7.11328125, 7.439453125, 7.765625, 8.091796875, 8.41796875, 8.744140625, 9.0703125, 9.396484375, 9.72265625, 10.048828125, 10.375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 2.0, 11.0, 13.0, 14.0, 26.0, 32.0, 64.0, 90.0, 101.0, 145.0, 161.0, 106.0, 83.0, 47.0, 39.0, 24.0, 7.0, 7.0, 8.0, 6.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002864837646484375, -0.002793237566947937, -0.002721637487411499, -0.002650037407875061, -0.002578437328338623, -0.002506837248802185, -0.002435237169265747, -0.002363637089729309, -0.002292037010192871, -0.002220436930656433, -0.002148836851119995, -0.002077236771583557, -0.002005636692047119, -0.0019340366125106812, -0.0018624365329742432, -0.0017908364534378052, -0.0017192363739013672, -0.0016476362943649292, -0.0015760362148284912, -0.0015044361352920532, -0.0014328360557556152, -0.0013612359762191772, -0.0012896358966827393, -0.0012180358171463013, -0.0011464357376098633, -0.0010748356580734253, -0.0010032355785369873, -0.0009316354990005493, -0.0008600354194641113, -0.0007884353399276733, -0.0007168352603912354, -0.0006452351808547974, -0.0005736351013183594, -0.0005020350217819214, -0.0004304349422454834, -0.0003588348627090454, -0.0002872347831726074, -0.00021563470363616943, -0.00014403462409973145, -7.243454456329346e-05, -8.344650268554688e-07, 7.076561450958252e-05, 0.0001423656940460205, 0.0002139657735824585, 0.0002855658531188965, 0.00035716593265533447, 0.00042876601219177246, 0.0005003660917282104, 0.0005719661712646484, 0.0006435662508010864, 0.0007151663303375244, 0.0007867664098739624, 0.0008583664894104004, 0.0009299665689468384, 0.0010015666484832764, 0.0010731667280197144, 0.0011447668075561523, 0.0012163668870925903, 0.0012879669666290283, 0.0013595670461654663, 0.0014311671257019043, 0.0015027672052383423, 0.0015743672847747803, 0.0016459673643112183, 0.0017175674438476562]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 14.0, 12.0, 9.0, 20.0, 31.0, 50.0, 58.0, 100.0, 160.0, 266.0, 464.0, 880.0, 2031.0, 4737.0, 14952.0, 68718.0, 385709.0, 454937.0, 87472.0, 18147.0, 5442.0, 2087.0, 1001.0, 487.0, 246.0, 176.0, 90.0, 73.0, 45.0, 40.0, 23.0, 21.0, 11.0, 6.0, 5.0, 5.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.59375, -12.1749267578125, -11.756103515625, -11.3372802734375, -10.91845703125, -10.4996337890625, -10.080810546875, -9.6619873046875, -9.2431640625, -8.8243408203125, -8.405517578125, -7.9866943359375, -7.56787109375, -7.1490478515625, -6.730224609375, -6.3114013671875, -5.892578125, -5.4737548828125, -5.054931640625, -4.6361083984375, -4.21728515625, -3.7984619140625, -3.379638671875, -2.9608154296875, -2.5419921875, -2.1231689453125, -1.704345703125, -1.2855224609375, -0.86669921875, -0.4478759765625, -0.029052734375, 0.3897705078125, 0.80859375, 1.2274169921875, 1.646240234375, 2.0650634765625, 2.48388671875, 2.9027099609375, 3.321533203125, 3.7403564453125, 4.1591796875, 4.5780029296875, 4.996826171875, 5.4156494140625, 5.83447265625, 6.2532958984375, 6.672119140625, 7.0909423828125, 7.509765625, 7.9285888671875, 8.347412109375, 8.7662353515625, 9.18505859375, 9.6038818359375, 10.022705078125, 10.4415283203125, 10.8603515625, 11.2791748046875, 11.697998046875, 12.1168212890625, 12.53564453125, 12.9544677734375, 13.373291015625, 13.7921142578125, 14.2109375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 9.0, 2.0, 5.0, 5.0, 10.0, 7.0, 14.0, 13.0, 17.0, 15.0, 24.0, 29.0, 31.0, 34.0, 44.0, 49.0, 56.0, 84.0, 67.0, 66.0, 71.0, 64.0, 49.0, 33.0, 34.0, 30.0, 25.0, 22.0, 17.0, 12.0, 8.0, 12.0, 9.0, 7.0, 5.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-7.01953125, -6.838134765625, -6.65673828125, -6.475341796875, -6.2939453125, -6.112548828125, -5.93115234375, -5.749755859375, -5.568359375, -5.386962890625, -5.20556640625, -5.024169921875, -4.8427734375, -4.661376953125, -4.47998046875, -4.298583984375, -4.1171875, -3.935791015625, -3.75439453125, -3.572998046875, -3.3916015625, -3.210205078125, -3.02880859375, -2.847412109375, -2.666015625, -2.484619140625, -2.30322265625, -2.121826171875, -1.9404296875, -1.759033203125, -1.57763671875, -1.396240234375, -1.21484375, -1.033447265625, -0.85205078125, -0.670654296875, -0.4892578125, -0.307861328125, -0.12646484375, 0.054931640625, 0.236328125, 0.417724609375, 0.59912109375, 0.780517578125, 0.9619140625, 1.143310546875, 1.32470703125, 1.506103515625, 1.6875, 1.868896484375, 2.05029296875, 2.231689453125, 2.4130859375, 2.594482421875, 2.77587890625, 2.957275390625, 3.138671875, 3.320068359375, 3.50146484375, 3.682861328125, 3.8642578125, 4.045654296875, 4.22705078125, 4.408447265625, 4.58984375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 23.0, 28.0, 74.0, 109.0, 181.0, 190.0, 167.0, 121.0, 67.0, 17.0, 8.0, 8.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-231.29701232910156, -225.31338500976562, -219.32974243164062, -213.34609985351562, -207.3624725341797, -201.37884521484375, -195.39520263671875, -189.41156005859375, -183.4279327392578, -177.44430541992188, -171.46066284179688, -165.47702026367188, -159.49339294433594, -153.509765625, -147.526123046875, -141.54248046875, -135.55885314941406, -129.57522583007812, -123.59158325195312, -117.60794830322266, -111.62431335449219, -105.64067840576172, -99.65704345703125, -93.67340850830078, -87.68977355957031, -81.70613861083984, -75.72250366210938, -69.7388687133789, -63.75523376464844, -57.77159881591797, -51.7879638671875, -45.80432891845703, -39.8206787109375, -33.83704376220703, -27.853408813476562, -21.869773864746094, -15.886138916015625, -9.902503967285156, -3.9188690185546875, 2.0647659301757812, 8.04840087890625, 14.032035827636719, 20.015670776367188, 25.999305725097656, 31.982940673828125, 37.966575622558594, 43.95021057128906, 49.93384552001953, 55.91748046875, 61.90111541748047, 67.88475036621094, 73.8683853149414, 79.85202026367188, 85.83565521240234, 91.81929016113281, 97.80292510986328, 103.78656005859375, 109.77019500732422, 115.75382995605469, 121.73746490478516, 127.72109985351562, 133.70474243164062, 139.68836975097656, 145.6719970703125, 151.6556396484375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 8.0, 8.0, 8.0, 11.0, 20.0, 23.0, 23.0, 32.0, 28.0, 36.0, 51.0, 52.0, 49.0, 41.0, 54.0, 46.0, 54.0, 56.0, 52.0, 47.0, 43.0, 31.0, 37.0, 30.0, 29.0, 24.0, 23.0, 20.0, 12.0, 12.0, 13.0, 5.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.86239624023438, -75.18463897705078, -72.50687408447266, -69.82911682128906, -67.15135955810547, -64.47359466552734, -61.79583740234375, -59.11807632446289, -56.44031524658203, -53.76255416870117, -51.08479690551758, -48.40703582763672, -45.72927474975586, -43.051513671875, -40.373756408691406, -37.69599533081055, -35.01823806762695, -32.340476989746094, -29.662717819213867, -26.98495864868164, -24.30719757080078, -21.629438400268555, -18.951679229736328, -16.27391815185547, -13.596158981323242, -10.9183988571167, -8.240638732910156, -5.56287956237793, -2.8851194381713867, -0.20735931396484375, 2.470399856567383, 5.148160934448242, 7.825920104980469, 10.503680229187012, 13.181440353393555, 15.859199523925781, 18.53696060180664, 21.214719772338867, 23.892478942871094, 26.570240020751953, 29.24799919128418, 31.925758361816406, 34.603519439697266, 37.281280517578125, 39.95903778076172, 42.63679885864258, 45.31455993652344, 47.99231719970703, 50.67007827758789, 53.34783935546875, 56.025596618652344, 58.7033576965332, 61.38111877441406, 64.05887603759766, 66.73663330078125, 69.41439819335938, 72.09215545654297, 74.76991271972656, 77.44767761230469, 80.12543487548828, 82.80319213867188, 85.48095703125, 88.1587142944336, 90.83647155761719, 93.51423645019531]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 11.0, 11.0, 14.0, 24.0, 42.0, 58.0, 86.0, 118.0, 232.0, 326.0, 559.0, 988.0, 1790.0, 3384.0, 6574.0, 13549.0, 31488.0, 83918.0, 296046.0, 2758383.0, 750726.0, 152539.0, 51578.0, 20496.0, 9777.0, 4941.0, 2696.0, 1533.0, 854.0, 528.0, 352.0, 211.0, 147.0, 79.0, 63.0, 48.0, 34.0, 23.0, 14.0, 12.0, 8.0, 9.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-17.0625, -16.55712890625, -16.0517578125, -15.54638671875, -15.041015625, -14.53564453125, -14.0302734375, -13.52490234375, -13.01953125, -12.51416015625, -12.0087890625, -11.50341796875, -10.998046875, -10.49267578125, -9.9873046875, -9.48193359375, -8.9765625, -8.47119140625, -7.9658203125, -7.46044921875, -6.955078125, -6.44970703125, -5.9443359375, -5.43896484375, -4.93359375, -4.42822265625, -3.9228515625, -3.41748046875, -2.912109375, -2.40673828125, -1.9013671875, -1.39599609375, -0.890625, -0.38525390625, 0.1201171875, 0.62548828125, 1.130859375, 1.63623046875, 2.1416015625, 2.64697265625, 3.15234375, 3.65771484375, 4.1630859375, 4.66845703125, 5.173828125, 5.67919921875, 6.1845703125, 6.68994140625, 7.1953125, 7.70068359375, 8.2060546875, 8.71142578125, 9.216796875, 9.72216796875, 10.2275390625, 10.73291015625, 11.23828125, 11.74365234375, 12.2490234375, 12.75439453125, 13.259765625, 13.76513671875, 14.2705078125, 14.77587890625, 15.28125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 2.0, 6.0, 5.0, 6.0, 15.0, 21.0, 18.0, 17.0, 31.0, 27.0, 43.0, 36.0, 43.0, 52.0, 34.0, 47.0, 82.0, 53.0, 65.0, 52.0, 57.0, 37.0, 34.0, 29.0, 30.0, 22.0, 20.0, 32.0, 16.0, 15.0, 15.0, 6.0, 10.0, 12.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.882720947265625, -2.78497314453125, -2.687225341796875, -2.5894775390625, -2.491729736328125, -2.39398193359375, -2.296234130859375, -2.198486328125, -2.100738525390625, -2.00299072265625, -1.905242919921875, -1.8074951171875, -1.709747314453125, -1.61199951171875, -1.514251708984375, -1.41650390625, -1.318756103515625, -1.22100830078125, -1.123260498046875, -1.0255126953125, -0.927764892578125, -0.83001708984375, -0.732269287109375, -0.634521484375, -0.536773681640625, -0.43902587890625, -0.341278076171875, -0.2435302734375, -0.145782470703125, -0.04803466796875, 0.049713134765625, 0.1474609375, 0.245208740234375, 0.34295654296875, 0.440704345703125, 0.5384521484375, 0.636199951171875, 0.73394775390625, 0.831695556640625, 0.929443359375, 1.027191162109375, 1.12493896484375, 1.222686767578125, 1.3204345703125, 1.418182373046875, 1.51593017578125, 1.613677978515625, 1.71142578125, 1.809173583984375, 1.90692138671875, 2.004669189453125, 2.1024169921875, 2.200164794921875, 2.29791259765625, 2.395660400390625, 2.493408203125, 2.591156005859375, 2.68890380859375, 2.786651611328125, 2.8843994140625, 2.982147216796875, 3.07989501953125, 3.177642822265625, 3.275390625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 16.0, 21.0, 30.0, 39.0, 66.0, 73.0, 94.0, 197.0, 338.0, 1029.0, 5150.0, 60832.0, 3448651.0, 652444.0, 21278.0, 2523.0, 644.0, 303.0, 152.0, 103.0, 85.0, 51.0, 40.0, 33.0, 29.0, 11.0, 14.0, 5.0, 7.0, 3.0, 4.0, 4.0, 5.0], "bins": [-68.375, -66.814208984375, -65.25341796875, -63.692626953125, -62.1318359375, -60.571044921875, -59.01025390625, -57.449462890625, -55.888671875, -54.327880859375, -52.76708984375, -51.206298828125, -49.6455078125, -48.084716796875, -46.52392578125, -44.963134765625, -43.40234375, -41.841552734375, -40.28076171875, -38.719970703125, -37.1591796875, -35.598388671875, -34.03759765625, -32.476806640625, -30.916015625, -29.355224609375, -27.79443359375, -26.233642578125, -24.6728515625, -23.112060546875, -21.55126953125, -19.990478515625, -18.4296875, -16.868896484375, -15.30810546875, -13.747314453125, -12.1865234375, -10.625732421875, -9.06494140625, -7.504150390625, -5.943359375, -4.382568359375, -2.82177734375, -1.260986328125, 0.2998046875, 1.860595703125, 3.42138671875, 4.982177734375, 6.54296875, 8.103759765625, 9.66455078125, 11.225341796875, 12.7861328125, 14.346923828125, 15.90771484375, 17.468505859375, 19.029296875, 20.590087890625, 22.15087890625, 23.711669921875, 25.2724609375, 26.833251953125, 28.39404296875, 29.954833984375, 31.515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 8.0, 17.0, 24.0, 47.0, 91.0, 164.0, 318.0, 748.0, 1413.0, 532.0, 313.0, 172.0, 85.0, 49.0, 33.0, 21.0, 10.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.13671875, -5.73760986328125, -5.3385009765625, -4.93939208984375, -4.540283203125, -4.14117431640625, -3.7420654296875, -3.34295654296875, -2.94384765625, -2.54473876953125, -2.1456298828125, -1.74652099609375, -1.347412109375, -0.94830322265625, -0.5491943359375, -0.15008544921875, 0.2490234375, 0.64813232421875, 1.0472412109375, 1.44635009765625, 1.845458984375, 2.24456787109375, 2.6436767578125, 3.04278564453125, 3.44189453125, 3.84100341796875, 4.2401123046875, 4.63922119140625, 5.038330078125, 5.43743896484375, 5.8365478515625, 6.23565673828125, 6.634765625, 7.03387451171875, 7.4329833984375, 7.83209228515625, 8.231201171875, 8.63031005859375, 9.0294189453125, 9.42852783203125, 9.82763671875, 10.22674560546875, 10.6258544921875, 11.02496337890625, 11.424072265625, 11.82318115234375, 12.2222900390625, 12.62139892578125, 13.0205078125, 13.41961669921875, 13.8187255859375, 14.21783447265625, 14.616943359375, 15.01605224609375, 15.4151611328125, 15.81427001953125, 16.21337890625, 16.61248779296875, 17.0115966796875, 17.41070556640625, 17.809814453125, 18.20892333984375, 18.6080322265625, 19.00714111328125, 19.40625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 15.0, 33.0, 65.0, 98.0, 140.0, 169.0, 154.0, 127.0, 96.0, 37.0, 24.0, 16.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.52430725097656, -116.35123443603516, -113.17815399169922, -110.00508117675781, -106.83200073242188, -103.65892791748047, -100.48585510253906, -97.31277465820312, -94.13970184326172, -90.96662902832031, -87.79354858398438, -84.62047576904297, -81.44740295410156, -78.27432250976562, -75.10124969482422, -71.92817687988281, -68.75509643554688, -65.58202362060547, -62.40894317626953, -59.235870361328125, -56.06279373168945, -52.88971710205078, -49.716644287109375, -46.5435676574707, -43.37049102783203, -40.19741439819336, -37.02433776855469, -33.85126495361328, -30.67818832397461, -27.505111694335938, -24.3320369720459, -21.15896224975586, -17.985885620117188, -14.812809944152832, -11.639734268188477, -8.466658592224121, -5.293582916259766, -2.12050724029541, 1.0525684356689453, 4.225643157958984, 7.398719787597656, 10.571795463562012, 13.744871139526367, 16.917945861816406, 20.091022491455078, 23.26409912109375, 26.43717384338379, 29.610248565673828, 32.7833251953125, 35.95640182495117, 39.129478454589844, 42.30255126953125, 45.47562789916992, 48.648704528808594, 51.82177734375, 54.99485397338867, 58.167930603027344, 61.341007232666016, 64.51408386230469, 67.6871566772461, 70.8602294921875, 74.03330993652344, 77.20638275146484, 80.37945556640625, 83.55253601074219]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 7.0, 13.0, 12.0, 11.0, 17.0, 27.0, 25.0, 37.0, 29.0, 40.0, 42.0, 31.0, 61.0, 54.0, 52.0, 46.0, 51.0, 50.0, 45.0, 41.0, 43.0, 38.0, 26.0, 36.0, 28.0, 20.0, 16.0, 13.0, 14.0, 16.0, 15.0, 10.0, 8.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.718284606933594, -33.530364990234375, -32.342445373535156, -31.15452766418457, -29.966609954833984, -28.778690338134766, -27.590770721435547, -26.402851104736328, -25.214933395385742, -24.027013778686523, -22.839096069335938, -21.65117645263672, -20.4632568359375, -19.275339126586914, -18.087419509887695, -16.89950180053711, -15.71158218383789, -14.523663520812988, -13.335744857788086, -12.147825241088867, -10.959906578063965, -9.771987915039062, -8.584068298339844, -7.396149635314941, -6.208230972290039, -5.020312309265137, -3.832393169403076, -2.6444742679595947, -1.4565553665161133, -0.26863670349121094, 0.9192824363708496, 2.10720157623291, 3.2951202392578125, 4.483038902282715, 5.670958042144775, 6.858877182006836, 8.046795845031738, 9.23471450805664, 10.42263412475586, 11.610552787780762, 12.798471450805664, 13.986390113830566, 15.174308776855469, 16.362228393554688, 17.550148010253906, 18.738065719604492, 19.92598533630371, 21.113903045654297, 22.301822662353516, 23.489742279052734, 24.67765998840332, 25.86557960510254, 27.053497314453125, 28.241416931152344, 29.429336547851562, 30.61725616455078, 31.805173873901367, 32.99309158325195, 34.18101119995117, 35.36893081665039, 36.55685043334961, 37.74476623535156, 38.93268585205078, 40.12060546875, 41.30852508544922]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 15.0, 10.0, 17.0, 20.0, 48.0, 48.0, 91.0, 138.0, 231.0, 373.0, 671.0, 1090.0, 2229.0, 4442.0, 9532.0, 21119.0, 47715.0, 105883.0, 222966.0, 308323.0, 174033.0, 81361.0, 36548.0, 16605.0, 7491.0, 3470.0, 1820.0, 925.0, 531.0, 312.0, 196.0, 102.0, 75.0, 41.0, 24.0, 23.0, 15.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.8203125, -15.345703125, -14.87109375, -14.396484375, -13.921875, -13.447265625, -12.97265625, -12.498046875, -12.0234375, -11.548828125, -11.07421875, -10.599609375, -10.125, -9.650390625, -9.17578125, -8.701171875, -8.2265625, -7.751953125, -7.27734375, -6.802734375, -6.328125, -5.853515625, -5.37890625, -4.904296875, -4.4296875, -3.955078125, -3.48046875, -3.005859375, -2.53125, -2.056640625, -1.58203125, -1.107421875, -0.6328125, -0.158203125, 0.31640625, 0.791015625, 1.265625, 1.740234375, 2.21484375, 2.689453125, 3.1640625, 3.638671875, 4.11328125, 4.587890625, 5.0625, 5.537109375, 6.01171875, 6.486328125, 6.9609375, 7.435546875, 7.91015625, 8.384765625, 8.859375, 9.333984375, 9.80859375, 10.283203125, 10.7578125, 11.232421875, 11.70703125, 12.181640625, 12.65625, 13.130859375, 13.60546875, 14.080078125, 14.5546875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 6.0, 17.0, 11.0, 23.0, 17.0, 27.0, 33.0, 19.0, 37.0, 30.0, 38.0, 46.0, 47.0, 49.0, 60.0, 61.0, 46.0, 43.0, 43.0, 40.0, 39.0, 33.0, 38.0, 25.0, 27.0, 14.0, 27.0, 18.0, 15.0, 13.0, 15.0, 6.0, 8.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.334197998046875, -2.24456787109375, -2.154937744140625, -2.0653076171875, -1.975677490234375, -1.88604736328125, -1.796417236328125, -1.706787109375, -1.617156982421875, -1.52752685546875, -1.437896728515625, -1.3482666015625, -1.258636474609375, -1.16900634765625, -1.079376220703125, -0.98974609375, -0.900115966796875, -0.81048583984375, -0.720855712890625, -0.6312255859375, -0.541595458984375, -0.45196533203125, -0.362335205078125, -0.272705078125, -0.183074951171875, -0.09344482421875, -0.003814697265625, 0.0858154296875, 0.175445556640625, 0.26507568359375, 0.354705810546875, 0.4443359375, 0.533966064453125, 0.62359619140625, 0.713226318359375, 0.8028564453125, 0.892486572265625, 0.98211669921875, 1.071746826171875, 1.161376953125, 1.251007080078125, 1.34063720703125, 1.430267333984375, 1.5198974609375, 1.609527587890625, 1.69915771484375, 1.788787841796875, 1.87841796875, 1.968048095703125, 2.05767822265625, 2.147308349609375, 2.2369384765625, 2.326568603515625, 2.41619873046875, 2.505828857421875, 2.595458984375, 2.685089111328125, 2.77471923828125, 2.864349365234375, 2.9539794921875, 3.043609619140625, 3.13323974609375, 3.222869873046875, 3.3125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 0.0, 8.0, 9.0, 9.0, 13.0, 20.0, 28.0, 27.0, 36.0, 44.0, 50.0, 79.0, 75.0, 115.0, 164.0, 164.0, 246.0, 366.0, 543.0, 833.0, 1383.0, 2520.0, 4933.0, 9875.0, 21844.0, 49167.0, 107570.0, 225417.0, 298251.0, 173958.0, 81041.0, 36286.0, 16369.0, 7588.0, 3840.0, 1982.0, 1159.0, 739.0, 505.0, 335.0, 253.0, 159.0, 122.0, 105.0, 79.0, 56.0, 50.0, 38.0, 27.0, 21.0, 14.0, 17.0, 8.0, 3.0, 4.0, 9.0, 4.0, 1.0, 4.0, 1.0], "bins": [-11.59375, -11.2349853515625, -10.876220703125, -10.5174560546875, -10.15869140625, -9.7999267578125, -9.441162109375, -9.0823974609375, -8.7236328125, -8.3648681640625, -8.006103515625, -7.6473388671875, -7.28857421875, -6.9298095703125, -6.571044921875, -6.2122802734375, -5.853515625, -5.4947509765625, -5.135986328125, -4.7772216796875, -4.41845703125, -4.0596923828125, -3.700927734375, -3.3421630859375, -2.9833984375, -2.6246337890625, -2.265869140625, -1.9071044921875, -1.54833984375, -1.1895751953125, -0.830810546875, -0.4720458984375, -0.11328125, 0.2454833984375, 0.604248046875, 0.9630126953125, 1.32177734375, 1.6805419921875, 2.039306640625, 2.3980712890625, 2.7568359375, 3.1156005859375, 3.474365234375, 3.8331298828125, 4.19189453125, 4.5506591796875, 4.909423828125, 5.2681884765625, 5.626953125, 5.9857177734375, 6.344482421875, 6.7032470703125, 7.06201171875, 7.4207763671875, 7.779541015625, 8.1383056640625, 8.4970703125, 8.8558349609375, 9.214599609375, 9.5733642578125, 9.93212890625, 10.2908935546875, 10.649658203125, 11.0084228515625, 11.3671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 8.0, 12.0, 7.0, 15.0, 11.0, 14.0, 17.0, 18.0, 19.0, 41.0, 34.0, 40.0, 37.0, 41.0, 57.0, 42.0, 54.0, 44.0, 59.0, 56.0, 44.0, 37.0, 54.0, 44.0, 37.0, 21.0, 32.0, 19.0, 16.0, 14.0, 17.0, 17.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.453125, -12.997802734375, -12.54248046875, -12.087158203125, -11.6318359375, -11.176513671875, -10.72119140625, -10.265869140625, -9.810546875, -9.355224609375, -8.89990234375, -8.444580078125, -7.9892578125, -7.533935546875, -7.07861328125, -6.623291015625, -6.16796875, -5.712646484375, -5.25732421875, -4.802001953125, -4.3466796875, -3.891357421875, -3.43603515625, -2.980712890625, -2.525390625, -2.070068359375, -1.61474609375, -1.159423828125, -0.7041015625, -0.248779296875, 0.20654296875, 0.661865234375, 1.1171875, 1.572509765625, 2.02783203125, 2.483154296875, 2.9384765625, 3.393798828125, 3.84912109375, 4.304443359375, 4.759765625, 5.215087890625, 5.67041015625, 6.125732421875, 6.5810546875, 7.036376953125, 7.49169921875, 7.947021484375, 8.40234375, 8.857666015625, 9.31298828125, 9.768310546875, 10.2236328125, 10.678955078125, 11.13427734375, 11.589599609375, 12.044921875, 12.500244140625, 12.95556640625, 13.410888671875, 13.8662109375, 14.321533203125, 14.77685546875, 15.232177734375, 15.6875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 8.0, 12.0, 13.0, 20.0, 34.0, 45.0, 67.0, 130.0, 234.0, 353.0, 689.0, 1337.0, 3090.0, 7960.0, 24572.0, 95402.0, 383326.0, 392536.0, 99049.0, 25246.0, 8244.0, 3180.0, 1357.0, 693.0, 379.0, 209.0, 134.0, 81.0, 50.0, 33.0, 18.0, 13.0, 12.0, 7.0, 8.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.3046875, -9.9827880859375, -9.660888671875, -9.3389892578125, -9.01708984375, -8.6951904296875, -8.373291015625, -8.0513916015625, -7.7294921875, -7.4075927734375, -7.085693359375, -6.7637939453125, -6.44189453125, -6.1199951171875, -5.798095703125, -5.4761962890625, -5.154296875, -4.8323974609375, -4.510498046875, -4.1885986328125, -3.86669921875, -3.5447998046875, -3.222900390625, -2.9010009765625, -2.5791015625, -2.2572021484375, -1.935302734375, -1.6134033203125, -1.29150390625, -0.9696044921875, -0.647705078125, -0.3258056640625, -0.00390625, 0.3179931640625, 0.639892578125, 0.9617919921875, 1.28369140625, 1.6055908203125, 1.927490234375, 2.2493896484375, 2.5712890625, 2.8931884765625, 3.215087890625, 3.5369873046875, 3.85888671875, 4.1807861328125, 4.502685546875, 4.8245849609375, 5.146484375, 5.4683837890625, 5.790283203125, 6.1121826171875, 6.43408203125, 6.7559814453125, 7.077880859375, 7.3997802734375, 7.7216796875, 8.0435791015625, 8.365478515625, 8.6873779296875, 9.00927734375, 9.3311767578125, 9.653076171875, 9.9749755859375, 10.296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 5.0, 3.0, 2.0, 6.0, 2.0, 6.0, 10.0, 16.0, 9.0, 23.0, 24.0, 28.0, 41.0, 28.0, 62.0, 57.0, 95.0, 125.0, 98.0, 73.0, 52.0, 45.0, 40.0, 21.0, 25.0, 21.0, 15.0, 13.0, 12.0, 11.0, 9.0, 3.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0014162063598632812, -0.0013765394687652588, -0.0013368725776672363, -0.0012972056865692139, -0.0012575387954711914, -0.001217871904373169, -0.0011782050132751465, -0.001138538122177124, -0.0010988712310791016, -0.001059204339981079, -0.0010195374488830566, -0.0009798705577850342, -0.0009402036666870117, -0.0009005367755889893, -0.0008608698844909668, -0.0008212029933929443, -0.0007815361022949219, -0.0007418692111968994, -0.000702202320098877, -0.0006625354290008545, -0.000622868537902832, -0.0005832016468048096, -0.0005435347557067871, -0.0005038678646087646, -0.0004642009735107422, -0.0004245340824127197, -0.00038486719131469727, -0.0003452003002166748, -0.00030553340911865234, -0.0002658665180206299, -0.00022619962692260742, -0.00018653273582458496, -0.0001468658447265625, -0.00010719895362854004, -6.753206253051758e-05, -2.7865171432495117e-05, 1.1801719665527344e-05, 5.1468610763549805e-05, 9.113550186157227e-05, 0.00013080239295959473, 0.0001704692840576172, 0.00021013617515563965, 0.0002498030662536621, 0.00028946995735168457, 0.00032913684844970703, 0.0003688037395477295, 0.00040847063064575195, 0.0004481375217437744, 0.0004878044128417969, 0.0005274713039398193, 0.0005671381950378418, 0.0006068050861358643, 0.0006464719772338867, 0.0006861388683319092, 0.0007258057594299316, 0.0007654726505279541, 0.0008051395416259766, 0.000844806432723999, 0.0008844733238220215, 0.0009241402149200439, 0.0009638071060180664, 0.0010034739971160889, 0.0010431408882141113, 0.0010828077793121338, 0.0011224746704101562]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 1.0, 5.0, 5.0, 11.0, 16.0, 19.0, 26.0, 43.0, 93.0, 161.0, 321.0, 596.0, 1213.0, 2848.0, 8064.0, 28335.0, 133456.0, 528648.0, 270948.0, 52673.0, 13345.0, 4230.0, 1784.0, 803.0, 353.0, 215.0, 122.0, 66.0, 51.0, 31.0, 17.0, 19.0, 14.0, 8.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5, -13.111083984375, -12.72216796875, -12.333251953125, -11.9443359375, -11.555419921875, -11.16650390625, -10.777587890625, -10.388671875, -9.999755859375, -9.61083984375, -9.221923828125, -8.8330078125, -8.444091796875, -8.05517578125, -7.666259765625, -7.27734375, -6.888427734375, -6.49951171875, -6.110595703125, -5.7216796875, -5.332763671875, -4.94384765625, -4.554931640625, -4.166015625, -3.777099609375, -3.38818359375, -2.999267578125, -2.6103515625, -2.221435546875, -1.83251953125, -1.443603515625, -1.0546875, -0.665771484375, -0.27685546875, 0.112060546875, 0.5009765625, 0.889892578125, 1.27880859375, 1.667724609375, 2.056640625, 2.445556640625, 2.83447265625, 3.223388671875, 3.6123046875, 4.001220703125, 4.39013671875, 4.779052734375, 5.16796875, 5.556884765625, 5.94580078125, 6.334716796875, 6.7236328125, 7.112548828125, 7.50146484375, 7.890380859375, 8.279296875, 8.668212890625, 9.05712890625, 9.446044921875, 9.8349609375, 10.223876953125, 10.61279296875, 11.001708984375, 11.390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 9.0, 14.0, 21.0, 19.0, 31.0, 35.0, 40.0, 58.0, 71.0, 88.0, 79.0, 96.0, 79.0, 75.0, 54.0, 52.0, 41.0, 29.0, 29.0, 12.0, 11.0, 4.0, 9.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.26953125, -7.0362548828125, -6.802978515625, -6.5697021484375, -6.33642578125, -6.1031494140625, -5.869873046875, -5.6365966796875, -5.4033203125, -5.1700439453125, -4.936767578125, -4.7034912109375, -4.47021484375, -4.2369384765625, -4.003662109375, -3.7703857421875, -3.537109375, -3.3038330078125, -3.070556640625, -2.8372802734375, -2.60400390625, -2.3707275390625, -2.137451171875, -1.9041748046875, -1.6708984375, -1.4376220703125, -1.204345703125, -0.9710693359375, -0.73779296875, -0.5045166015625, -0.271240234375, -0.0379638671875, 0.1953125, 0.4285888671875, 0.661865234375, 0.8951416015625, 1.12841796875, 1.3616943359375, 1.594970703125, 1.8282470703125, 2.0615234375, 2.2947998046875, 2.528076171875, 2.7613525390625, 2.99462890625, 3.2279052734375, 3.461181640625, 3.6944580078125, 3.927734375, 4.1610107421875, 4.394287109375, 4.6275634765625, 4.86083984375, 5.0941162109375, 5.327392578125, 5.5606689453125, 5.7939453125, 6.0272216796875, 6.260498046875, 6.4937744140625, 6.72705078125, 6.9603271484375, 7.193603515625, 7.4268798828125, 7.66015625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 13.0, 11.0, 16.0, 31.0, 67.0, 104.0, 145.0, 162.0, 170.0, 133.0, 76.0, 36.0, 16.0, 11.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.40904235839844, -167.1335906982422, -161.85813903808594, -156.5826873779297, -151.3072509765625, -146.03179931640625, -140.75634765625, -135.48089599609375, -130.2054443359375, -124.92999267578125, -119.654541015625, -114.37909698486328, -109.10364532470703, -103.82819366455078, -98.55274963378906, -93.27729797363281, -88.00184631347656, -82.72639465332031, -77.45094299316406, -72.17549896240234, -66.9000473022461, -61.624595642089844, -56.34914779663086, -51.073699951171875, -45.798248291015625, -40.522796630859375, -35.24734878540039, -29.971899032592773, -24.696449279785156, -19.42099952697754, -14.145549774169922, -8.870101928710938, -3.59466552734375, 1.6807842254638672, 6.956233978271484, 12.231683731079102, 17.50713348388672, 22.782583236694336, 28.058032989501953, 33.33348083496094, 38.60893249511719, 43.88438415527344, 49.15983200073242, 54.435279846191406, 59.710731506347656, 64.9861831665039, 70.26162719726562, 75.53707885742188, 80.81253051757812, 86.08798217773438, 91.36343383789062, 96.63887786865234, 101.9143295288086, 107.18978118896484, 112.46522521972656, 117.74067687988281, 123.01612854003906, 128.2915802001953, 133.56703186035156, 138.8424835205078, 144.117919921875, 149.39337158203125, 154.6688232421875, 159.94427490234375, 165.2197265625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 5.0, 10.0, 10.0, 7.0, 12.0, 8.0, 9.0, 19.0, 12.0, 18.0, 19.0, 19.0, 20.0, 26.0, 37.0, 39.0, 42.0, 29.0, 30.0, 35.0, 29.0, 38.0, 42.0, 40.0, 45.0, 38.0, 41.0, 36.0, 27.0, 28.0, 32.0, 21.0, 22.0, 20.0, 28.0, 21.0, 9.0, 17.0, 13.0, 9.0, 12.0, 6.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.08466339111328, -63.961360931396484, -61.83805847167969, -59.714759826660156, -57.59145736694336, -55.46815490722656, -53.34485626220703, -51.221553802490234, -49.09825134277344, -46.97494888305664, -44.851646423339844, -42.72834777832031, -40.605045318603516, -38.48174285888672, -36.35844421386719, -34.23514175415039, -32.111839294433594, -29.988536834716797, -27.865236282348633, -25.74193572998047, -23.618633270263672, -21.495330810546875, -19.37203025817871, -17.248729705810547, -15.12542724609375, -13.00212574005127, -10.878824234008789, -8.755522727966309, -6.632221221923828, -4.508919715881348, -2.385618209838867, -0.2623167037963867, 1.8609771728515625, 3.984278678894043, 6.107580184936523, 8.230881690979004, 10.354183197021484, 12.477484703063965, 14.600786209106445, 16.72408676147461, 18.847389221191406, 20.970691680908203, 23.093992233276367, 25.21729278564453, 27.340595245361328, 29.463897705078125, 31.58719825744629, 33.71049880981445, 35.83380126953125, 37.95710372924805, 40.080406188964844, 42.203704833984375, 44.32700729370117, 46.45030975341797, 48.5736083984375, 50.6969108581543, 52.820213317871094, 54.94351577758789, 57.06681823730469, 59.19011688232422, 61.313419342041016, 63.43672180175781, 65.56002044677734, 67.6833267211914, 69.80662536621094]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 2.0, 5.0, 7.0, 12.0, 14.0, 10.0, 28.0, 27.0, 39.0, 58.0, 96.0, 141.0, 206.0, 298.0, 451.0, 772.0, 1292.0, 2377.0, 4293.0, 8631.0, 17320.0, 41603.0, 128170.0, 1082907.0, 2659429.0, 157327.0, 47718.0, 20063.0, 9325.0, 4873.0, 2670.0, 1498.0, 933.0, 571.0, 360.0, 243.0, 163.0, 114.0, 75.0, 44.0, 37.0, 25.0, 18.0, 12.0, 12.0, 2.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-16.46875, -15.9708251953125, -15.472900390625, -14.9749755859375, -14.47705078125, -13.9791259765625, -13.481201171875, -12.9832763671875, -12.4853515625, -11.9874267578125, -11.489501953125, -10.9915771484375, -10.49365234375, -9.9957275390625, -9.497802734375, -8.9998779296875, -8.501953125, -8.0040283203125, -7.506103515625, -7.0081787109375, -6.51025390625, -6.0123291015625, -5.514404296875, -5.0164794921875, -4.5185546875, -4.0206298828125, -3.522705078125, -3.0247802734375, -2.52685546875, -2.0289306640625, -1.531005859375, -1.0330810546875, -0.53515625, -0.0372314453125, 0.460693359375, 0.9586181640625, 1.45654296875, 1.9544677734375, 2.452392578125, 2.9503173828125, 3.4482421875, 3.9461669921875, 4.444091796875, 4.9420166015625, 5.43994140625, 5.9378662109375, 6.435791015625, 6.9337158203125, 7.431640625, 7.9295654296875, 8.427490234375, 8.9254150390625, 9.42333984375, 9.9212646484375, 10.419189453125, 10.9171142578125, 11.4150390625, 11.9129638671875, 12.410888671875, 12.9088134765625, 13.40673828125, 13.9046630859375, 14.402587890625, 14.9005126953125, 15.3984375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 2.0, 6.0, 4.0, 11.0, 10.0, 15.0, 17.0, 20.0, 17.0, 23.0, 25.0, 24.0, 41.0, 27.0, 52.0, 32.0, 61.0, 41.0, 33.0, 51.0, 51.0, 44.0, 39.0, 29.0, 39.0, 40.0, 34.0, 33.0, 16.0, 28.0, 16.0, 27.0, 11.0, 14.0, 13.0, 11.0, 9.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.455078125, -2.3699951171875, -2.284912109375, -2.1998291015625, -2.11474609375, -2.0296630859375, -1.944580078125, -1.8594970703125, -1.7744140625, -1.6893310546875, -1.604248046875, -1.5191650390625, -1.43408203125, -1.3489990234375, -1.263916015625, -1.1788330078125, -1.09375, -1.0086669921875, -0.923583984375, -0.8385009765625, -0.75341796875, -0.6683349609375, -0.583251953125, -0.4981689453125, -0.4130859375, -0.3280029296875, -0.242919921875, -0.1578369140625, -0.07275390625, 0.0123291015625, 0.097412109375, 0.1824951171875, 0.267578125, 0.3526611328125, 0.437744140625, 0.5228271484375, 0.60791015625, 0.6929931640625, 0.778076171875, 0.8631591796875, 0.9482421875, 1.0333251953125, 1.118408203125, 1.2034912109375, 1.28857421875, 1.3736572265625, 1.458740234375, 1.5438232421875, 1.62890625, 1.7139892578125, 1.799072265625, 1.8841552734375, 1.96923828125, 2.0543212890625, 2.139404296875, 2.2244873046875, 2.3095703125, 2.3946533203125, 2.479736328125, 2.5648193359375, 2.64990234375, 2.7349853515625, 2.820068359375, 2.9051513671875, 2.990234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 12.0, 13.0, 30.0, 16.0, 28.0, 28.0, 34.0, 57.0, 67.0, 72.0, 82.0, 132.0, 272.0, 899.0, 3622.0, 22771.0, 278620.0, 3700009.0, 167118.0, 16214.0, 2712.0, 657.0, 237.0, 120.0, 82.0, 71.0, 56.0, 39.0, 35.0, 35.0, 22.0, 36.0, 14.0, 19.0, 10.0, 7.0, 9.0, 3.0, 2.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -34.1279296875, -33.005859375, -31.8837890625, -30.76171875, -29.6396484375, -28.517578125, -27.3955078125, -26.2734375, -25.1513671875, -24.029296875, -22.9072265625, -21.78515625, -20.6630859375, -19.541015625, -18.4189453125, -17.296875, -16.1748046875, -15.052734375, -13.9306640625, -12.80859375, -11.6865234375, -10.564453125, -9.4423828125, -8.3203125, -7.1982421875, -6.076171875, -4.9541015625, -3.83203125, -2.7099609375, -1.587890625, -0.4658203125, 0.65625, 1.7783203125, 2.900390625, 4.0224609375, 5.14453125, 6.2666015625, 7.388671875, 8.5107421875, 9.6328125, 10.7548828125, 11.876953125, 12.9990234375, 14.12109375, 15.2431640625, 16.365234375, 17.4873046875, 18.609375, 19.7314453125, 20.853515625, 21.9755859375, 23.09765625, 24.2197265625, 25.341796875, 26.4638671875, 27.5859375, 28.7080078125, 29.830078125, 30.9521484375, 32.07421875, 33.1962890625, 34.318359375, 35.4404296875, 36.5625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 17.0, 12.0, 31.0, 82.0, 144.0, 420.0, 1957.0, 923.0, 263.0, 112.0, 53.0, 31.0, 17.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.984375, -16.522705078125, -16.06103515625, -15.599365234375, -15.1376953125, -14.676025390625, -14.21435546875, -13.752685546875, -13.291015625, -12.829345703125, -12.36767578125, -11.906005859375, -11.4443359375, -10.982666015625, -10.52099609375, -10.059326171875, -9.59765625, -9.135986328125, -8.67431640625, -8.212646484375, -7.7509765625, -7.289306640625, -6.82763671875, -6.365966796875, -5.904296875, -5.442626953125, -4.98095703125, -4.519287109375, -4.0576171875, -3.595947265625, -3.13427734375, -2.672607421875, -2.2109375, -1.749267578125, -1.28759765625, -0.825927734375, -0.3642578125, 0.097412109375, 0.55908203125, 1.020751953125, 1.482421875, 1.944091796875, 2.40576171875, 2.867431640625, 3.3291015625, 3.790771484375, 4.25244140625, 4.714111328125, 5.17578125, 5.637451171875, 6.09912109375, 6.560791015625, 7.0224609375, 7.484130859375, 7.94580078125, 8.407470703125, 8.869140625, 9.330810546875, 9.79248046875, 10.254150390625, 10.7158203125, 11.177490234375, 11.63916015625, 12.100830078125, 12.5625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 13.0, 13.0, 12.0, 26.0, 52.0, 59.0, 98.0, 140.0, 147.0, 122.0, 117.0, 73.0, 49.0, 29.0, 23.0, 12.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-74.19105529785156, -72.3633041381836, -70.53555297851562, -68.70780181884766, -66.88005065917969, -65.05229187011719, -63.22454071044922, -61.39678955078125, -59.56903839111328, -57.74128723144531, -55.913536071777344, -54.08578109741211, -52.25802993774414, -50.43027877807617, -48.60252380371094, -46.77477264404297, -44.947021484375, -43.11927032470703, -41.29151916503906, -39.46376419067383, -37.63601303100586, -35.80826187133789, -33.980506896972656, -32.15275573730469, -30.32500457763672, -28.49725341796875, -26.66950035095215, -24.841747283935547, -23.013996124267578, -21.18624496459961, -19.358491897583008, -17.530738830566406, -15.702987670898438, -13.875235557556152, -12.047483444213867, -10.219731330871582, -8.391979217529297, -6.564227104187012, -4.736474990844727, -2.9087228775024414, -1.0809707641601562, 0.7467813491821289, 2.574533462524414, 4.402285575866699, 6.230037689208984, 8.05778980255127, 9.885541915893555, 11.71329402923584, 13.541046142578125, 15.36879825592041, 17.196550369262695, 19.024303436279297, 20.852054595947266, 22.679805755615234, 24.507558822631836, 26.335311889648438, 28.163063049316406, 29.990814208984375, 31.818567276000977, 33.64632034301758, 35.47407150268555, 37.301822662353516, 39.12957763671875, 40.95732879638672, 42.78507995605469]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 6.0, 15.0, 5.0, 14.0, 14.0, 12.0, 19.0, 14.0, 22.0, 25.0, 21.0, 33.0, 34.0, 32.0, 30.0, 29.0, 41.0, 30.0, 30.0, 35.0, 38.0, 41.0, 27.0, 52.0, 37.0, 36.0, 37.0, 22.0, 24.0, 25.0, 19.0, 25.0, 10.0, 19.0, 13.0, 12.0, 16.0, 11.0, 14.0, 8.0, 9.0, 10.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-20.922992706298828, -20.303266525268555, -19.683542251586914, -19.06381607055664, -18.444091796875, -17.824365615844727, -17.204641342163086, -16.584915161132812, -15.965190887451172, -15.345465660095215, -14.725740432739258, -14.1060152053833, -13.486289978027344, -12.866564750671387, -12.24683952331543, -11.627113342285156, -11.0073881149292, -10.387662887573242, -9.767937660217285, -9.148212432861328, -8.528487205505371, -7.908761978149414, -7.289036273956299, -6.669311046600342, -6.049585819244385, -5.429860591888428, -4.810135364532471, -4.1904096603393555, -3.5706846714019775, -2.9509594440460205, -2.3312339782714844, -1.7115087509155273, -1.0917835235595703, -0.4720582365989685, 0.1476670503616333, 0.7673923969268799, 1.387117624282837, 2.006842851638794, 2.62656831741333, 3.246293544769287, 3.866018772125244, 4.485743999481201, 5.105469226837158, 5.725194931030273, 6.3449201583862305, 6.9646453857421875, 7.5843706130981445, 8.204095840454102, 8.823821067810059, 9.443546295166016, 10.063271522521973, 10.68299674987793, 11.302721977233887, 11.922447204589844, 12.542173385620117, 13.161897659301758, 13.781623840332031, 14.401349067687988, 15.021074295043945, 15.640799522399902, 16.26052474975586, 16.880250930786133, 17.499975204467773, 18.119701385498047, 18.739425659179688]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 8.0, 7.0, 7.0, 11.0, 14.0, 10.0, 17.0, 29.0, 49.0, 52.0, 74.0, 124.0, 182.0, 286.0, 433.0, 613.0, 1004.0, 1570.0, 2702.0, 4802.0, 8567.0, 15385.0, 29035.0, 55184.0, 105526.0, 194999.0, 263603.0, 169983.0, 90984.0, 47380.0, 24866.0, 13229.0, 7357.0, 4101.0, 2465.0, 1400.0, 837.0, 534.0, 332.0, 266.0, 156.0, 109.0, 66.0, 56.0, 37.0, 28.0, 28.0, 12.0, 10.0, 14.0, 8.0, 2.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-11.390625, -10.9892578125, -10.587890625, -10.1865234375, -9.78515625, -9.3837890625, -8.982421875, -8.5810546875, -8.1796875, -7.7783203125, -7.376953125, -6.9755859375, -6.57421875, -6.1728515625, -5.771484375, -5.3701171875, -4.96875, -4.5673828125, -4.166015625, -3.7646484375, -3.36328125, -2.9619140625, -2.560546875, -2.1591796875, -1.7578125, -1.3564453125, -0.955078125, -0.5537109375, -0.15234375, 0.2490234375, 0.650390625, 1.0517578125, 1.453125, 1.8544921875, 2.255859375, 2.6572265625, 3.05859375, 3.4599609375, 3.861328125, 4.2626953125, 4.6640625, 5.0654296875, 5.466796875, 5.8681640625, 6.26953125, 6.6708984375, 7.072265625, 7.4736328125, 7.875, 8.2763671875, 8.677734375, 9.0791015625, 9.48046875, 9.8818359375, 10.283203125, 10.6845703125, 11.0859375, 11.4873046875, 11.888671875, 12.2900390625, 12.69140625, 13.0927734375, 13.494140625, 13.8955078125, 14.296875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 4.0, 2.0, 5.0, 11.0, 8.0, 13.0, 18.0, 21.0, 18.0, 16.0, 19.0, 21.0, 35.0, 27.0, 38.0, 51.0, 45.0, 41.0, 47.0, 63.0, 39.0, 39.0, 48.0, 39.0, 41.0, 33.0, 37.0, 30.0, 23.0, 21.0, 23.0, 14.0, 19.0, 13.0, 19.0, 14.0, 13.0, 8.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.330078125, -2.245452880859375, -2.16082763671875, -2.076202392578125, -1.9915771484375, -1.906951904296875, -1.82232666015625, -1.737701416015625, -1.653076171875, -1.568450927734375, -1.48382568359375, -1.399200439453125, -1.3145751953125, -1.229949951171875, -1.14532470703125, -1.060699462890625, -0.97607421875, -0.891448974609375, -0.80682373046875, -0.722198486328125, -0.6375732421875, -0.552947998046875, -0.46832275390625, -0.383697509765625, -0.299072265625, -0.214447021484375, -0.12982177734375, -0.045196533203125, 0.0394287109375, 0.124053955078125, 0.20867919921875, 0.293304443359375, 0.3779296875, 0.462554931640625, 0.54718017578125, 0.631805419921875, 0.7164306640625, 0.801055908203125, 0.88568115234375, 0.970306396484375, 1.054931640625, 1.139556884765625, 1.22418212890625, 1.308807373046875, 1.3934326171875, 1.478057861328125, 1.56268310546875, 1.647308349609375, 1.73193359375, 1.816558837890625, 1.90118408203125, 1.985809326171875, 2.0704345703125, 2.155059814453125, 2.23968505859375, 2.324310302734375, 2.408935546875, 2.493560791015625, 2.57818603515625, 2.662811279296875, 2.7474365234375, 2.832061767578125, 2.91668701171875, 3.001312255859375, 3.0859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 2.0, 8.0, 6.0, 10.0, 12.0, 18.0, 31.0, 31.0, 42.0, 53.0, 67.0, 92.0, 120.0, 159.0, 239.0, 308.0, 405.0, 650.0, 1153.0, 2378.0, 6360.0, 19346.0, 67781.0, 228191.0, 438523.0, 196951.0, 58092.0, 16723.0, 5441.0, 2190.0, 1083.0, 617.0, 374.0, 272.0, 206.0, 161.0, 99.0, 80.0, 60.0, 50.0, 34.0, 32.0, 28.0, 18.0, 21.0, 14.0, 4.0, 5.0, 7.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-17.65625, -17.128173828125, -16.60009765625, -16.072021484375, -15.5439453125, -15.015869140625, -14.48779296875, -13.959716796875, -13.431640625, -12.903564453125, -12.37548828125, -11.847412109375, -11.3193359375, -10.791259765625, -10.26318359375, -9.735107421875, -9.20703125, -8.678955078125, -8.15087890625, -7.622802734375, -7.0947265625, -6.566650390625, -6.03857421875, -5.510498046875, -4.982421875, -4.454345703125, -3.92626953125, -3.398193359375, -2.8701171875, -2.342041015625, -1.81396484375, -1.285888671875, -0.7578125, -0.229736328125, 0.29833984375, 0.826416015625, 1.3544921875, 1.882568359375, 2.41064453125, 2.938720703125, 3.466796875, 3.994873046875, 4.52294921875, 5.051025390625, 5.5791015625, 6.107177734375, 6.63525390625, 7.163330078125, 7.69140625, 8.219482421875, 8.74755859375, 9.275634765625, 9.8037109375, 10.331787109375, 10.85986328125, 11.387939453125, 11.916015625, 12.444091796875, 12.97216796875, 13.500244140625, 14.0283203125, 14.556396484375, 15.08447265625, 15.612548828125, 16.140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 4.0, 13.0, 8.0, 8.0, 13.0, 15.0, 23.0, 13.0, 21.0, 28.0, 27.0, 31.0, 34.0, 38.0, 50.0, 35.0, 41.0, 49.0, 42.0, 53.0, 29.0, 37.0, 35.0, 38.0, 29.0, 31.0, 29.0, 32.0, 32.0, 22.0, 17.0, 21.0, 14.0, 11.0, 16.0, 10.0, 13.0, 10.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.46875, -11.112060546875, -10.75537109375, -10.398681640625, -10.0419921875, -9.685302734375, -9.32861328125, -8.971923828125, -8.615234375, -8.258544921875, -7.90185546875, -7.545166015625, -7.1884765625, -6.831787109375, -6.47509765625, -6.118408203125, -5.76171875, -5.405029296875, -5.04833984375, -4.691650390625, -4.3349609375, -3.978271484375, -3.62158203125, -3.264892578125, -2.908203125, -2.551513671875, -2.19482421875, -1.838134765625, -1.4814453125, -1.124755859375, -0.76806640625, -0.411376953125, -0.0546875, 0.302001953125, 0.65869140625, 1.015380859375, 1.3720703125, 1.728759765625, 2.08544921875, 2.442138671875, 2.798828125, 3.155517578125, 3.51220703125, 3.868896484375, 4.2255859375, 4.582275390625, 4.93896484375, 5.295654296875, 5.65234375, 6.009033203125, 6.36572265625, 6.722412109375, 7.0791015625, 7.435791015625, 7.79248046875, 8.149169921875, 8.505859375, 8.862548828125, 9.21923828125, 9.575927734375, 9.9326171875, 10.289306640625, 10.64599609375, 11.002685546875, 11.359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 11.0, 10.0, 11.0, 21.0, 24.0, 40.0, 77.0, 173.0, 394.0, 923.0, 2867.0, 10872.0, 63201.0, 521826.0, 389739.0, 45804.0, 8828.0, 2285.0, 809.0, 288.0, 125.0, 78.0, 42.0, 32.0, 19.0, 12.0, 4.0, 10.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5546875, -14.0682373046875, -13.581787109375, -13.0953369140625, -12.60888671875, -12.1224365234375, -11.635986328125, -11.1495361328125, -10.6630859375, -10.1766357421875, -9.690185546875, -9.2037353515625, -8.71728515625, -8.2308349609375, -7.744384765625, -7.2579345703125, -6.771484375, -6.2850341796875, -5.798583984375, -5.3121337890625, -4.82568359375, -4.3392333984375, -3.852783203125, -3.3663330078125, -2.8798828125, -2.3934326171875, -1.906982421875, -1.4205322265625, -0.93408203125, -0.4476318359375, 0.038818359375, 0.5252685546875, 1.01171875, 1.4981689453125, 1.984619140625, 2.4710693359375, 2.95751953125, 3.4439697265625, 3.930419921875, 4.4168701171875, 4.9033203125, 5.3897705078125, 5.876220703125, 6.3626708984375, 6.84912109375, 7.3355712890625, 7.822021484375, 8.3084716796875, 8.794921875, 9.2813720703125, 9.767822265625, 10.2542724609375, 10.74072265625, 11.2271728515625, 11.713623046875, 12.2000732421875, 12.6865234375, 13.1729736328125, 13.659423828125, 14.1458740234375, 14.63232421875, 15.1187744140625, 15.605224609375, 16.0916748046875, 16.578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 8.0, 16.0, 15.0, 21.0, 25.0, 34.0, 39.0, 39.0, 59.0, 83.0, 131.0, 147.0, 91.0, 51.0, 47.0, 36.0, 24.0, 25.0, 15.0, 18.0, 16.0, 12.0, 9.0, 8.0, 4.0, 9.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014314651489257812, -0.001386880874633789, -0.0013422966003417969, -0.0012977123260498047, -0.0012531280517578125, -0.0012085437774658203, -0.0011639595031738281, -0.001119375228881836, -0.0010747909545898438, -0.0010302066802978516, -0.0009856224060058594, -0.0009410381317138672, -0.000896453857421875, -0.0008518695831298828, -0.0008072853088378906, -0.0007627010345458984, -0.0007181167602539062, -0.0006735324859619141, -0.0006289482116699219, -0.0005843639373779297, -0.0005397796630859375, -0.0004951953887939453, -0.0004506111145019531, -0.00040602684020996094, -0.00036144256591796875, -0.00031685829162597656, -0.0002722740173339844, -0.0002276897430419922, -0.00018310546875, -0.0001385211944580078, -9.393692016601562e-05, -4.935264587402344e-05, -4.76837158203125e-06, 3.981590270996094e-05, 8.440017700195312e-05, 0.0001289844512939453, 0.0001735687255859375, 0.0002181529998779297, 0.0002627372741699219, 0.00030732154846191406, 0.00035190582275390625, 0.00039649009704589844, 0.0004410743713378906, 0.0004856586456298828, 0.000530242919921875, 0.0005748271942138672, 0.0006194114685058594, 0.0006639957427978516, 0.0007085800170898438, 0.0007531642913818359, 0.0007977485656738281, 0.0008423328399658203, 0.0008869171142578125, 0.0009315013885498047, 0.0009760856628417969, 0.001020669937133789, 0.0010652542114257812, 0.0011098384857177734, 0.0011544227600097656, 0.0011990070343017578, 0.00124359130859375, 0.0012881755828857422, 0.0013327598571777344, 0.0013773441314697266, 0.0014219284057617188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 3.0, 5.0, 3.0, 8.0, 10.0, 7.0, 10.0, 21.0, 19.0, 31.0, 46.0, 93.0, 126.0, 224.0, 427.0, 829.0, 1781.0, 4803.0, 19727.0, 168037.0, 721096.0, 109259.0, 14749.0, 4035.0, 1613.0, 692.0, 377.0, 188.0, 122.0, 74.0, 34.0, 32.0, 15.0, 18.0, 14.0, 8.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.46875, -17.916015625, -17.36328125, -16.810546875, -16.2578125, -15.705078125, -15.15234375, -14.599609375, -14.046875, -13.494140625, -12.94140625, -12.388671875, -11.8359375, -11.283203125, -10.73046875, -10.177734375, -9.625, -9.072265625, -8.51953125, -7.966796875, -7.4140625, -6.861328125, -6.30859375, -5.755859375, -5.203125, -4.650390625, -4.09765625, -3.544921875, -2.9921875, -2.439453125, -1.88671875, -1.333984375, -0.78125, -0.228515625, 0.32421875, 0.876953125, 1.4296875, 1.982421875, 2.53515625, 3.087890625, 3.640625, 4.193359375, 4.74609375, 5.298828125, 5.8515625, 6.404296875, 6.95703125, 7.509765625, 8.0625, 8.615234375, 9.16796875, 9.720703125, 10.2734375, 10.826171875, 11.37890625, 11.931640625, 12.484375, 13.037109375, 13.58984375, 14.142578125, 14.6953125, 15.248046875, 15.80078125, 16.353515625, 16.90625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 6.0, 3.0, 14.0, 15.0, 21.0, 33.0, 47.0, 54.0, 83.0, 118.0, 107.0, 112.0, 98.0, 63.0, 51.0, 55.0, 27.0, 22.0, 13.0, 7.0, 10.0, 4.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.609375, -7.3284912109375, -7.047607421875, -6.7667236328125, -6.48583984375, -6.2049560546875, -5.924072265625, -5.6431884765625, -5.3623046875, -5.0814208984375, -4.800537109375, -4.5196533203125, -4.23876953125, -3.9578857421875, -3.677001953125, -3.3961181640625, -3.115234375, -2.8343505859375, -2.553466796875, -2.2725830078125, -1.99169921875, -1.7108154296875, -1.429931640625, -1.1490478515625, -0.8681640625, -0.5872802734375, -0.306396484375, -0.0255126953125, 0.25537109375, 0.5362548828125, 0.817138671875, 1.0980224609375, 1.37890625, 1.6597900390625, 1.940673828125, 2.2215576171875, 2.50244140625, 2.7833251953125, 3.064208984375, 3.3450927734375, 3.6259765625, 3.9068603515625, 4.187744140625, 4.4686279296875, 4.74951171875, 5.0303955078125, 5.311279296875, 5.5921630859375, 5.873046875, 6.1539306640625, 6.434814453125, 6.7156982421875, 6.99658203125, 7.2774658203125, 7.558349609375, 7.8392333984375, 8.1201171875, 8.4010009765625, 8.681884765625, 8.9627685546875, 9.24365234375, 9.5245361328125, 9.805419921875, 10.0863037109375, 10.3671875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 9.0, 26.0, 39.0, 81.0, 156.0, 210.0, 191.0, 134.0, 82.0, 39.0, 18.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-172.3468017578125, -166.20130920410156, -160.0558319091797, -153.91033935546875, -147.76486206054688, -141.61936950683594, -135.473876953125, -129.32839965820312, -123.18290710449219, -117.03742218017578, -110.89193725585938, -104.74644470214844, -98.60095977783203, -92.45547485351562, -86.30998229980469, -80.16449737548828, -74.01901245117188, -67.87352752685547, -61.7280387878418, -55.582550048828125, -49.43706512451172, -43.29158020019531, -37.14609146118164, -31.00060272216797, -24.855117797851562, -18.709630966186523, -12.564144134521484, -6.418657302856445, -0.27317047119140625, 5.872316360473633, 12.017803192138672, 18.163291931152344, 24.30877685546875, 30.45426368713379, 36.59975051879883, 42.7452392578125, 48.890724182128906, 55.03620910644531, 61.181697845458984, 67.32718658447266, 73.47267150878906, 79.61815643310547, 85.76364135742188, 91.90913391113281, 98.05461883544922, 104.20010375976562, 110.34559631347656, 116.49108123779297, 122.63656616210938, 128.7820587158203, 134.9275360107422, 141.07302856445312, 147.218505859375, 153.36399841308594, 159.50949096679688, 165.65496826171875, 171.8004608154297, 177.94595336914062, 184.0914306640625, 190.23692321777344, 196.38241577148438, 202.52789306640625, 208.6733856201172, 214.81887817382812, 220.96435546875]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 6.0, 9.0, 10.0, 19.0, 16.0, 11.0, 18.0, 23.0, 21.0, 31.0, 24.0, 25.0, 27.0, 31.0, 39.0, 41.0, 52.0, 48.0, 52.0, 42.0, 42.0, 41.0, 33.0, 43.0, 36.0, 34.0, 32.0, 35.0, 21.0, 22.0, 17.0, 14.0, 12.0, 7.0, 13.0, 11.0, 11.0, 7.0, 10.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-72.09889221191406, -70.00700378417969, -67.91511535644531, -65.82323455810547, -63.731346130371094, -61.63945770263672, -59.547569274902344, -57.45568084716797, -55.36379623413086, -53.271907806396484, -51.180023193359375, -49.088134765625, -46.996246337890625, -44.904361724853516, -42.81247329711914, -40.72058868408203, -38.628700256347656, -36.53681182861328, -34.44492721557617, -32.3530387878418, -30.261152267456055, -28.169265747070312, -26.077377319335938, -23.985490798950195, -21.893604278564453, -19.80171775817871, -17.70983123779297, -15.617942810058594, -13.526056289672852, -11.43416976928711, -9.34228229522705, -7.250394821166992, -5.158515930175781, -3.066628932952881, -0.9747419357299805, 1.11714506149292, 3.2090320587158203, 5.3009185791015625, 7.392806053161621, 9.48469352722168, 11.576580047607422, 13.668466567993164, 15.760354042053223, 17.85224151611328, 19.944128036499023, 22.036014556884766, 24.12790298461914, 26.219789505004883, 28.311676025390625, 30.403562545776367, 32.49544906616211, 34.587337493896484, 36.679222106933594, 38.77111053466797, 40.862998962402344, 42.95488739013672, 45.04677200317383, 47.1386604309082, 49.23054504394531, 51.32243347167969, 53.41432189941406, 55.50620651245117, 57.59809494018555, 59.689979553222656, 61.78186798095703]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 12.0, 7.0, 7.0, 18.0, 25.0, 37.0, 52.0, 73.0, 128.0, 167.0, 288.0, 392.0, 636.0, 1073.0, 1724.0, 3093.0, 5907.0, 12133.0, 27312.0, 71997.0, 278254.0, 3078994.0, 537049.0, 105146.0, 36667.0, 15789.0, 7550.0, 3998.0, 2264.0, 1317.0, 812.0, 479.0, 303.0, 207.0, 125.0, 70.0, 53.0, 43.0, 26.0, 22.0, 13.0, 8.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.296875, -15.7822265625, -15.267578125, -14.7529296875, -14.23828125, -13.7236328125, -13.208984375, -12.6943359375, -12.1796875, -11.6650390625, -11.150390625, -10.6357421875, -10.12109375, -9.6064453125, -9.091796875, -8.5771484375, -8.0625, -7.5478515625, -7.033203125, -6.5185546875, -6.00390625, -5.4892578125, -4.974609375, -4.4599609375, -3.9453125, -3.4306640625, -2.916015625, -2.4013671875, -1.88671875, -1.3720703125, -0.857421875, -0.3427734375, 0.171875, 0.6865234375, 1.201171875, 1.7158203125, 2.23046875, 2.7451171875, 3.259765625, 3.7744140625, 4.2890625, 4.8037109375, 5.318359375, 5.8330078125, 6.34765625, 6.8623046875, 7.376953125, 7.8916015625, 8.40625, 8.9208984375, 9.435546875, 9.9501953125, 10.46484375, 10.9794921875, 11.494140625, 12.0087890625, 12.5234375, 13.0380859375, 13.552734375, 14.0673828125, 14.58203125, 15.0966796875, 15.611328125, 16.1259765625, 16.640625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 2.0, 1.0, 4.0, 8.0, 12.0, 13.0, 21.0, 20.0, 18.0, 21.0, 30.0, 25.0, 22.0, 48.0, 29.0, 56.0, 44.0, 50.0, 46.0, 47.0, 52.0, 40.0, 33.0, 43.0, 37.0, 40.0, 38.0, 33.0, 29.0, 27.0, 18.0, 12.0, 15.0, 13.0, 23.0, 8.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.658203125, -2.5657958984375, -2.473388671875, -2.3809814453125, -2.28857421875, -2.1961669921875, -2.103759765625, -2.0113525390625, -1.9189453125, -1.8265380859375, -1.734130859375, -1.6417236328125, -1.54931640625, -1.4569091796875, -1.364501953125, -1.2720947265625, -1.1796875, -1.0872802734375, -0.994873046875, -0.9024658203125, -0.81005859375, -0.7176513671875, -0.625244140625, -0.5328369140625, -0.4404296875, -0.3480224609375, -0.255615234375, -0.1632080078125, -0.07080078125, 0.0216064453125, 0.114013671875, 0.2064208984375, 0.298828125, 0.3912353515625, 0.483642578125, 0.5760498046875, 0.66845703125, 0.7608642578125, 0.853271484375, 0.9456787109375, 1.0380859375, 1.1304931640625, 1.222900390625, 1.3153076171875, 1.40771484375, 1.5001220703125, 1.592529296875, 1.6849365234375, 1.77734375, 1.8697509765625, 1.962158203125, 2.0545654296875, 2.14697265625, 2.2393798828125, 2.331787109375, 2.4241943359375, 2.5166015625, 2.6090087890625, 2.701416015625, 2.7938232421875, 2.88623046875, 2.9786376953125, 3.071044921875, 3.1634521484375, 3.255859375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 14.0, 18.0, 21.0, 28.0, 50.0, 59.0, 108.0, 192.0, 441.0, 1197.0, 3423.0, 13214.0, 68803.0, 738083.0, 3156358.0, 176343.0, 26605.0, 6129.0, 1821.0, 679.0, 281.0, 141.0, 61.0, 48.0, 28.0, 19.0, 22.0, 14.0, 14.0, 14.0, 5.0, 7.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.0625, -23.2919921875, -22.521484375, -21.7509765625, -20.98046875, -20.2099609375, -19.439453125, -18.6689453125, -17.8984375, -17.1279296875, -16.357421875, -15.5869140625, -14.81640625, -14.0458984375, -13.275390625, -12.5048828125, -11.734375, -10.9638671875, -10.193359375, -9.4228515625, -8.65234375, -7.8818359375, -7.111328125, -6.3408203125, -5.5703125, -4.7998046875, -4.029296875, -3.2587890625, -2.48828125, -1.7177734375, -0.947265625, -0.1767578125, 0.59375, 1.3642578125, 2.134765625, 2.9052734375, 3.67578125, 4.4462890625, 5.216796875, 5.9873046875, 6.7578125, 7.5283203125, 8.298828125, 9.0693359375, 9.83984375, 10.6103515625, 11.380859375, 12.1513671875, 12.921875, 13.6923828125, 14.462890625, 15.2333984375, 16.00390625, 16.7744140625, 17.544921875, 18.3154296875, 19.0859375, 19.8564453125, 20.626953125, 21.3974609375, 22.16796875, 22.9384765625, 23.708984375, 24.4794921875, 25.25]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 0.0, 8.0, 2.0, 8.0, 15.0, 15.0, 35.0, 31.0, 55.0, 70.0, 113.0, 190.0, 360.0, 759.0, 1230.0, 469.0, 245.0, 163.0, 91.0, 70.0, 51.0, 25.0, 21.0, 14.0, 12.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.765625, -10.50457763671875, -10.2435302734375, -9.98248291015625, -9.721435546875, -9.46038818359375, -9.1993408203125, -8.93829345703125, -8.67724609375, -8.41619873046875, -8.1551513671875, -7.89410400390625, -7.633056640625, -7.37200927734375, -7.1109619140625, -6.84991455078125, -6.5888671875, -6.32781982421875, -6.0667724609375, -5.80572509765625, -5.544677734375, -5.28363037109375, -5.0225830078125, -4.76153564453125, -4.50048828125, -4.23944091796875, -3.9783935546875, -3.71734619140625, -3.456298828125, -3.19525146484375, -2.9342041015625, -2.67315673828125, -2.412109375, -2.15106201171875, -1.8900146484375, -1.62896728515625, -1.367919921875, -1.10687255859375, -0.8458251953125, -0.58477783203125, -0.32373046875, -0.06268310546875, 0.1983642578125, 0.45941162109375, 0.720458984375, 0.98150634765625, 1.2425537109375, 1.50360107421875, 1.7646484375, 2.02569580078125, 2.2867431640625, 2.54779052734375, 2.808837890625, 3.06988525390625, 3.3309326171875, 3.59197998046875, 3.85302734375, 4.11407470703125, 4.3751220703125, 4.63616943359375, 4.897216796875, 5.15826416015625, 5.4193115234375, 5.68035888671875, 5.94140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 16.0, 48.0, 91.0, 169.0, 247.0, 217.0, 105.0, 54.0, 26.0, 10.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-160.65032958984375, -157.3536834716797, -154.05703735351562, -150.76040649414062, -147.46376037597656, -144.1671142578125, -140.87046813964844, -137.57382202148438, -134.2771759033203, -130.98052978515625, -127.68389129638672, -124.38724517822266, -121.0905990600586, -117.79396057128906, -114.497314453125, -111.20066833496094, -107.90403747558594, -104.60739135742188, -101.31075286865234, -98.01410675048828, -94.71746063232422, -91.42082214355469, -88.12417602539062, -84.82752990722656, -81.5308837890625, -78.23423767089844, -74.9375991821289, -71.64095306396484, -68.34430694580078, -65.04766845703125, -61.75102233886719, -58.45438003540039, -55.15774154663086, -51.86109924316406, -48.564453125, -45.2678108215332, -41.971168518066406, -38.674522399902344, -35.37788009643555, -32.08123779296875, -28.78459358215332, -25.48794937133789, -22.191307067871094, -18.894662857055664, -15.59801959991455, -12.301376342773438, -9.004732131958008, -5.708089828491211, -2.4114456176757812, 0.8851978778839111, 4.1818413734436035, 7.478485107421875, 10.775128364562988, 14.071771621704102, 17.36841583251953, 20.665058135986328, 23.961702346801758, 27.258346557617188, 30.554988861083984, 33.85163116455078, 37.148277282714844, 40.44491958618164, 43.74156188964844, 47.0382080078125, 50.3348503112793]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 7.0, 8.0, 7.0, 7.0, 17.0, 13.0, 11.0, 16.0, 19.0, 23.0, 20.0, 30.0, 31.0, 23.0, 37.0, 39.0, 32.0, 42.0, 41.0, 38.0, 50.0, 36.0, 40.0, 29.0, 38.0, 47.0, 52.0, 34.0, 23.0, 21.0, 27.0, 16.0, 24.0, 15.0, 9.0, 17.0, 8.0, 6.0, 7.0, 6.0, 7.0, 5.0, 2.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.069576263427734, -20.323698043823242, -19.57781982421875, -18.83194351196289, -18.0860652923584, -17.340187072753906, -16.594308853149414, -15.848430633544922, -15.102553367614746, -14.356675148010254, -13.610797882080078, -12.864919662475586, -12.119041442871094, -11.373164176940918, -10.627285957336426, -9.88140869140625, -9.135530471801758, -8.389652252197266, -7.64377498626709, -6.897896766662598, -6.152019023895264, -5.40614128112793, -4.6602630615234375, -3.9143853187561035, -3.1685075759887695, -2.4226298332214355, -1.6767518520355225, -0.9308738708496094, -0.1849961280822754, 0.5608816146850586, 1.3067598342895508, 2.0526375770568848, 2.7985172271728516, 3.5443949699401855, 4.2902727127075195, 5.036150932312012, 5.782028675079346, 6.52790641784668, 7.273784637451172, 8.019662857055664, 8.76554012298584, 9.511418342590332, 10.257295608520508, 11.003173828125, 11.749052047729492, 12.494929313659668, 13.24080753326416, 13.986684799194336, 14.732563018798828, 15.47844123840332, 16.224319458007812, 16.970195770263672, 17.716073989868164, 18.461952209472656, 19.20783042907715, 19.95370864868164, 20.6995849609375, 21.445463180541992, 22.191341400146484, 22.937217712402344, 23.683095932006836, 24.428974151611328, 25.17485237121582, 25.920730590820312, 26.666608810424805]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 7.0, 4.0, 12.0, 17.0, 29.0, 41.0, 76.0, 113.0, 173.0, 272.0, 464.0, 801.0, 1452.0, 2705.0, 5657.0, 11664.0, 25563.0, 59120.0, 163087.0, 469149.0, 188661.0, 65878.0, 27966.0, 12857.0, 6054.0, 3002.0, 1552.0, 861.0, 495.0, 293.0, 197.0, 126.0, 77.0, 55.0, 30.0, 17.0, 14.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-19.953125, -19.421875, -18.890625, -18.359375, -17.828125, -17.296875, -16.765625, -16.234375, -15.703125, -15.171875, -14.640625, -14.109375, -13.578125, -13.046875, -12.515625, -11.984375, -11.453125, -10.921875, -10.390625, -9.859375, -9.328125, -8.796875, -8.265625, -7.734375, -7.203125, -6.671875, -6.140625, -5.609375, -5.078125, -4.546875, -4.015625, -3.484375, -2.953125, -2.421875, -1.890625, -1.359375, -0.828125, -0.296875, 0.234375, 0.765625, 1.296875, 1.828125, 2.359375, 2.890625, 3.421875, 3.953125, 4.484375, 5.015625, 5.546875, 6.078125, 6.609375, 7.140625, 7.671875, 8.203125, 8.734375, 9.265625, 9.796875, 10.328125, 10.859375, 11.390625, 11.921875, 12.453125, 12.984375, 13.515625, 14.046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 9.0, 7.0, 17.0, 10.0, 9.0, 20.0, 29.0, 16.0, 28.0, 27.0, 37.0, 28.0, 24.0, 41.0, 55.0, 40.0, 62.0, 41.0, 50.0, 39.0, 41.0, 34.0, 42.0, 46.0, 32.0, 42.0, 32.0, 24.0, 20.0, 28.0, 10.0, 16.0, 14.0, 10.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.30645751953125, -2.2144775390625, -2.12249755859375, -2.030517578125, -1.93853759765625, -1.8465576171875, -1.75457763671875, -1.66259765625, -1.57061767578125, -1.4786376953125, -1.38665771484375, -1.294677734375, -1.20269775390625, -1.1107177734375, -1.01873779296875, -0.9267578125, -0.83477783203125, -0.7427978515625, -0.65081787109375, -0.558837890625, -0.46685791015625, -0.3748779296875, -0.28289794921875, -0.19091796875, -0.09893798828125, -0.0069580078125, 0.08502197265625, 0.177001953125, 0.26898193359375, 0.3609619140625, 0.45294189453125, 0.544921875, 0.63690185546875, 0.7288818359375, 0.82086181640625, 0.912841796875, 1.00482177734375, 1.0968017578125, 1.18878173828125, 1.28076171875, 1.37274169921875, 1.4647216796875, 1.55670166015625, 1.648681640625, 1.74066162109375, 1.8326416015625, 1.92462158203125, 2.0166015625, 2.10858154296875, 2.2005615234375, 2.29254150390625, 2.384521484375, 2.47650146484375, 2.5684814453125, 2.66046142578125, 2.75244140625, 2.84442138671875, 2.9364013671875, 3.02838134765625, 3.120361328125, 3.21234130859375, 3.3043212890625, 3.39630126953125, 3.48828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 16.0, 17.0, 17.0, 22.0, 26.0, 49.0, 59.0, 73.0, 105.0, 125.0, 171.0, 249.0, 335.0, 494.0, 901.0, 1883.0, 5178.0, 15915.0, 53877.0, 194358.0, 545818.0, 161293.0, 45258.0, 13606.0, 4430.0, 1750.0, 863.0, 445.0, 321.0, 237.0, 166.0, 126.0, 90.0, 76.0, 52.0, 39.0, 29.0, 14.0, 17.0, 13.0, 12.0, 9.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.46875, -15.94482421875, -15.4208984375, -14.89697265625, -14.373046875, -13.84912109375, -13.3251953125, -12.80126953125, -12.27734375, -11.75341796875, -11.2294921875, -10.70556640625, -10.181640625, -9.65771484375, -9.1337890625, -8.60986328125, -8.0859375, -7.56201171875, -7.0380859375, -6.51416015625, -5.990234375, -5.46630859375, -4.9423828125, -4.41845703125, -3.89453125, -3.37060546875, -2.8466796875, -2.32275390625, -1.798828125, -1.27490234375, -0.7509765625, -0.22705078125, 0.296875, 0.82080078125, 1.3447265625, 1.86865234375, 2.392578125, 2.91650390625, 3.4404296875, 3.96435546875, 4.48828125, 5.01220703125, 5.5361328125, 6.06005859375, 6.583984375, 7.10791015625, 7.6318359375, 8.15576171875, 8.6796875, 9.20361328125, 9.7275390625, 10.25146484375, 10.775390625, 11.29931640625, 11.8232421875, 12.34716796875, 12.87109375, 13.39501953125, 13.9189453125, 14.44287109375, 14.966796875, 15.49072265625, 16.0146484375, 16.53857421875, 17.0625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 6.0, 5.0, 14.0, 12.0, 27.0, 12.0, 12.0, 21.0, 22.0, 33.0, 26.0, 34.0, 31.0, 31.0, 38.0, 42.0, 52.0, 42.0, 44.0, 47.0, 28.0, 42.0, 39.0, 34.0, 41.0, 36.0, 32.0, 27.0, 36.0, 17.0, 18.0, 23.0, 16.0, 14.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 7.0, 0.0, 4.0, 3.0, 1.0, 2.0], "bins": [-13.171875, -12.8050537109375, -12.438232421875, -12.0714111328125, -11.70458984375, -11.3377685546875, -10.970947265625, -10.6041259765625, -10.2373046875, -9.8704833984375, -9.503662109375, -9.1368408203125, -8.77001953125, -8.4031982421875, -8.036376953125, -7.6695556640625, -7.302734375, -6.9359130859375, -6.569091796875, -6.2022705078125, -5.83544921875, -5.4686279296875, -5.101806640625, -4.7349853515625, -4.3681640625, -4.0013427734375, -3.634521484375, -3.2677001953125, -2.90087890625, -2.5340576171875, -2.167236328125, -1.8004150390625, -1.43359375, -1.0667724609375, -0.699951171875, -0.3331298828125, 0.03369140625, 0.4005126953125, 0.767333984375, 1.1341552734375, 1.5009765625, 1.8677978515625, 2.234619140625, 2.6014404296875, 2.96826171875, 3.3350830078125, 3.701904296875, 4.0687255859375, 4.435546875, 4.8023681640625, 5.169189453125, 5.5360107421875, 5.90283203125, 6.2696533203125, 6.636474609375, 7.0032958984375, 7.3701171875, 7.7369384765625, 8.103759765625, 8.4705810546875, 8.83740234375, 9.2042236328125, 9.571044921875, 9.9378662109375, 10.3046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 8.0, 2.0, 7.0, 14.0, 23.0, 24.0, 60.0, 82.0, 152.0, 227.0, 411.0, 869.0, 2541.0, 10480.0, 59559.0, 538587.0, 378649.0, 44848.0, 8155.0, 2113.0, 802.0, 377.0, 214.0, 109.0, 89.0, 47.0, 27.0, 22.0, 10.0, 15.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.6640625, -13.2490234375, -12.833984375, -12.4189453125, -12.00390625, -11.5888671875, -11.173828125, -10.7587890625, -10.34375, -9.9287109375, -9.513671875, -9.0986328125, -8.68359375, -8.2685546875, -7.853515625, -7.4384765625, -7.0234375, -6.6083984375, -6.193359375, -5.7783203125, -5.36328125, -4.9482421875, -4.533203125, -4.1181640625, -3.703125, -3.2880859375, -2.873046875, -2.4580078125, -2.04296875, -1.6279296875, -1.212890625, -0.7978515625, -0.3828125, 0.0322265625, 0.447265625, 0.8623046875, 1.27734375, 1.6923828125, 2.107421875, 2.5224609375, 2.9375, 3.3525390625, 3.767578125, 4.1826171875, 4.59765625, 5.0126953125, 5.427734375, 5.8427734375, 6.2578125, 6.6728515625, 7.087890625, 7.5029296875, 7.91796875, 8.3330078125, 8.748046875, 9.1630859375, 9.578125, 9.9931640625, 10.408203125, 10.8232421875, 11.23828125, 11.6533203125, 12.068359375, 12.4833984375, 12.8984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 11.0, 10.0, 13.0, 9.0, 18.0, 18.0, 22.0, 29.0, 39.0, 96.0, 195.0, 223.0, 98.0, 33.0, 40.0, 23.0, 27.0, 21.0, 11.0, 7.0, 5.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001407623291015625, -0.0013535618782043457, -0.0012995004653930664, -0.0012454390525817871, -0.0011913776397705078, -0.0011373162269592285, -0.0010832548141479492, -0.00102919340133667, -0.0009751319885253906, -0.0009210705757141113, -0.000867009162902832, -0.0008129477500915527, -0.0007588863372802734, -0.0007048249244689941, -0.0006507635116577148, -0.0005967020988464355, -0.0005426406860351562, -0.000488579273223877, -0.00043451786041259766, -0.00038045644760131836, -0.00032639503479003906, -0.00027233362197875977, -0.00021827220916748047, -0.00016421079635620117, -0.00011014938354492188, -5.608797073364258e-05, -2.0265579223632812e-06, 5.2034854888916016e-05, 0.00010609626770019531, 0.0001601576805114746, 0.0002142190933227539, 0.0002682805061340332, 0.0003223419189453125, 0.0003764033317565918, 0.0004304647445678711, 0.0004845261573791504, 0.0005385875701904297, 0.000592648983001709, 0.0006467103958129883, 0.0007007718086242676, 0.0007548332214355469, 0.0008088946342468262, 0.0008629560470581055, 0.0009170174598693848, 0.0009710788726806641, 0.0010251402854919434, 0.0010792016983032227, 0.001133263111114502, 0.0011873245239257812, 0.0012413859367370605, 0.0012954473495483398, 0.0013495087623596191, 0.0014035701751708984, 0.0014576315879821777, 0.001511693000793457, 0.0015657544136047363, 0.0016198158264160156, 0.001673877239227295, 0.0017279386520385742, 0.0017820000648498535, 0.0018360614776611328, 0.0018901228904724121, 0.0019441843032836914, 0.0019982457160949707, 0.00205230712890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 11.0, 11.0, 13.0, 25.0, 38.0, 68.0, 106.0, 181.0, 370.0, 805.0, 2653.0, 20759.0, 635327.0, 370033.0, 14534.0, 2191.0, 685.0, 351.0, 178.0, 74.0, 60.0, 31.0, 20.0, 15.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.953125, -17.170166015625, -16.38720703125, -15.604248046875, -14.8212890625, -14.038330078125, -13.25537109375, -12.472412109375, -11.689453125, -10.906494140625, -10.12353515625, -9.340576171875, -8.5576171875, -7.774658203125, -6.99169921875, -6.208740234375, -5.42578125, -4.642822265625, -3.85986328125, -3.076904296875, -2.2939453125, -1.510986328125, -0.72802734375, 0.054931640625, 0.837890625, 1.620849609375, 2.40380859375, 3.186767578125, 3.9697265625, 4.752685546875, 5.53564453125, 6.318603515625, 7.1015625, 7.884521484375, 8.66748046875, 9.450439453125, 10.2333984375, 11.016357421875, 11.79931640625, 12.582275390625, 13.365234375, 14.148193359375, 14.93115234375, 15.714111328125, 16.4970703125, 17.280029296875, 18.06298828125, 18.845947265625, 19.62890625, 20.411865234375, 21.19482421875, 21.977783203125, 22.7607421875, 23.543701171875, 24.32666015625, 25.109619140625, 25.892578125, 26.675537109375, 27.45849609375, 28.241455078125, 29.0244140625, 29.807373046875, 30.59033203125, 31.373291015625, 32.15625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 6.0, 4.0, 11.0, 9.0, 16.0, 17.0, 24.0, 29.0, 34.0, 50.0, 62.0, 84.0, 109.0, 105.0, 89.0, 61.0, 65.0, 39.0, 33.0, 26.0, 23.0, 15.0, 14.0, 22.0, 9.0, 5.0, 6.0, 2.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.5625, -7.33514404296875, -7.1077880859375, -6.88043212890625, -6.653076171875, -6.42572021484375, -6.1983642578125, -5.97100830078125, -5.74365234375, -5.51629638671875, -5.2889404296875, -5.06158447265625, -4.834228515625, -4.60687255859375, -4.3795166015625, -4.15216064453125, -3.9248046875, -3.69744873046875, -3.4700927734375, -3.24273681640625, -3.015380859375, -2.78802490234375, -2.5606689453125, -2.33331298828125, -2.10595703125, -1.87860107421875, -1.6512451171875, -1.42388916015625, -1.196533203125, -0.96917724609375, -0.7418212890625, -0.51446533203125, -0.287109375, -0.05975341796875, 0.1676025390625, 0.39495849609375, 0.622314453125, 0.84967041015625, 1.0770263671875, 1.30438232421875, 1.53173828125, 1.75909423828125, 1.9864501953125, 2.21380615234375, 2.441162109375, 2.66851806640625, 2.8958740234375, 3.12322998046875, 3.3505859375, 3.57794189453125, 3.8052978515625, 4.03265380859375, 4.260009765625, 4.48736572265625, 4.7147216796875, 4.94207763671875, 5.16943359375, 5.39678955078125, 5.6241455078125, 5.85150146484375, 6.078857421875, 6.30621337890625, 6.5335693359375, 6.76092529296875, 6.98828125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 21.0, 49.0, 99.0, 147.0, 210.0, 186.0, 143.0, 63.0, 34.0, 23.0, 7.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.17317199707031, -59.779273986816406, -54.3853759765625, -48.99147415161133, -43.59757614135742, -38.203678131103516, -32.809776306152344, -27.415878295898438, -22.02198028564453, -16.628082275390625, -11.234182357788086, -5.840282440185547, -0.4463844299316406, 4.947513580322266, 10.341415405273438, 15.735313415527344, 21.12921142578125, 26.523109436035156, 31.917009353637695, 37.310909271240234, 42.70480728149414, 48.09870529174805, 53.49260711669922, 58.886505126953125, 64.28040313720703, 69.67430114746094, 75.06819915771484, 80.46209716796875, 85.85600280761719, 91.24989318847656, 96.643798828125, 102.0376968383789, 107.43157958984375, 112.82547760009766, 118.21937561035156, 123.61328125, 129.00717163085938, 134.4010772705078, 139.79498291015625, 145.18887329101562, 150.582763671875, 155.97666931152344, 161.3705596923828, 166.76446533203125, 172.15835571289062, 177.55226135253906, 182.9461669921875, 188.34005737304688, 193.7339630126953, 199.12786865234375, 204.52175903320312, 209.91566467285156, 215.30955505371094, 220.70346069335938, 226.09735107421875, 231.4912567138672, 236.88516235351562, 242.27906799316406, 247.67295837402344, 253.06686401367188, 258.46075439453125, 263.8546447753906, 269.2485656738281, 274.6424560546875, 280.0363464355469]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 9.0, 14.0, 8.0, 12.0, 14.0, 11.0, 14.0, 16.0, 16.0, 26.0, 27.0, 23.0, 31.0, 39.0, 35.0, 44.0, 38.0, 22.0, 60.0, 41.0, 41.0, 44.0, 46.0, 38.0, 38.0, 37.0, 28.0, 37.0, 28.0, 35.0, 24.0, 25.0, 13.0, 8.0, 11.0, 14.0, 7.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.59772491455078, -58.66156005859375, -56.72539520263672, -54.78923034667969, -52.853065490722656, -50.916900634765625, -48.98073959350586, -47.04457473754883, -45.1084098815918, -43.172245025634766, -41.236080169677734, -39.2999153137207, -37.36375427246094, -35.427589416503906, -33.491424560546875, -31.555259704589844, -29.619094848632812, -27.68292999267578, -25.74676513671875, -23.81060218811035, -21.87443733215332, -19.93827247619629, -18.00210952758789, -16.06594467163086, -14.129779815673828, -12.193614959716797, -10.257451057434082, -8.321287155151367, -6.385122299194336, -4.448957443237305, -2.51279354095459, -0.576629638671875, 1.3595314025878906, 3.2956957817077637, 5.231860160827637, 7.16802453994751, 9.104188919067383, 11.040353775024414, 12.976517677307129, 14.912681579589844, 16.848846435546875, 18.785011291503906, 20.721176147460938, 22.657339096069336, 24.593503952026367, 26.5296688079834, 28.465831756591797, 30.401996612548828, 32.33816146850586, 34.27432632446289, 36.21049118041992, 38.14665603637695, 40.08281707763672, 42.01898193359375, 43.95514678955078, 45.89131164550781, 47.827476501464844, 49.763641357421875, 51.699806213378906, 53.63597106933594, 55.57213592529297, 57.50830078125, 59.444461822509766, 61.3806266784668, 63.31679153442383]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 2.0, 7.0, 8.0, 21.0, 16.0, 22.0, 34.0, 38.0, 83.0, 114.0, 224.0, 450.0, 1096.0, 3001.0, 9471.0, 40717.0, 536180.0, 3496137.0, 83700.0, 15684.0, 4394.0, 1508.0, 662.0, 281.0, 167.0, 86.0, 54.0, 39.0, 21.0, 21.0, 7.0, 9.0, 4.0, 3.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.59375, -35.33984375, -34.0859375, -32.83203125, -31.578125, -30.32421875, -29.0703125, -27.81640625, -26.5625, -25.30859375, -24.0546875, -22.80078125, -21.546875, -20.29296875, -19.0390625, -17.78515625, -16.53125, -15.27734375, -14.0234375, -12.76953125, -11.515625, -10.26171875, -9.0078125, -7.75390625, -6.5, -5.24609375, -3.9921875, -2.73828125, -1.484375, -0.23046875, 1.0234375, 2.27734375, 3.53125, 4.78515625, 6.0390625, 7.29296875, 8.546875, 9.80078125, 11.0546875, 12.30859375, 13.5625, 14.81640625, 16.0703125, 17.32421875, 18.578125, 19.83203125, 21.0859375, 22.33984375, 23.59375, 24.84765625, 26.1015625, 27.35546875, 28.609375, 29.86328125, 31.1171875, 32.37109375, 33.625, 34.87890625, 36.1328125, 37.38671875, 38.640625, 39.89453125, 41.1484375, 42.40234375, 43.65625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 5.0, 13.0, 13.0, 14.0, 17.0, 19.0, 18.0, 31.0, 29.0, 33.0, 34.0, 40.0, 33.0, 49.0, 58.0, 57.0, 49.0, 39.0, 38.0, 40.0, 51.0, 43.0, 31.0, 37.0, 44.0, 20.0, 20.0, 21.0, 22.0, 16.0, 11.0, 14.0, 7.0, 8.0, 2.0, 6.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.921875, -2.82684326171875, -2.7318115234375, -2.63677978515625, -2.541748046875, -2.44671630859375, -2.3516845703125, -2.25665283203125, -2.16162109375, -2.06658935546875, -1.9715576171875, -1.87652587890625, -1.781494140625, -1.68646240234375, -1.5914306640625, -1.49639892578125, -1.4013671875, -1.30633544921875, -1.2113037109375, -1.11627197265625, -1.021240234375, -0.92620849609375, -0.8311767578125, -0.73614501953125, -0.64111328125, -0.54608154296875, -0.4510498046875, -0.35601806640625, -0.260986328125, -0.16595458984375, -0.0709228515625, 0.02410888671875, 0.119140625, 0.21417236328125, 0.3092041015625, 0.40423583984375, 0.499267578125, 0.59429931640625, 0.6893310546875, 0.78436279296875, 0.87939453125, 0.97442626953125, 1.0694580078125, 1.16448974609375, 1.259521484375, 1.35455322265625, 1.4495849609375, 1.54461669921875, 1.6396484375, 1.73468017578125, 1.8297119140625, 1.92474365234375, 2.019775390625, 2.11480712890625, 2.2098388671875, 2.30487060546875, 2.39990234375, 2.49493408203125, 2.5899658203125, 2.68499755859375, 2.780029296875, 2.87506103515625, 2.9700927734375, 3.06512451171875, 3.16015625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 9.0, 8.0, 20.0, 18.0, 22.0, 28.0, 30.0, 44.0, 44.0, 59.0, 71.0, 126.0, 164.0, 262.0, 557.0, 1348.0, 5035.0, 28460.0, 387352.0, 3639693.0, 112501.0, 13299.0, 2862.0, 934.0, 427.0, 238.0, 118.0, 103.0, 80.0, 81.0, 47.0, 38.0, 31.0, 37.0, 27.0, 22.0, 15.0, 11.0, 16.0, 7.0, 6.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.1875, -31.05029296875, -29.9130859375, -28.77587890625, -27.638671875, -26.50146484375, -25.3642578125, -24.22705078125, -23.08984375, -21.95263671875, -20.8154296875, -19.67822265625, -18.541015625, -17.40380859375, -16.2666015625, -15.12939453125, -13.9921875, -12.85498046875, -11.7177734375, -10.58056640625, -9.443359375, -8.30615234375, -7.1689453125, -6.03173828125, -4.89453125, -3.75732421875, -2.6201171875, -1.48291015625, -0.345703125, 0.79150390625, 1.9287109375, 3.06591796875, 4.203125, 5.34033203125, 6.4775390625, 7.61474609375, 8.751953125, 9.88916015625, 11.0263671875, 12.16357421875, 13.30078125, 14.43798828125, 15.5751953125, 16.71240234375, 17.849609375, 18.98681640625, 20.1240234375, 21.26123046875, 22.3984375, 23.53564453125, 24.6728515625, 25.81005859375, 26.947265625, 28.08447265625, 29.2216796875, 30.35888671875, 31.49609375, 32.63330078125, 33.7705078125, 34.90771484375, 36.044921875, 37.18212890625, 38.3193359375, 39.45654296875, 40.59375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 8.0, 24.0, 19.0, 60.0, 92.0, 212.0, 520.0, 1956.0, 696.0, 250.0, 102.0, 58.0, 33.0, 11.0, 13.0, 9.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0625, -6.637939453125, -6.21337890625, -5.788818359375, -5.3642578125, -4.939697265625, -4.51513671875, -4.090576171875, -3.666015625, -3.241455078125, -2.81689453125, -2.392333984375, -1.9677734375, -1.543212890625, -1.11865234375, -0.694091796875, -0.26953125, 0.155029296875, 0.57958984375, 1.004150390625, 1.4287109375, 1.853271484375, 2.27783203125, 2.702392578125, 3.126953125, 3.551513671875, 3.97607421875, 4.400634765625, 4.8251953125, 5.249755859375, 5.67431640625, 6.098876953125, 6.5234375, 6.947998046875, 7.37255859375, 7.797119140625, 8.2216796875, 8.646240234375, 9.07080078125, 9.495361328125, 9.919921875, 10.344482421875, 10.76904296875, 11.193603515625, 11.6181640625, 12.042724609375, 12.46728515625, 12.891845703125, 13.31640625, 13.740966796875, 14.16552734375, 14.590087890625, 15.0146484375, 15.439208984375, 15.86376953125, 16.288330078125, 16.712890625, 17.137451171875, 17.56201171875, 17.986572265625, 18.4111328125, 18.835693359375, 19.26025390625, 19.684814453125, 20.109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 15.0, 40.0, 71.0, 177.0, 221.0, 189.0, 145.0, 87.0, 27.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.99659729003906, -132.76165771484375, -129.52670288085938, -126.29175567626953, -123.05680847167969, -119.82186126708984, -116.5869140625, -113.35196685791016, -110.11701965332031, -106.88207244873047, -103.64712524414062, -100.41217803955078, -97.17723083496094, -93.9422836303711, -90.70733642578125, -87.4723892211914, -84.23744201660156, -81.00249481201172, -77.76754760742188, -74.53260040283203, -71.29765319824219, -68.06270599365234, -64.8277587890625, -61.592811584472656, -58.35786437988281, -55.12291717529297, -51.887969970703125, -48.65302276611328, -45.41807556152344, -42.183128356933594, -38.94818115234375, -35.713233947753906, -32.47828674316406, -29.24333953857422, -26.008392333984375, -22.77344512939453, -19.538497924804688, -16.303550720214844, -13.068603515625, -9.833656311035156, -6.5987091064453125, -3.3637619018554688, -0.128814697265625, 3.1061325073242188, 6.3410797119140625, 9.576026916503906, 12.81097412109375, 16.045921325683594, 19.280868530273438, 22.51581573486328, 25.750762939453125, 28.98571014404297, 32.22065734863281, 35.455604553222656, 38.6905517578125, 41.925498962402344, 45.16044616699219, 48.39539337158203, 51.630340576171875, 54.86528778076172, 58.10023498535156, 61.335182189941406, 64.57012939453125, 67.8050765991211, 71.04002380371094]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 6.0, 9.0, 5.0, 4.0, 8.0, 16.0, 15.0, 17.0, 22.0, 30.0, 34.0, 29.0, 40.0, 49.0, 45.0, 49.0, 61.0, 54.0, 42.0, 51.0, 36.0, 43.0, 48.0, 45.0, 44.0, 31.0, 31.0, 16.0, 24.0, 18.0, 13.0, 11.0, 11.0, 12.0, 7.0, 5.0, 3.0, 6.0, 4.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-36.22332000732422, -35.2440071105957, -34.26469421386719, -33.28538131713867, -32.306068420410156, -31.32675552368164, -30.347442626953125, -29.36812973022461, -28.388816833496094, -27.409503936767578, -26.430191040039062, -25.450878143310547, -24.47156524658203, -23.492252349853516, -22.512939453125, -21.533626556396484, -20.5543155670166, -19.575002670288086, -18.59568977355957, -17.616376876831055, -16.63706398010254, -15.657751083374023, -14.678439140319824, -13.699126243591309, -12.719813346862793, -11.740500450134277, -10.761187553405762, -9.781875610351562, -8.802562713623047, -7.823249340057373, -6.843936920166016, -5.8646240234375, -4.885311126708984, -3.9059982299804688, -2.9266855716705322, -1.9473729133605957, -0.9680600166320801, 0.011252880096435547, 0.990565299987793, 1.9698781967163086, 2.949191093444824, 3.92850399017334, 4.9078168869018555, 5.887129306793213, 6.8664422035217285, 7.845755100250244, 8.825067520141602, 9.804380416870117, 10.783693313598633, 11.763006210327148, 12.742319107055664, 13.72163200378418, 14.700944900512695, 15.680257797241211, 16.659568786621094, 17.63888168334961, 18.618194580078125, 19.59750747680664, 20.576820373535156, 21.556133270263672, 22.535446166992188, 23.514759063720703, 24.49407196044922, 25.473384857177734, 26.45269775390625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 9.0, 13.0, 20.0, 30.0, 45.0, 46.0, 65.0, 128.0, 160.0, 260.0, 404.0, 806.0, 1502.0, 3110.0, 7103.0, 16944.0, 42840.0, 123992.0, 509438.0, 231819.0, 65666.0, 24904.0, 10255.0, 4374.0, 2079.0, 1015.0, 568.0, 336.0, 215.0, 146.0, 81.0, 54.0, 40.0, 19.0, 18.0, 15.0, 13.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.777099609375, -15.16357421875, -14.550048828125, -13.9365234375, -13.322998046875, -12.70947265625, -12.095947265625, -11.482421875, -10.868896484375, -10.25537109375, -9.641845703125, -9.0283203125, -8.414794921875, -7.80126953125, -7.187744140625, -6.57421875, -5.960693359375, -5.34716796875, -4.733642578125, -4.1201171875, -3.506591796875, -2.89306640625, -2.279541015625, -1.666015625, -1.052490234375, -0.43896484375, 0.174560546875, 0.7880859375, 1.401611328125, 2.01513671875, 2.628662109375, 3.2421875, 3.855712890625, 4.46923828125, 5.082763671875, 5.6962890625, 6.309814453125, 6.92333984375, 7.536865234375, 8.150390625, 8.763916015625, 9.37744140625, 9.990966796875, 10.6044921875, 11.218017578125, 11.83154296875, 12.445068359375, 13.05859375, 13.672119140625, 14.28564453125, 14.899169921875, 15.5126953125, 16.126220703125, 16.73974609375, 17.353271484375, 17.966796875, 18.580322265625, 19.19384765625, 19.807373046875, 20.4208984375, 21.034423828125, 21.64794921875, 22.261474609375, 22.875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 4.0, 18.0, 20.0, 9.0, 16.0, 33.0, 28.0, 22.0, 21.0, 38.0, 30.0, 40.0, 44.0, 43.0, 46.0, 54.0, 44.0, 49.0, 49.0, 42.0, 49.0, 37.0, 39.0, 40.0, 30.0, 31.0, 18.0, 17.0, 24.0, 15.0, 8.0, 6.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.9296875, -2.8299560546875, -2.730224609375, -2.6304931640625, -2.53076171875, -2.4310302734375, -2.331298828125, -2.2315673828125, -2.1318359375, -2.0321044921875, -1.932373046875, -1.8326416015625, -1.73291015625, -1.6331787109375, -1.533447265625, -1.4337158203125, -1.333984375, -1.2342529296875, -1.134521484375, -1.0347900390625, -0.93505859375, -0.8353271484375, -0.735595703125, -0.6358642578125, -0.5361328125, -0.4364013671875, -0.336669921875, -0.2369384765625, -0.13720703125, -0.0374755859375, 0.062255859375, 0.1619873046875, 0.26171875, 0.3614501953125, 0.461181640625, 0.5609130859375, 0.66064453125, 0.7603759765625, 0.860107421875, 0.9598388671875, 1.0595703125, 1.1593017578125, 1.259033203125, 1.3587646484375, 1.45849609375, 1.5582275390625, 1.657958984375, 1.7576904296875, 1.857421875, 1.9571533203125, 2.056884765625, 2.1566162109375, 2.25634765625, 2.3560791015625, 2.455810546875, 2.5555419921875, 2.6552734375, 2.7550048828125, 2.854736328125, 2.9544677734375, 3.05419921875, 3.1539306640625, 3.253662109375, 3.3533935546875, 3.453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 10.0, 13.0, 13.0, 15.0, 25.0, 24.0, 25.0, 47.0, 83.0, 121.0, 195.0, 356.0, 643.0, 1302.0, 2881.0, 7113.0, 17785.0, 46996.0, 143077.0, 499383.0, 222601.0, 64866.0, 24185.0, 9365.0, 3835.0, 1671.0, 792.0, 395.0, 237.0, 150.0, 100.0, 60.0, 54.0, 33.0, 33.0, 15.0, 16.0, 13.0, 3.0, 4.0, 5.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.734375, -14.296630859375, -13.85888671875, -13.421142578125, -12.9833984375, -12.545654296875, -12.10791015625, -11.670166015625, -11.232421875, -10.794677734375, -10.35693359375, -9.919189453125, -9.4814453125, -9.043701171875, -8.60595703125, -8.168212890625, -7.73046875, -7.292724609375, -6.85498046875, -6.417236328125, -5.9794921875, -5.541748046875, -5.10400390625, -4.666259765625, -4.228515625, -3.790771484375, -3.35302734375, -2.915283203125, -2.4775390625, -2.039794921875, -1.60205078125, -1.164306640625, -0.7265625, -0.288818359375, 0.14892578125, 0.586669921875, 1.0244140625, 1.462158203125, 1.89990234375, 2.337646484375, 2.775390625, 3.213134765625, 3.65087890625, 4.088623046875, 4.5263671875, 4.964111328125, 5.40185546875, 5.839599609375, 6.27734375, 6.715087890625, 7.15283203125, 7.590576171875, 8.0283203125, 8.466064453125, 8.90380859375, 9.341552734375, 9.779296875, 10.217041015625, 10.65478515625, 11.092529296875, 11.5302734375, 11.968017578125, 12.40576171875, 12.843505859375, 13.28125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 8.0, 12.0, 8.0, 9.0, 10.0, 11.0, 12.0, 11.0, 22.0, 28.0, 44.0, 24.0, 44.0, 37.0, 46.0, 38.0, 41.0, 50.0, 57.0, 36.0, 44.0, 35.0, 48.0, 39.0, 41.0, 31.0, 35.0, 30.0, 27.0, 17.0, 22.0, 23.0, 15.0, 16.0, 8.0, 4.0, 7.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.8682861328125, -12.455322265625, -12.0423583984375, -11.62939453125, -11.2164306640625, -10.803466796875, -10.3905029296875, -9.9775390625, -9.5645751953125, -9.151611328125, -8.7386474609375, -8.32568359375, -7.9127197265625, -7.499755859375, -7.0867919921875, -6.673828125, -6.2608642578125, -5.847900390625, -5.4349365234375, -5.02197265625, -4.6090087890625, -4.196044921875, -3.7830810546875, -3.3701171875, -2.9571533203125, -2.544189453125, -2.1312255859375, -1.71826171875, -1.3052978515625, -0.892333984375, -0.4793701171875, -0.06640625, 0.3465576171875, 0.759521484375, 1.1724853515625, 1.58544921875, 1.9984130859375, 2.411376953125, 2.8243408203125, 3.2373046875, 3.6502685546875, 4.063232421875, 4.4761962890625, 4.88916015625, 5.3021240234375, 5.715087890625, 6.1280517578125, 6.541015625, 6.9539794921875, 7.366943359375, 7.7799072265625, 8.19287109375, 8.6058349609375, 9.018798828125, 9.4317626953125, 9.8447265625, 10.2576904296875, 10.670654296875, 11.0836181640625, 11.49658203125, 11.9095458984375, 12.322509765625, 12.7354736328125, 13.1484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 10.0, 12.0, 30.0, 38.0, 63.0, 85.0, 145.0, 367.0, 869.0, 3126.0, 14965.0, 214076.0, 765664.0, 40579.0, 5883.0, 1553.0, 573.0, 231.0, 110.0, 62.0, 42.0, 30.0, 15.0, 11.0, 9.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.89013671875, -15.3271484375, -14.76416015625, -14.201171875, -13.63818359375, -13.0751953125, -12.51220703125, -11.94921875, -11.38623046875, -10.8232421875, -10.26025390625, -9.697265625, -9.13427734375, -8.5712890625, -8.00830078125, -7.4453125, -6.88232421875, -6.3193359375, -5.75634765625, -5.193359375, -4.63037109375, -4.0673828125, -3.50439453125, -2.94140625, -2.37841796875, -1.8154296875, -1.25244140625, -0.689453125, -0.12646484375, 0.4365234375, 0.99951171875, 1.5625, 2.12548828125, 2.6884765625, 3.25146484375, 3.814453125, 4.37744140625, 4.9404296875, 5.50341796875, 6.06640625, 6.62939453125, 7.1923828125, 7.75537109375, 8.318359375, 8.88134765625, 9.4443359375, 10.00732421875, 10.5703125, 11.13330078125, 11.6962890625, 12.25927734375, 12.822265625, 13.38525390625, 13.9482421875, 14.51123046875, 15.07421875, 15.63720703125, 16.2001953125, 16.76318359375, 17.326171875, 17.88916015625, 18.4521484375, 19.01513671875, 19.578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 9.0, 3.0, 5.0, 5.0, 6.0, 11.0, 9.0, 10.0, 25.0, 28.0, 28.0, 54.0, 103.0, 170.0, 204.0, 118.0, 66.0, 29.0, 20.0, 17.0, 17.0, 9.0, 11.0, 10.0, 7.0, 10.0, 1.0, 4.0, 0.0, 2.0, 0.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.001369476318359375, -0.001326829195022583, -0.001284182071685791, -0.001241534948348999, -0.001198887825012207, -0.001156240701675415, -0.001113593578338623, -0.001070946455001831, -0.001028299331665039, -0.000985652208328247, -0.0009430050849914551, -0.0009003579616546631, -0.0008577108383178711, -0.0008150637149810791, -0.0007724165916442871, -0.0007297694683074951, -0.0006871223449707031, -0.0006444752216339111, -0.0006018280982971191, -0.0005591809749603271, -0.0005165338516235352, -0.00047388672828674316, -0.00043123960494995117, -0.0003885924816131592, -0.0003459453582763672, -0.0003032982349395752, -0.0002606511116027832, -0.0002180039882659912, -0.00017535686492919922, -0.00013270974159240723, -9.006261825561523e-05, -4.741549491882324e-05, -4.76837158203125e-06, 3.787875175476074e-05, 8.052587509155273e-05, 0.00012317299842834473, 0.00016582012176513672, 0.0002084672451019287, 0.0002511143684387207, 0.0002937614917755127, 0.0003364086151123047, 0.0003790557384490967, 0.00042170286178588867, 0.00046434998512268066, 0.0005069971084594727, 0.0005496442317962646, 0.0005922913551330566, 0.0006349384784698486, 0.0006775856018066406, 0.0007202327251434326, 0.0007628798484802246, 0.0008055269718170166, 0.0008481740951538086, 0.0008908212184906006, 0.0009334683418273926, 0.0009761154651641846, 0.0010187625885009766, 0.0010614097118377686, 0.0011040568351745605, 0.0011467039585113525, 0.0011893510818481445, 0.0012319982051849365, 0.0012746453285217285, 0.0013172924518585205, 0.0013599395751953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 13.0, 7.0, 6.0, 15.0, 24.0, 30.0, 34.0, 59.0, 75.0, 125.0, 189.0, 299.0, 531.0, 781.0, 1374.0, 2482.0, 4879.0, 10943.0, 32042.0, 162570.0, 629396.0, 150680.0, 30768.0, 10625.0, 4721.0, 2405.0, 1309.0, 796.0, 499.0, 281.0, 201.0, 117.0, 89.0, 51.0, 40.0, 18.0, 17.0, 14.0, 14.0, 9.0, 12.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.78125, -9.449462890625, -9.11767578125, -8.785888671875, -8.4541015625, -8.122314453125, -7.79052734375, -7.458740234375, -7.126953125, -6.795166015625, -6.46337890625, -6.131591796875, -5.7998046875, -5.468017578125, -5.13623046875, -4.804443359375, -4.47265625, -4.140869140625, -3.80908203125, -3.477294921875, -3.1455078125, -2.813720703125, -2.48193359375, -2.150146484375, -1.818359375, -1.486572265625, -1.15478515625, -0.822998046875, -0.4912109375, -0.159423828125, 0.17236328125, 0.504150390625, 0.8359375, 1.167724609375, 1.49951171875, 1.831298828125, 2.1630859375, 2.494873046875, 2.82666015625, 3.158447265625, 3.490234375, 3.822021484375, 4.15380859375, 4.485595703125, 4.8173828125, 5.149169921875, 5.48095703125, 5.812744140625, 6.14453125, 6.476318359375, 6.80810546875, 7.139892578125, 7.4716796875, 7.803466796875, 8.13525390625, 8.467041015625, 8.798828125, 9.130615234375, 9.46240234375, 9.794189453125, 10.1259765625, 10.457763671875, 10.78955078125, 11.121337890625, 11.453125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 6.0, 8.0, 13.0, 11.0, 19.0, 40.0, 50.0, 71.0, 67.0, 112.0, 150.0, 125.0, 85.0, 67.0, 41.0, 26.0, 22.0, 18.0, 16.0, 13.0, 7.0, 4.0, 6.0, 3.0, 7.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.9298095703125, -9.625244140625, -9.3206787109375, -9.01611328125, -8.7115478515625, -8.406982421875, -8.1024169921875, -7.7978515625, -7.4932861328125, -7.188720703125, -6.8841552734375, -6.57958984375, -6.2750244140625, -5.970458984375, -5.6658935546875, -5.361328125, -5.0567626953125, -4.752197265625, -4.4476318359375, -4.14306640625, -3.8385009765625, -3.533935546875, -3.2293701171875, -2.9248046875, -2.6202392578125, -2.315673828125, -2.0111083984375, -1.70654296875, -1.4019775390625, -1.097412109375, -0.7928466796875, -0.48828125, -0.1837158203125, 0.120849609375, 0.4254150390625, 0.72998046875, 1.0345458984375, 1.339111328125, 1.6436767578125, 1.9482421875, 2.2528076171875, 2.557373046875, 2.8619384765625, 3.16650390625, 3.4710693359375, 3.775634765625, 4.0802001953125, 4.384765625, 4.6893310546875, 4.993896484375, 5.2984619140625, 5.60302734375, 5.9075927734375, 6.212158203125, 6.5167236328125, 6.8212890625, 7.1258544921875, 7.430419921875, 7.7349853515625, 8.03955078125, 8.3441162109375, 8.648681640625, 8.9532470703125, 9.2578125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 20.0, 19.0, 46.0, 102.0, 139.0, 184.0, 170.0, 125.0, 94.0, 56.0, 29.0, 17.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.27543640136719, -74.3579330444336, -69.4404296875, -64.52291870117188, -59.60541534423828, -54.68791198730469, -49.77040481567383, -44.85289764404297, -39.935394287109375, -35.01789093017578, -30.100383758544922, -25.182878494262695, -20.26537322998047, -15.347867965698242, -10.430362701416016, -5.512855529785156, -0.5953521728515625, 4.322153091430664, 9.23965835571289, 14.157163619995117, 19.074668884277344, 23.99217414855957, 28.909679412841797, 33.827186584472656, 38.74468994140625, 43.662193298339844, 48.5797004699707, 53.49720764160156, 58.414710998535156, 63.33221435546875, 68.24972534179688, 73.16722869873047, 78.08473205566406, 83.00223541259766, 87.91973876953125, 92.83724975585938, 97.75475311279297, 102.67225646972656, 107.58976745605469, 112.50727081298828, 117.42477416992188, 122.34227752685547, 127.25978088378906, 132.1772918701172, 137.09478759765625, 142.01229858398438, 146.9298095703125, 151.84732055664062, 156.7648162841797, 161.6823272705078, 166.59982299804688, 171.517333984375, 176.43484497070312, 181.3523406982422, 186.2698516845703, 191.18734741210938, 196.1048583984375, 201.02236938476562, 205.9398651123047, 210.8573760986328, 215.77487182617188, 220.6923828125, 225.60989379882812, 230.52740478515625, 235.4449005126953]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 8.0, 8.0, 11.0, 22.0, 13.0, 18.0, 23.0, 38.0, 29.0, 29.0, 42.0, 42.0, 46.0, 48.0, 33.0, 34.0, 56.0, 45.0, 41.0, 36.0, 36.0, 42.0, 39.0, 39.0, 39.0, 25.0, 31.0, 18.0, 19.0, 12.0, 13.0, 12.0, 3.0, 6.0, 7.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-65.46266174316406, -63.459285736083984, -61.455909729003906, -59.45252990722656, -57.449153900146484, -55.445777893066406, -53.44239807128906, -51.439022064208984, -49.435646057128906, -47.43227005004883, -45.42889404296875, -43.425514221191406, -41.42213821411133, -39.41876220703125, -37.415382385253906, -35.41200637817383, -33.40863037109375, -31.405254364013672, -29.40187644958496, -27.39849853515625, -25.395122528076172, -23.391746520996094, -21.388368606567383, -19.384990692138672, -17.381614685058594, -15.3782377243042, -13.374860763549805, -11.37148380279541, -9.368106842041016, -7.364729881286621, -5.361352920532227, -3.357975959777832, -1.3546066284179688, 0.6487703323364258, 2.6521472930908203, 4.655524253845215, 6.658901214599609, 8.662278175354004, 10.665655136108398, 12.669032096862793, 14.672409057617188, 16.675785064697266, 18.679162979125977, 20.682540893554688, 22.685916900634766, 24.689292907714844, 26.692670822143555, 28.696048736572266, 30.699424743652344, 32.70280075073242, 34.7061767578125, 36.709556579589844, 38.71293258666992, 40.71630859375, 42.719688415527344, 44.72306442260742, 46.7264404296875, 48.72981643676758, 50.733192443847656, 52.736572265625, 54.73994827270508, 56.743324279785156, 58.7467041015625, 60.75008010864258, 62.753456115722656]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 10.0, 7.0, 13.0, 25.0, 16.0, 32.0, 24.0, 43.0, 68.0, 97.0, 147.0, 175.0, 278.0, 405.0, 614.0, 980.0, 1613.0, 2821.0, 5023.0, 9800.0, 21426.0, 55353.0, 210935.0, 3191116.0, 535196.0, 94970.0, 32388.0, 14277.0, 7006.0, 3759.0, 2108.0, 1240.0, 759.0, 497.0, 333.0, 211.0, 156.0, 108.0, 80.0, 44.0, 37.0, 22.0, 17.0, 12.0, 14.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-23.3125, -22.621337890625, -21.93017578125, -21.239013671875, -20.5478515625, -19.856689453125, -19.16552734375, -18.474365234375, -17.783203125, -17.092041015625, -16.40087890625, -15.709716796875, -15.0185546875, -14.327392578125, -13.63623046875, -12.945068359375, -12.25390625, -11.562744140625, -10.87158203125, -10.180419921875, -9.4892578125, -8.798095703125, -8.10693359375, -7.415771484375, -6.724609375, -6.033447265625, -5.34228515625, -4.651123046875, -3.9599609375, -3.268798828125, -2.57763671875, -1.886474609375, -1.1953125, -0.504150390625, 0.18701171875, 0.878173828125, 1.5693359375, 2.260498046875, 2.95166015625, 3.642822265625, 4.333984375, 5.025146484375, 5.71630859375, 6.407470703125, 7.0986328125, 7.789794921875, 8.48095703125, 9.172119140625, 9.86328125, 10.554443359375, 11.24560546875, 11.936767578125, 12.6279296875, 13.319091796875, 14.01025390625, 14.701416015625, 15.392578125, 16.083740234375, 16.77490234375, 17.466064453125, 18.1572265625, 18.848388671875, 19.53955078125, 20.230712890625, 20.921875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 12.0, 7.0, 13.0, 18.0, 14.0, 17.0, 27.0, 25.0, 22.0, 43.0, 36.0, 48.0, 38.0, 50.0, 47.0, 56.0, 31.0, 34.0, 48.0, 38.0, 46.0, 32.0, 45.0, 34.0, 39.0, 39.0, 23.0, 18.0, 11.0, 13.0, 18.0, 12.0, 6.0, 4.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.888671875, -2.79107666015625, -2.6934814453125, -2.59588623046875, -2.498291015625, -2.40069580078125, -2.3031005859375, -2.20550537109375, -2.10791015625, -2.01031494140625, -1.9127197265625, -1.81512451171875, -1.717529296875, -1.61993408203125, -1.5223388671875, -1.42474365234375, -1.3271484375, -1.22955322265625, -1.1319580078125, -1.03436279296875, -0.936767578125, -0.83917236328125, -0.7415771484375, -0.64398193359375, -0.54638671875, -0.44879150390625, -0.3511962890625, -0.25360107421875, -0.156005859375, -0.05841064453125, 0.0391845703125, 0.13677978515625, 0.234375, 0.33197021484375, 0.4295654296875, 0.52716064453125, 0.624755859375, 0.72235107421875, 0.8199462890625, 0.91754150390625, 1.01513671875, 1.11273193359375, 1.2103271484375, 1.30792236328125, 1.405517578125, 1.50311279296875, 1.6007080078125, 1.69830322265625, 1.7958984375, 1.89349365234375, 1.9910888671875, 2.08868408203125, 2.186279296875, 2.28387451171875, 2.3814697265625, 2.47906494140625, 2.57666015625, 2.67425537109375, 2.7718505859375, 2.86944580078125, 2.967041015625, 3.06463623046875, 3.1622314453125, 3.25982666015625, 3.357421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 8.0, 11.0, 15.0, 19.0, 18.0, 19.0, 35.0, 34.0, 75.0, 102.0, 162.0, 255.0, 418.0, 692.0, 1376.0, 2557.0, 5616.0, 13397.0, 36560.0, 128500.0, 973631.0, 2761622.0, 189555.0, 48937.0, 16962.0, 6888.0, 3136.0, 1682.0, 775.0, 451.0, 258.0, 154.0, 103.0, 76.0, 61.0, 39.0, 29.0, 17.0, 14.0, 6.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.6875, -19.110595703125, -18.53369140625, -17.956787109375, -17.3798828125, -16.802978515625, -16.22607421875, -15.649169921875, -15.072265625, -14.495361328125, -13.91845703125, -13.341552734375, -12.7646484375, -12.187744140625, -11.61083984375, -11.033935546875, -10.45703125, -9.880126953125, -9.30322265625, -8.726318359375, -8.1494140625, -7.572509765625, -6.99560546875, -6.418701171875, -5.841796875, -5.264892578125, -4.68798828125, -4.111083984375, -3.5341796875, -2.957275390625, -2.38037109375, -1.803466796875, -1.2265625, -0.649658203125, -0.07275390625, 0.504150390625, 1.0810546875, 1.657958984375, 2.23486328125, 2.811767578125, 3.388671875, 3.965576171875, 4.54248046875, 5.119384765625, 5.6962890625, 6.273193359375, 6.85009765625, 7.427001953125, 8.00390625, 8.580810546875, 9.15771484375, 9.734619140625, 10.3115234375, 10.888427734375, 11.46533203125, 12.042236328125, 12.619140625, 13.196044921875, 13.77294921875, 14.349853515625, 14.9267578125, 15.503662109375, 16.08056640625, 16.657470703125, 17.234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 6.0, 3.0, 6.0, 3.0, 15.0, 12.0, 23.0, 34.0, 54.0, 61.0, 108.0, 230.0, 486.0, 1653.0, 634.0, 308.0, 147.0, 85.0, 63.0, 47.0, 28.0, 17.0, 11.0, 7.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.953125, -8.6876220703125, -8.422119140625, -8.1566162109375, -7.89111328125, -7.6256103515625, -7.360107421875, -7.0946044921875, -6.8291015625, -6.5635986328125, -6.298095703125, -6.0325927734375, -5.76708984375, -5.5015869140625, -5.236083984375, -4.9705810546875, -4.705078125, -4.4395751953125, -4.174072265625, -3.9085693359375, -3.64306640625, -3.3775634765625, -3.112060546875, -2.8465576171875, -2.5810546875, -2.3155517578125, -2.050048828125, -1.7845458984375, -1.51904296875, -1.2535400390625, -0.988037109375, -0.7225341796875, -0.45703125, -0.1915283203125, 0.073974609375, 0.3394775390625, 0.60498046875, 0.8704833984375, 1.135986328125, 1.4014892578125, 1.6669921875, 1.9324951171875, 2.197998046875, 2.4635009765625, 2.72900390625, 2.9945068359375, 3.260009765625, 3.5255126953125, 3.791015625, 4.0565185546875, 4.322021484375, 4.5875244140625, 4.85302734375, 5.1185302734375, 5.384033203125, 5.6495361328125, 5.9150390625, 6.1805419921875, 6.446044921875, 6.7115478515625, 6.97705078125, 7.2425537109375, 7.508056640625, 7.7735595703125, 8.0390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 11.0, 7.0, 6.0, 9.0, 20.0, 21.0, 38.0, 54.0, 96.0, 109.0, 127.0, 126.0, 109.0, 94.0, 67.0, 35.0, 39.0, 17.0, 9.0, 10.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.28128051757812, -68.7434310913086, -67.2055892944336, -65.66773986816406, -64.12989044189453, -62.59204864501953, -61.05419921875, -59.516353607177734, -57.97850799560547, -56.4406623840332, -54.90281295776367, -53.364967346191406, -51.82712173461914, -50.289276123046875, -48.751426696777344, -47.21358108520508, -45.67573547363281, -44.13788986206055, -42.600040435791016, -41.06219482421875, -39.524349212646484, -37.98650360107422, -36.44865417480469, -34.91080856323242, -33.37295913696289, -31.835111618041992, -30.297266006469727, -28.759418487548828, -27.221572875976562, -25.683725357055664, -24.145877838134766, -22.6080322265625, -21.070188522338867, -19.53234100341797, -17.994495391845703, -16.456647872924805, -14.918802261352539, -13.38095474243164, -11.843108177185059, -10.305261611938477, -8.767415046691895, -7.2295684814453125, -5.6917219161987305, -4.15387487411499, -2.616028308868408, -1.0781817436218262, 0.45966529846191406, 1.997511863708496, 3.535358428955078, 5.07320499420166, 6.611051559448242, 8.14889907836914, 9.686744689941406, 11.224592208862305, 12.762438774108887, 14.300285339355469, 15.83813190460205, 17.375978469848633, 18.91382598876953, 20.451671600341797, 21.989519119262695, 23.52736473083496, 25.06521224975586, 26.603057861328125, 28.140905380249023]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 11.0, 11.0, 10.0, 9.0, 14.0, 17.0, 16.0, 26.0, 32.0, 29.0, 41.0, 32.0, 36.0, 46.0, 43.0, 37.0, 42.0, 38.0, 52.0, 35.0, 48.0, 40.0, 37.0, 58.0, 36.0, 29.0, 31.0, 24.0, 22.0, 21.0, 10.0, 19.0, 10.0, 4.0, 7.0, 2.0, 11.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.436439514160156, -25.6163387298584, -24.79623794555664, -23.976137161254883, -23.156036376953125, -22.335933685302734, -21.515832901000977, -20.69573211669922, -19.87563133239746, -19.055530548095703, -18.235429763793945, -17.415328979492188, -16.595226287841797, -15.775126457214355, -14.955024719238281, -14.134923934936523, -13.314823150634766, -12.494722366333008, -11.67462158203125, -10.854519844055176, -10.034419059753418, -9.21431827545166, -8.394216537475586, -7.574115753173828, -6.75401496887207, -5.9339141845703125, -5.1138129234313965, -4.2937116622924805, -3.4736108779907227, -2.653510093688965, -1.8334088325500488, -1.0133075714111328, -0.1932086944580078, 0.6268923282623291, 1.446993350982666, 2.267094373703003, 3.08719539642334, 3.9072961807250977, 4.727397441864014, 5.54749870300293, 6.3675994873046875, 7.187700271606445, 8.007801055908203, 8.827902793884277, 9.648003578186035, 10.468104362487793, 11.288206100463867, 12.108306884765625, 12.928407669067383, 13.74850845336914, 14.568609237670898, 15.388710975646973, 16.208812713623047, 17.028911590576172, 17.849014282226562, 18.66911506652832, 19.489215850830078, 20.309316635131836, 21.129417419433594, 21.94951820373535, 22.76961898803711, 23.5897216796875, 24.409822463989258, 25.229923248291016, 26.050024032592773]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 11.0, 12.0, 22.0, 30.0, 48.0, 68.0, 109.0, 217.0, 351.0, 569.0, 1144.0, 2368.0, 5256.0, 12797.0, 34871.0, 94199.0, 246733.0, 375501.0, 170368.0, 63832.0, 23607.0, 8883.0, 3813.0, 1781.0, 866.0, 438.0, 295.0, 152.0, 75.0, 52.0, 33.0, 22.0, 16.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.421875, -17.793212890625, -17.16455078125, -16.535888671875, -15.9072265625, -15.278564453125, -14.64990234375, -14.021240234375, -13.392578125, -12.763916015625, -12.13525390625, -11.506591796875, -10.8779296875, -10.249267578125, -9.62060546875, -8.991943359375, -8.36328125, -7.734619140625, -7.10595703125, -6.477294921875, -5.8486328125, -5.219970703125, -4.59130859375, -3.962646484375, -3.333984375, -2.705322265625, -2.07666015625, -1.447998046875, -0.8193359375, -0.190673828125, 0.43798828125, 1.066650390625, 1.6953125, 2.323974609375, 2.95263671875, 3.581298828125, 4.2099609375, 4.838623046875, 5.46728515625, 6.095947265625, 6.724609375, 7.353271484375, 7.98193359375, 8.610595703125, 9.2392578125, 9.867919921875, 10.49658203125, 11.125244140625, 11.75390625, 12.382568359375, 13.01123046875, 13.639892578125, 14.2685546875, 14.897216796875, 15.52587890625, 16.154541015625, 16.783203125, 17.411865234375, 18.04052734375, 18.669189453125, 19.2978515625, 19.926513671875, 20.55517578125, 21.183837890625, 21.8125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 3.0, 9.0, 10.0, 15.0, 16.0, 16.0, 31.0, 26.0, 24.0, 27.0, 42.0, 56.0, 53.0, 53.0, 55.0, 53.0, 50.0, 43.0, 37.0, 46.0, 44.0, 47.0, 35.0, 34.0, 38.0, 21.0, 16.0, 19.0, 20.0, 11.0, 12.0, 7.0, 6.0, 8.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.255859375, -3.141693115234375, -3.02752685546875, -2.913360595703125, -2.7991943359375, -2.685028076171875, -2.57086181640625, -2.456695556640625, -2.342529296875, -2.228363037109375, -2.11419677734375, -2.000030517578125, -1.8858642578125, -1.771697998046875, -1.65753173828125, -1.543365478515625, -1.42919921875, -1.315032958984375, -1.20086669921875, -1.086700439453125, -0.9725341796875, -0.858367919921875, -0.74420166015625, -0.630035400390625, -0.515869140625, -0.401702880859375, -0.28753662109375, -0.173370361328125, -0.0592041015625, 0.054962158203125, 0.16912841796875, 0.283294677734375, 0.3974609375, 0.511627197265625, 0.62579345703125, 0.739959716796875, 0.8541259765625, 0.968292236328125, 1.08245849609375, 1.196624755859375, 1.310791015625, 1.424957275390625, 1.53912353515625, 1.653289794921875, 1.7674560546875, 1.881622314453125, 1.99578857421875, 2.109954833984375, 2.22412109375, 2.338287353515625, 2.45245361328125, 2.566619873046875, 2.6807861328125, 2.794952392578125, 2.90911865234375, 3.023284912109375, 3.137451171875, 3.251617431640625, 3.36578369140625, 3.479949951171875, 3.5941162109375, 3.708282470703125, 3.82244873046875, 3.936614990234375, 4.05078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 3.0, 6.0, 12.0, 9.0, 13.0, 22.0, 16.0, 32.0, 33.0, 37.0, 63.0, 58.0, 87.0, 78.0, 132.0, 157.0, 223.0, 292.0, 382.0, 513.0, 850.0, 1728.0, 4799.0, 18268.0, 84723.0, 371706.0, 430680.0, 101306.0, 21719.0, 5414.0, 1935.0, 926.0, 583.0, 364.0, 311.0, 234.0, 167.0, 142.0, 118.0, 86.0, 67.0, 46.0, 41.0, 40.0, 30.0, 30.0, 22.0, 15.0, 7.0, 9.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-21.25, -20.587158203125, -19.92431640625, -19.261474609375, -18.5986328125, -17.935791015625, -17.27294921875, -16.610107421875, -15.947265625, -15.284423828125, -14.62158203125, -13.958740234375, -13.2958984375, -12.633056640625, -11.97021484375, -11.307373046875, -10.64453125, -9.981689453125, -9.31884765625, -8.656005859375, -7.9931640625, -7.330322265625, -6.66748046875, -6.004638671875, -5.341796875, -4.678955078125, -4.01611328125, -3.353271484375, -2.6904296875, -2.027587890625, -1.36474609375, -0.701904296875, -0.0390625, 0.623779296875, 1.28662109375, 1.949462890625, 2.6123046875, 3.275146484375, 3.93798828125, 4.600830078125, 5.263671875, 5.926513671875, 6.58935546875, 7.252197265625, 7.9150390625, 8.577880859375, 9.24072265625, 9.903564453125, 10.56640625, 11.229248046875, 11.89208984375, 12.554931640625, 13.2177734375, 13.880615234375, 14.54345703125, 15.206298828125, 15.869140625, 16.531982421875, 17.19482421875, 17.857666015625, 18.5205078125, 19.183349609375, 19.84619140625, 20.509033203125, 21.171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 12.0, 10.0, 12.0, 13.0, 17.0, 19.0, 17.0, 19.0, 29.0, 28.0, 41.0, 30.0, 27.0, 38.0, 36.0, 32.0, 51.0, 46.0, 51.0, 42.0, 43.0, 43.0, 43.0, 37.0, 42.0, 31.0, 32.0, 26.0, 16.0, 11.0, 14.0, 14.0, 12.0, 10.0, 11.0, 7.0, 7.0, 4.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.390625, -13.9525146484375, -13.514404296875, -13.0762939453125, -12.63818359375, -12.2000732421875, -11.761962890625, -11.3238525390625, -10.8857421875, -10.4476318359375, -10.009521484375, -9.5714111328125, -9.13330078125, -8.6951904296875, -8.257080078125, -7.8189697265625, -7.380859375, -6.9427490234375, -6.504638671875, -6.0665283203125, -5.62841796875, -5.1903076171875, -4.752197265625, -4.3140869140625, -3.8759765625, -3.4378662109375, -2.999755859375, -2.5616455078125, -2.12353515625, -1.6854248046875, -1.247314453125, -0.8092041015625, -0.37109375, 0.0670166015625, 0.505126953125, 0.9432373046875, 1.38134765625, 1.8194580078125, 2.257568359375, 2.6956787109375, 3.1337890625, 3.5718994140625, 4.010009765625, 4.4481201171875, 4.88623046875, 5.3243408203125, 5.762451171875, 6.2005615234375, 6.638671875, 7.0767822265625, 7.514892578125, 7.9530029296875, 8.39111328125, 8.8292236328125, 9.267333984375, 9.7054443359375, 10.1435546875, 10.5816650390625, 11.019775390625, 11.4578857421875, 11.89599609375, 12.3341064453125, 12.772216796875, 13.2103271484375, 13.6484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 19.0, 21.0, 33.0, 65.0, 116.0, 303.0, 723.0, 2587.0, 13211.0, 136857.0, 778676.0, 101832.0, 10671.0, 2196.0, 701.0, 264.0, 120.0, 58.0, 27.0, 21.0, 15.0, 12.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.515625, -21.88037109375, -21.2451171875, -20.60986328125, -19.974609375, -19.33935546875, -18.7041015625, -18.06884765625, -17.43359375, -16.79833984375, -16.1630859375, -15.52783203125, -14.892578125, -14.25732421875, -13.6220703125, -12.98681640625, -12.3515625, -11.71630859375, -11.0810546875, -10.44580078125, -9.810546875, -9.17529296875, -8.5400390625, -7.90478515625, -7.26953125, -6.63427734375, -5.9990234375, -5.36376953125, -4.728515625, -4.09326171875, -3.4580078125, -2.82275390625, -2.1875, -1.55224609375, -0.9169921875, -0.28173828125, 0.353515625, 0.98876953125, 1.6240234375, 2.25927734375, 2.89453125, 3.52978515625, 4.1650390625, 4.80029296875, 5.435546875, 6.07080078125, 6.7060546875, 7.34130859375, 7.9765625, 8.61181640625, 9.2470703125, 9.88232421875, 10.517578125, 11.15283203125, 11.7880859375, 12.42333984375, 13.05859375, 13.69384765625, 14.3291015625, 14.96435546875, 15.599609375, 16.23486328125, 16.8701171875, 17.50537109375, 18.140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 7.0, 16.0, 24.0, 23.0, 40.0, 45.0, 70.0, 106.0, 169.0, 193.0, 87.0, 53.0, 43.0, 31.0, 27.0, 12.0, 14.0, 11.0, 6.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.003566741943359375, -0.003490731120109558, -0.003414720296859741, -0.0033387094736099243, -0.0032626986503601074, -0.0031866878271102905, -0.0031106770038604736, -0.0030346661806106567, -0.00295865535736084, -0.002882644534111023, -0.002806633710861206, -0.002730622887611389, -0.0026546120643615723, -0.0025786012411117554, -0.0025025904178619385, -0.0024265795946121216, -0.0023505687713623047, -0.002274557948112488, -0.002198547124862671, -0.002122536301612854, -0.002046525478363037, -0.00197051465511322, -0.0018945038318634033, -0.0018184930086135864, -0.0017424821853637695, -0.0016664713621139526, -0.0015904605388641357, -0.0015144497156143188, -0.001438438892364502, -0.001362428069114685, -0.0012864172458648682, -0.0012104064226150513, -0.0011343955993652344, -0.0010583847761154175, -0.0009823739528656006, -0.0009063631296157837, -0.0008303523063659668, -0.0007543414831161499, -0.000678330659866333, -0.0006023198366165161, -0.0005263090133666992, -0.0004502981901168823, -0.00037428736686706543, -0.00029827654361724854, -0.00022226572036743164, -0.00014625489711761475, -7.024407386779785e-05, 5.766749382019043e-06, 8.177757263183594e-05, 0.00015778839588165283, 0.00023379921913146973, 0.0003098100423812866, 0.0003858208656311035, 0.0004618316888809204, 0.0005378425121307373, 0.0006138533353805542, 0.0006898641586303711, 0.000765874981880188, 0.0008418858051300049, 0.0009178966283798218, 0.0009939074516296387, 0.0010699182748794556, 0.0011459290981292725, 0.0012219399213790894, 0.0012979507446289062]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 8.0, 10.0, 17.0, 50.0, 71.0, 110.0, 174.0, 388.0, 1011.0, 4323.0, 65754.0, 903294.0, 67108.0, 4298.0, 973.0, 412.0, 208.0, 135.0, 83.0, 43.0, 31.0, 16.0, 11.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.40625, -34.436279296875, -33.46630859375, -32.496337890625, -31.5263671875, -30.556396484375, -29.58642578125, -28.616455078125, -27.646484375, -26.676513671875, -25.70654296875, -24.736572265625, -23.7666015625, -22.796630859375, -21.82666015625, -20.856689453125, -19.88671875, -18.916748046875, -17.94677734375, -16.976806640625, -16.0068359375, -15.036865234375, -14.06689453125, -13.096923828125, -12.126953125, -11.156982421875, -10.18701171875, -9.217041015625, -8.2470703125, -7.277099609375, -6.30712890625, -5.337158203125, -4.3671875, -3.397216796875, -2.42724609375, -1.457275390625, -0.4873046875, 0.482666015625, 1.45263671875, 2.422607421875, 3.392578125, 4.362548828125, 5.33251953125, 6.302490234375, 7.2724609375, 8.242431640625, 9.21240234375, 10.182373046875, 11.15234375, 12.122314453125, 13.09228515625, 14.062255859375, 15.0322265625, 16.002197265625, 16.97216796875, 17.942138671875, 18.912109375, 19.882080078125, 20.85205078125, 21.822021484375, 22.7919921875, 23.761962890625, 24.73193359375, 25.701904296875, 26.671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 11.0, 11.0, 27.0, 32.0, 37.0, 52.0, 75.0, 104.0, 99.0, 150.0, 105.0, 74.0, 50.0, 43.0, 25.0, 26.0, 20.0, 16.0, 14.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.8515625, -13.4691162109375, -13.086669921875, -12.7042236328125, -12.32177734375, -11.9393310546875, -11.556884765625, -11.1744384765625, -10.7919921875, -10.4095458984375, -10.027099609375, -9.6446533203125, -9.26220703125, -8.8797607421875, -8.497314453125, -8.1148681640625, -7.732421875, -7.3499755859375, -6.967529296875, -6.5850830078125, -6.20263671875, -5.8201904296875, -5.437744140625, -5.0552978515625, -4.6728515625, -4.2904052734375, -3.907958984375, -3.5255126953125, -3.14306640625, -2.7606201171875, -2.378173828125, -1.9957275390625, -1.61328125, -1.2308349609375, -0.848388671875, -0.4659423828125, -0.08349609375, 0.2989501953125, 0.681396484375, 1.0638427734375, 1.4462890625, 1.8287353515625, 2.211181640625, 2.5936279296875, 2.97607421875, 3.3585205078125, 3.740966796875, 4.1234130859375, 4.505859375, 4.8883056640625, 5.270751953125, 5.6531982421875, 6.03564453125, 6.4180908203125, 6.800537109375, 7.1829833984375, 7.5654296875, 7.9478759765625, 8.330322265625, 8.7127685546875, 9.09521484375, 9.4776611328125, 9.860107421875, 10.2425537109375, 10.625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 14.0, 29.0, 98.0, 229.0, 328.0, 194.0, 85.0, 24.0, 9.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-400.1737365722656, -389.239990234375, -378.3062744140625, -367.3725280761719, -356.4388122558594, -345.50506591796875, -334.57135009765625, -323.6376037597656, -312.703857421875, -301.7701110839844, -290.8363952636719, -279.90264892578125, -268.96893310546875, -258.0351867675781, -247.10145568847656, -236.167724609375, -225.2340087890625, -214.30027770996094, -203.36654663085938, -192.43280029296875, -181.49908447265625, -170.56533813476562, -159.63160705566406, -148.6978759765625, -137.76414489746094, -126.83041381835938, -115.89668273925781, -104.96294403076172, -94.02921295166016, -83.0954818725586, -72.1617431640625, -61.22801208496094, -50.2943115234375, -39.36058044433594, -28.42684555053711, -17.49311065673828, -6.559379577636719, 4.374351501464844, 15.308090209960938, 26.2418212890625, 37.17555236816406, 48.109283447265625, 59.04301834106445, 69.97675323486328, 80.91048431396484, 91.8442153930664, 102.7779541015625, 113.71168518066406, 124.64541625976562, 135.5791473388672, 146.51287841796875, 157.44662475585938, 168.38034057617188, 179.3140869140625, 190.24781799316406, 201.18154907226562, 212.1152801513672, 223.04901123046875, 233.9827423095703, 244.91647338867188, 255.8502197265625, 266.783935546875, 277.7176818847656, 288.65142822265625, 299.58514404296875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 3.0, 8.0, 9.0, 13.0, 13.0, 12.0, 21.0, 20.0, 23.0, 21.0, 33.0, 36.0, 34.0, 34.0, 44.0, 34.0, 30.0, 30.0, 31.0, 51.0, 44.0, 42.0, 38.0, 52.0, 31.0, 39.0, 28.0, 31.0, 29.0, 28.0, 13.0, 26.0, 15.0, 16.0, 17.0, 15.0, 7.0, 3.0, 6.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-79.36653137207031, -77.12184143066406, -74.87715148925781, -72.63246154785156, -70.38777160644531, -68.14308166503906, -65.89839172363281, -63.65370178222656, -61.40901184082031, -59.16432189941406, -56.91963195800781, -54.67494201660156, -52.43025207519531, -50.18556213378906, -47.94087219238281, -45.69618225097656, -43.45149230957031, -41.20680236816406, -38.96211242675781, -36.71742248535156, -34.47273254394531, -32.22804260253906, -29.983352661132812, -27.738662719726562, -25.493972778320312, -23.249282836914062, -21.004592895507812, -18.759902954101562, -16.515213012695312, -14.270523071289062, -12.025833129882812, -9.781143188476562, -7.536445617675781, -5.291755676269531, -3.0470657348632812, -0.8023757934570312, 1.4423141479492188, 3.6870040893554688, 5.931694030761719, 8.176383972167969, 10.421073913574219, 12.665763854980469, 14.910453796386719, 17.15514373779297, 19.39983367919922, 21.64452362060547, 23.88921356201172, 26.13390350341797, 28.37859344482422, 30.62328338623047, 32.86797332763672, 35.11266326904297, 37.35735321044922, 39.60204315185547, 41.84673309326172, 44.09142303466797, 46.33611297607422, 48.58080291748047, 50.82549285888672, 53.07018280029297, 55.31487274169922, 57.55956268310547, 59.80425262451172, 62.04894256591797, 64.29363250732422]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0, 10.0, 6.0, 6.0, 16.0, 21.0, 42.0, 36.0, 61.0, 86.0, 130.0, 213.0, 301.0, 422.0, 698.0, 1246.0, 2079.0, 3990.0, 8053.0, 18524.0, 49165.0, 167850.0, 1205398.0, 2424258.0, 211326.0, 58315.0, 21611.0, 9487.0, 4728.0, 2434.0, 1406.0, 822.0, 524.0, 334.0, 190.0, 163.0, 107.0, 51.0, 63.0, 35.0, 23.0, 16.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-20.328125, -19.7799072265625, -19.231689453125, -18.6834716796875, -18.13525390625, -17.5870361328125, -17.038818359375, -16.4906005859375, -15.9423828125, -15.3941650390625, -14.845947265625, -14.2977294921875, -13.74951171875, -13.2012939453125, -12.653076171875, -12.1048583984375, -11.556640625, -11.0084228515625, -10.460205078125, -9.9119873046875, -9.36376953125, -8.8155517578125, -8.267333984375, -7.7191162109375, -7.1708984375, -6.6226806640625, -6.074462890625, -5.5262451171875, -4.97802734375, -4.4298095703125, -3.881591796875, -3.3333740234375, -2.78515625, -2.2369384765625, -1.688720703125, -1.1405029296875, -0.59228515625, -0.0440673828125, 0.504150390625, 1.0523681640625, 1.6005859375, 2.1488037109375, 2.697021484375, 3.2452392578125, 3.79345703125, 4.3416748046875, 4.889892578125, 5.4381103515625, 5.986328125, 6.5345458984375, 7.082763671875, 7.6309814453125, 8.17919921875, 8.7274169921875, 9.275634765625, 9.8238525390625, 10.3720703125, 10.9202880859375, 11.468505859375, 12.0167236328125, 12.56494140625, 13.1131591796875, 13.661376953125, 14.2095947265625, 14.7578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 11.0, 4.0, 11.0, 21.0, 24.0, 21.0, 17.0, 28.0, 33.0, 37.0, 52.0, 47.0, 36.0, 67.0, 49.0, 64.0, 52.0, 43.0, 42.0, 39.0, 36.0, 36.0, 36.0, 36.0, 34.0, 28.0, 19.0, 15.0, 10.0, 14.0, 8.0, 5.0, 6.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.615234375, -3.493499755859375, -3.37176513671875, -3.250030517578125, -3.1282958984375, -3.006561279296875, -2.88482666015625, -2.763092041015625, -2.641357421875, -2.519622802734375, -2.39788818359375, -2.276153564453125, -2.1544189453125, -2.032684326171875, -1.91094970703125, -1.789215087890625, -1.66748046875, -1.545745849609375, -1.42401123046875, -1.302276611328125, -1.1805419921875, -1.058807373046875, -0.93707275390625, -0.815338134765625, -0.693603515625, -0.571868896484375, -0.45013427734375, -0.328399658203125, -0.2066650390625, -0.084930419921875, 0.03680419921875, 0.158538818359375, 0.2802734375, 0.402008056640625, 0.52374267578125, 0.645477294921875, 0.7672119140625, 0.888946533203125, 1.01068115234375, 1.132415771484375, 1.254150390625, 1.375885009765625, 1.49761962890625, 1.619354248046875, 1.7410888671875, 1.862823486328125, 1.98455810546875, 2.106292724609375, 2.22802734375, 2.349761962890625, 2.47149658203125, 2.593231201171875, 2.7149658203125, 2.836700439453125, 2.95843505859375, 3.080169677734375, 3.201904296875, 3.323638916015625, 3.44537353515625, 3.567108154296875, 3.6888427734375, 3.810577392578125, 3.93231201171875, 4.054046630859375, 4.17578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 8.0, 4.0, 10.0, 11.0, 17.0, 24.0, 26.0, 61.0, 65.0, 121.0, 190.0, 320.0, 510.0, 818.0, 1573.0, 2546.0, 5094.0, 10242.0, 23275.0, 60678.0, 193231.0, 967851.0, 2432273.0, 339201.0, 93972.0, 33561.0, 14069.0, 6648.0, 3447.0, 1820.0, 991.0, 634.0, 370.0, 203.0, 151.0, 106.0, 59.0, 46.0, 21.0, 18.0, 8.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.345703125, -12.91796875, -12.490234375, -12.0625, -11.634765625, -11.20703125, -10.779296875, -10.3515625, -9.923828125, -9.49609375, -9.068359375, -8.640625, -8.212890625, -7.78515625, -7.357421875, -6.9296875, -6.501953125, -6.07421875, -5.646484375, -5.21875, -4.791015625, -4.36328125, -3.935546875, -3.5078125, -3.080078125, -2.65234375, -2.224609375, -1.796875, -1.369140625, -0.94140625, -0.513671875, -0.0859375, 0.341796875, 0.76953125, 1.197265625, 1.625, 2.052734375, 2.48046875, 2.908203125, 3.3359375, 3.763671875, 4.19140625, 4.619140625, 5.046875, 5.474609375, 5.90234375, 6.330078125, 6.7578125, 7.185546875, 7.61328125, 8.041015625, 8.46875, 8.896484375, 9.32421875, 9.751953125, 10.1796875, 10.607421875, 11.03515625, 11.462890625, 11.890625, 12.318359375, 12.74609375, 13.173828125, 13.6015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 5.0, 5.0, 5.0, 6.0, 12.0, 11.0, 13.0, 16.0, 40.0, 39.0, 64.0, 91.0, 149.0, 203.0, 328.0, 668.0, 1076.0, 464.0, 303.0, 162.0, 118.0, 69.0, 57.0, 47.0, 20.0, 25.0, 16.0, 15.0, 6.0, 5.0, 5.0, 2.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.75225830078125, -8.4888916015625, -8.22552490234375, -7.962158203125, -7.69879150390625, -7.4354248046875, -7.17205810546875, -6.90869140625, -6.64532470703125, -6.3819580078125, -6.11859130859375, -5.855224609375, -5.59185791015625, -5.3284912109375, -5.06512451171875, -4.8017578125, -4.53839111328125, -4.2750244140625, -4.01165771484375, -3.748291015625, -3.48492431640625, -3.2215576171875, -2.95819091796875, -2.69482421875, -2.43145751953125, -2.1680908203125, -1.90472412109375, -1.641357421875, -1.37799072265625, -1.1146240234375, -0.85125732421875, -0.587890625, -0.32452392578125, -0.0611572265625, 0.20220947265625, 0.465576171875, 0.72894287109375, 0.9923095703125, 1.25567626953125, 1.51904296875, 1.78240966796875, 2.0457763671875, 2.30914306640625, 2.572509765625, 2.83587646484375, 3.0992431640625, 3.36260986328125, 3.6259765625, 3.88934326171875, 4.1527099609375, 4.41607666015625, 4.679443359375, 4.94281005859375, 5.2061767578125, 5.46954345703125, 5.73291015625, 5.99627685546875, 6.2596435546875, 6.52301025390625, 6.786376953125, 7.04974365234375, 7.3131103515625, 7.57647705078125, 7.83984375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 27.0, 39.0, 116.0, 219.0, 246.0, 190.0, 90.0, 49.0, 15.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.73622131347656, -135.66502380371094, -131.5938262939453, -127.52262878417969, -123.45142364501953, -119.3802261352539, -115.30902862548828, -111.23783111572266, -107.1666259765625, -103.09542846679688, -99.02423095703125, -94.95303344726562, -90.88182830810547, -86.81063079833984, -82.73943328857422, -78.6682357788086, -74.59703826904297, -70.52584075927734, -66.45464324951172, -62.38344192504883, -58.31224060058594, -54.24104309082031, -50.16984558105469, -46.09864807128906, -42.02744674682617, -37.95624923706055, -33.885047912597656, -29.81385040283203, -25.742650985717773, -21.671451568603516, -17.60025405883789, -13.529054641723633, -9.457855224609375, -5.386656284332275, -1.3154573440551758, 2.7557411193847656, 6.826940536499023, 10.898139953613281, 14.969337463378906, 19.040536880493164, 23.111736297607422, 27.18293571472168, 31.254135131835938, 35.32533264160156, 39.39653015136719, 43.46773147583008, 47.5389289855957, 51.610130310058594, 55.68132781982422, 59.752525329589844, 63.823726654052734, 67.89492797851562, 71.96612548828125, 76.03732299804688, 80.1085205078125, 84.17971801757812, 88.25091552734375, 92.32211303710938, 96.393310546875, 100.46450805664062, 104.53571319580078, 108.6069107055664, 112.67810821533203, 116.74930572509766, 120.82051086425781]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 7.0, 8.0, 12.0, 19.0, 15.0, 19.0, 21.0, 24.0, 33.0, 40.0, 35.0, 40.0, 51.0, 46.0, 55.0, 58.0, 33.0, 32.0, 44.0, 51.0, 31.0, 40.0, 45.0, 42.0, 28.0, 26.0, 17.0, 20.0, 19.0, 17.0, 18.0, 12.0, 10.0, 5.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.3070068359375, -29.253692626953125, -28.200380325317383, -27.14706802368164, -26.093753814697266, -25.04043960571289, -23.98712730407715, -22.933815002441406, -21.88050079345703, -20.827186584472656, -19.773874282836914, -18.720561981201172, -17.667247772216797, -16.613933563232422, -15.56062126159668, -14.507308006286621, -13.453994750976562, -12.400681495666504, -11.347368240356445, -10.294054985046387, -9.240741729736328, -8.18742847442627, -7.134115219116211, -6.080801963806152, -5.027488708496094, -3.974175453186035, -2.9208621978759766, -1.867548942565918, -0.8142356872558594, 0.23907756805419922, 1.2923908233642578, 2.3457040786743164, 3.3990211486816406, 4.452334403991699, 5.505647659301758, 6.558960914611816, 7.612274169921875, 8.665587425231934, 9.718900680541992, 10.77221393585205, 11.82552719116211, 12.878840446472168, 13.932153701782227, 14.985466957092285, 16.038780212402344, 17.09209442138672, 18.14540672302246, 19.198719024658203, 20.252033233642578, 21.305347442626953, 22.358659744262695, 23.411972045898438, 24.465286254882812, 25.518600463867188, 26.57191276550293, 27.625225067138672, 28.678539276123047, 29.731853485107422, 30.785165786743164, 31.838478088378906, 32.89179229736328, 33.945106506347656, 34.99842071533203, 36.05173110961914, 37.105045318603516]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 8.0, 17.0, 22.0, 26.0, 39.0, 70.0, 105.0, 163.0, 297.0, 467.0, 884.0, 1658.0, 3677.0, 8158.0, 19506.0, 49647.0, 131970.0, 297608.0, 305903.0, 138566.0, 52563.0, 20719.0, 8687.0, 3852.0, 1759.0, 900.0, 475.0, 305.0, 167.0, 109.0, 87.0, 48.0, 35.0, 25.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.953125, -17.392578125, -16.83203125, -16.271484375, -15.7109375, -15.150390625, -14.58984375, -14.029296875, -13.46875, -12.908203125, -12.34765625, -11.787109375, -11.2265625, -10.666015625, -10.10546875, -9.544921875, -8.984375, -8.423828125, -7.86328125, -7.302734375, -6.7421875, -6.181640625, -5.62109375, -5.060546875, -4.5, -3.939453125, -3.37890625, -2.818359375, -2.2578125, -1.697265625, -1.13671875, -0.576171875, -0.015625, 0.544921875, 1.10546875, 1.666015625, 2.2265625, 2.787109375, 3.34765625, 3.908203125, 4.46875, 5.029296875, 5.58984375, 6.150390625, 6.7109375, 7.271484375, 7.83203125, 8.392578125, 8.953125, 9.513671875, 10.07421875, 10.634765625, 11.1953125, 11.755859375, 12.31640625, 12.876953125, 13.4375, 13.998046875, 14.55859375, 15.119140625, 15.6796875, 16.240234375, 16.80078125, 17.361328125, 17.921875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 9.0, 15.0, 10.0, 18.0, 20.0, 16.0, 28.0, 35.0, 40.0, 56.0, 34.0, 52.0, 54.0, 49.0, 53.0, 50.0, 40.0, 47.0, 44.0, 43.0, 40.0, 41.0, 39.0, 22.0, 22.0, 16.0, 24.0, 16.0, 16.0, 9.0, 7.0, 8.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.623046875, -3.495330810546875, -3.36761474609375, -3.239898681640625, -3.1121826171875, -2.984466552734375, -2.85675048828125, -2.729034423828125, -2.601318359375, -2.473602294921875, -2.34588623046875, -2.218170166015625, -2.0904541015625, -1.962738037109375, -1.83502197265625, -1.707305908203125, -1.57958984375, -1.451873779296875, -1.32415771484375, -1.196441650390625, -1.0687255859375, -0.941009521484375, -0.81329345703125, -0.685577392578125, -0.557861328125, -0.430145263671875, -0.30242919921875, -0.174713134765625, -0.0469970703125, 0.080718994140625, 0.20843505859375, 0.336151123046875, 0.4638671875, 0.591583251953125, 0.71929931640625, 0.847015380859375, 0.9747314453125, 1.102447509765625, 1.23016357421875, 1.357879638671875, 1.485595703125, 1.613311767578125, 1.74102783203125, 1.868743896484375, 1.9964599609375, 2.124176025390625, 2.25189208984375, 2.379608154296875, 2.50732421875, 2.635040283203125, 2.76275634765625, 2.890472412109375, 3.0181884765625, 3.145904541015625, 3.27362060546875, 3.401336669921875, 3.529052734375, 3.656768798828125, 3.78448486328125, 3.912200927734375, 4.0399169921875, 4.167633056640625, 4.29534912109375, 4.423065185546875, 4.55078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 6.0, 10.0, 8.0, 12.0, 25.0, 22.0, 31.0, 39.0, 60.0, 91.0, 98.0, 126.0, 158.0, 224.0, 321.0, 448.0, 586.0, 1042.0, 2130.0, 7351.0, 45317.0, 347697.0, 540621.0, 83548.0, 11938.0, 2919.0, 1215.0, 702.0, 472.0, 314.0, 241.0, 186.0, 143.0, 100.0, 77.0, 70.0, 40.0, 32.0, 33.0, 23.0, 18.0, 8.0, 11.0, 11.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-27.0, -26.07373046875, -25.1474609375, -24.22119140625, -23.294921875, -22.36865234375, -21.4423828125, -20.51611328125, -19.58984375, -18.66357421875, -17.7373046875, -16.81103515625, -15.884765625, -14.95849609375, -14.0322265625, -13.10595703125, -12.1796875, -11.25341796875, -10.3271484375, -9.40087890625, -8.474609375, -7.54833984375, -6.6220703125, -5.69580078125, -4.76953125, -3.84326171875, -2.9169921875, -1.99072265625, -1.064453125, -0.13818359375, 0.7880859375, 1.71435546875, 2.640625, 3.56689453125, 4.4931640625, 5.41943359375, 6.345703125, 7.27197265625, 8.1982421875, 9.12451171875, 10.05078125, 10.97705078125, 11.9033203125, 12.82958984375, 13.755859375, 14.68212890625, 15.6083984375, 16.53466796875, 17.4609375, 18.38720703125, 19.3134765625, 20.23974609375, 21.166015625, 22.09228515625, 23.0185546875, 23.94482421875, 24.87109375, 25.79736328125, 26.7236328125, 27.64990234375, 28.576171875, 29.50244140625, 30.4287109375, 31.35498046875, 32.28125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 23.0, 9.0, 22.0, 27.0, 27.0, 35.0, 46.0, 38.0, 42.0, 50.0, 66.0, 58.0, 53.0, 56.0, 47.0, 67.0, 64.0, 45.0, 36.0, 31.0, 33.0, 28.0, 24.0, 17.0, 9.0, 12.0, 10.0, 3.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.75, -25.01025390625, -24.2705078125, -23.53076171875, -22.791015625, -22.05126953125, -21.3115234375, -20.57177734375, -19.83203125, -19.09228515625, -18.3525390625, -17.61279296875, -16.873046875, -16.13330078125, -15.3935546875, -14.65380859375, -13.9140625, -13.17431640625, -12.4345703125, -11.69482421875, -10.955078125, -10.21533203125, -9.4755859375, -8.73583984375, -7.99609375, -7.25634765625, -6.5166015625, -5.77685546875, -5.037109375, -4.29736328125, -3.5576171875, -2.81787109375, -2.078125, -1.33837890625, -0.5986328125, 0.14111328125, 0.880859375, 1.62060546875, 2.3603515625, 3.10009765625, 3.83984375, 4.57958984375, 5.3193359375, 6.05908203125, 6.798828125, 7.53857421875, 8.2783203125, 9.01806640625, 9.7578125, 10.49755859375, 11.2373046875, 11.97705078125, 12.716796875, 13.45654296875, 14.1962890625, 14.93603515625, 15.67578125, 16.41552734375, 17.1552734375, 17.89501953125, 18.634765625, 19.37451171875, 20.1142578125, 20.85400390625, 21.59375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 12.0, 14.0, 26.0, 46.0, 59.0, 90.0, 128.0, 261.0, 439.0, 850.0, 1679.0, 3776.0, 10965.0, 38648.0, 163986.0, 467383.0, 267621.0, 65540.0, 16848.0, 5444.0, 2209.0, 1117.0, 558.0, 321.0, 190.0, 121.0, 74.0, 43.0, 27.0, 25.0, 7.0, 12.0, 13.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.140625, -9.8564453125, -9.572265625, -9.2880859375, -9.00390625, -8.7197265625, -8.435546875, -8.1513671875, -7.8671875, -7.5830078125, -7.298828125, -7.0146484375, -6.73046875, -6.4462890625, -6.162109375, -5.8779296875, -5.59375, -5.3095703125, -5.025390625, -4.7412109375, -4.45703125, -4.1728515625, -3.888671875, -3.6044921875, -3.3203125, -3.0361328125, -2.751953125, -2.4677734375, -2.18359375, -1.8994140625, -1.615234375, -1.3310546875, -1.046875, -0.7626953125, -0.478515625, -0.1943359375, 0.08984375, 0.3740234375, 0.658203125, 0.9423828125, 1.2265625, 1.5107421875, 1.794921875, 2.0791015625, 2.36328125, 2.6474609375, 2.931640625, 3.2158203125, 3.5, 3.7841796875, 4.068359375, 4.3525390625, 4.63671875, 4.9208984375, 5.205078125, 5.4892578125, 5.7734375, 6.0576171875, 6.341796875, 6.6259765625, 6.91015625, 7.1943359375, 7.478515625, 7.7626953125, 8.046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 6.0, 13.0, 19.0, 26.0, 29.0, 40.0, 71.0, 66.0, 91.0, 104.0, 108.0, 93.0, 83.0, 56.0, 59.0, 31.0, 31.0, 25.0, 14.0, 10.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002105712890625, -0.002047628164291382, -0.0019895434379577637, -0.0019314587116241455, -0.0018733739852905273, -0.0018152892589569092, -0.001757204532623291, -0.0016991198062896729, -0.0016410350799560547, -0.0015829503536224365, -0.0015248656272888184, -0.0014667809009552002, -0.001408696174621582, -0.0013506114482879639, -0.0012925267219543457, -0.0012344419956207275, -0.0011763572692871094, -0.0011182725429534912, -0.001060187816619873, -0.0010021030902862549, -0.0009440183639526367, -0.0008859336376190186, -0.0008278489112854004, -0.0007697641849517822, -0.0007116794586181641, -0.0006535947322845459, -0.0005955100059509277, -0.0005374252796173096, -0.0004793405532836914, -0.00042125582695007324, -0.0003631711006164551, -0.0003050863742828369, -0.00024700164794921875, -0.00018891692161560059, -0.00013083219528198242, -7.274746894836426e-05, -1.4662742614746094e-05, 4.342198371887207e-05, 0.00010150671005249023, 0.0001595914363861084, 0.00021767616271972656, 0.0002757608890533447, 0.0003338456153869629, 0.00039193034172058105, 0.0004500150680541992, 0.0005080997943878174, 0.0005661845207214355, 0.0006242692470550537, 0.0006823539733886719, 0.00074043869972229, 0.0007985234260559082, 0.0008566081523895264, 0.0009146928787231445, 0.0009727776050567627, 0.0010308623313903809, 0.001088947057723999, 0.0011470317840576172, 0.0012051165103912354, 0.0012632012367248535, 0.0013212859630584717, 0.0013793706893920898, 0.001437455415725708, 0.0014955401420593262, 0.0015536248683929443, 0.0016117095947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 5.0, 8.0, 5.0, 8.0, 13.0, 24.0, 27.0, 34.0, 52.0, 78.0, 110.0, 223.0, 378.0, 854.0, 2113.0, 9537.0, 125627.0, 767934.0, 127877.0, 9627.0, 2170.0, 796.0, 446.0, 234.0, 149.0, 69.0, 59.0, 25.0, 16.0, 15.0, 18.0, 9.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.359375, -16.790283203125, -16.22119140625, -15.652099609375, -15.0830078125, -14.513916015625, -13.94482421875, -13.375732421875, -12.806640625, -12.237548828125, -11.66845703125, -11.099365234375, -10.5302734375, -9.961181640625, -9.39208984375, -8.822998046875, -8.25390625, -7.684814453125, -7.11572265625, -6.546630859375, -5.9775390625, -5.408447265625, -4.83935546875, -4.270263671875, -3.701171875, -3.132080078125, -2.56298828125, -1.993896484375, -1.4248046875, -0.855712890625, -0.28662109375, 0.282470703125, 0.8515625, 1.420654296875, 1.98974609375, 2.558837890625, 3.1279296875, 3.697021484375, 4.26611328125, 4.835205078125, 5.404296875, 5.973388671875, 6.54248046875, 7.111572265625, 7.6806640625, 8.249755859375, 8.81884765625, 9.387939453125, 9.95703125, 10.526123046875, 11.09521484375, 11.664306640625, 12.2333984375, 12.802490234375, 13.37158203125, 13.940673828125, 14.509765625, 15.078857421875, 15.64794921875, 16.217041015625, 16.7861328125, 17.355224609375, 17.92431640625, 18.493408203125, 19.0625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 6.0, 11.0, 11.0, 11.0, 15.0, 29.0, 35.0, 54.0, 62.0, 91.0, 74.0, 117.0, 84.0, 82.0, 68.0, 49.0, 46.0, 33.0, 18.0, 26.0, 13.0, 9.0, 7.0, 7.0, 9.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4296875, -9.126220703125, -8.82275390625, -8.519287109375, -8.2158203125, -7.912353515625, -7.60888671875, -7.305419921875, -7.001953125, -6.698486328125, -6.39501953125, -6.091552734375, -5.7880859375, -5.484619140625, -5.18115234375, -4.877685546875, -4.57421875, -4.270751953125, -3.96728515625, -3.663818359375, -3.3603515625, -3.056884765625, -2.75341796875, -2.449951171875, -2.146484375, -1.843017578125, -1.53955078125, -1.236083984375, -0.9326171875, -0.629150390625, -0.32568359375, -0.022216796875, 0.28125, 0.584716796875, 0.88818359375, 1.191650390625, 1.4951171875, 1.798583984375, 2.10205078125, 2.405517578125, 2.708984375, 3.012451171875, 3.31591796875, 3.619384765625, 3.9228515625, 4.226318359375, 4.52978515625, 4.833251953125, 5.13671875, 5.440185546875, 5.74365234375, 6.047119140625, 6.3505859375, 6.654052734375, 6.95751953125, 7.260986328125, 7.564453125, 7.867919921875, 8.17138671875, 8.474853515625, 8.7783203125, 9.081787109375, 9.38525390625, 9.688720703125, 9.9921875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 10.0, 32.0, 42.0, 82.0, 103.0, 142.0, 161.0, 163.0, 116.0, 77.0, 34.0, 22.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-240.88356018066406, -234.98587036132812, -229.08819580078125, -223.1905059814453, -217.29281616210938, -211.3951416015625, -205.49745178222656, -199.59976196289062, -193.70208740234375, -187.8043975830078, -181.90672302246094, -176.009033203125, -170.11134338378906, -164.21365356445312, -158.31597900390625, -152.4182891845703, -146.52059936523438, -140.62290954589844, -134.72523498535156, -128.82754516601562, -122.92985534667969, -117.03217315673828, -111.13449096679688, -105.23680114746094, -99.33911895751953, -93.44143676757812, -87.54374694824219, -81.64606475830078, -75.74838256835938, -69.85069274902344, -63.95301055908203, -58.05532455444336, -52.15763854980469, -46.259952545166016, -40.362266540527344, -34.46458435058594, -28.566898345947266, -22.669212341308594, -16.771530151367188, -10.873844146728516, -4.976158142089844, 0.9215269088745117, 6.819211959838867, 12.716896057128906, 18.614582061767578, 24.51226806640625, 30.409950256347656, 36.30763626098633, 42.205322265625, 48.10300827026367, 54.000694274902344, 59.89837646484375, 65.79606628417969, 71.6937484741211, 77.5914306640625, 83.48912048339844, 89.38680267333984, 95.28448486328125, 101.18217468261719, 107.0798568725586, 112.9775390625, 118.87522888183594, 124.77291107177734, 130.67059326171875, 136.5682830810547]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 5.0, 6.0, 16.0, 8.0, 19.0, 20.0, 21.0, 33.0, 41.0, 39.0, 28.0, 34.0, 34.0, 43.0, 38.0, 48.0, 37.0, 40.0, 42.0, 49.0, 40.0, 38.0, 33.0, 37.0, 26.0, 25.0, 22.0, 26.0, 24.0, 22.0, 20.0, 16.0, 16.0, 11.0, 2.0, 6.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.13624572753906, -86.36341094970703, -83.59058380126953, -80.8177490234375, -78.04491424560547, -75.27207946777344, -72.49925231933594, -69.7264175415039, -66.95358276367188, -64.18074798583984, -61.40791702270508, -58.63508605957031, -55.86225128173828, -53.089420318603516, -50.31658935546875, -47.54375457763672, -44.77092361450195, -41.99809265136719, -39.225257873535156, -36.45242691040039, -33.67959213256836, -30.906761169433594, -28.133928298950195, -25.361095428466797, -22.5882625579834, -19.8154296875, -17.0425968170166, -14.26976490020752, -11.496932029724121, -8.724099159240723, -5.951267242431641, -3.178434371948242, -0.40560150146484375, 2.3672311305999756, 5.140063762664795, 7.912896156311035, 10.685729026794434, 13.458561897277832, 16.231393814086914, 19.004226684570312, 21.77705955505371, 24.54989242553711, 27.322725296020508, 30.095558166503906, 32.86838912963867, 35.6412239074707, 38.41405487060547, 41.1868896484375, 43.959720611572266, 46.73255157470703, 49.50538635253906, 52.27821731567383, 55.05105209350586, 57.823883056640625, 60.596717834472656, 63.36954879760742, 66.14237976074219, 68.91521453857422, 71.68804168701172, 74.46087646484375, 77.23371124267578, 80.00654602050781, 82.77937316894531, 85.55220794677734, 88.32504272460938]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 7.0, 11.0, 10.0, 24.0, 22.0, 41.0, 76.0, 132.0, 242.0, 457.0, 1119.0, 3500.0, 16445.0, 741719.0, 3407528.0, 17047.0, 3650.0, 1150.0, 509.0, 238.0, 138.0, 76.0, 35.0, 36.0, 18.0, 20.0, 7.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5625, -50.97021484375, -49.3779296875, -47.78564453125, -46.193359375, -44.60107421875, -43.0087890625, -41.41650390625, -39.82421875, -38.23193359375, -36.6396484375, -35.04736328125, -33.455078125, -31.86279296875, -30.2705078125, -28.67822265625, -27.0859375, -25.49365234375, -23.9013671875, -22.30908203125, -20.716796875, -19.12451171875, -17.5322265625, -15.93994140625, -14.34765625, -12.75537109375, -11.1630859375, -9.57080078125, -7.978515625, -6.38623046875, -4.7939453125, -3.20166015625, -1.609375, -0.01708984375, 1.5751953125, 3.16748046875, 4.759765625, 6.35205078125, 7.9443359375, 9.53662109375, 11.12890625, 12.72119140625, 14.3134765625, 15.90576171875, 17.498046875, 19.09033203125, 20.6826171875, 22.27490234375, 23.8671875, 25.45947265625, 27.0517578125, 28.64404296875, 30.236328125, 31.82861328125, 33.4208984375, 35.01318359375, 36.60546875, 38.19775390625, 39.7900390625, 41.38232421875, 42.974609375, 44.56689453125, 46.1591796875, 47.75146484375, 49.34375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 12.0, 12.0, 18.0, 23.0, 21.0, 22.0, 29.0, 35.0, 34.0, 46.0, 42.0, 53.0, 41.0, 60.0, 51.0, 42.0, 44.0, 33.0, 40.0, 48.0, 38.0, 39.0, 35.0, 34.0, 27.0, 27.0, 14.0, 12.0, 12.0, 9.0, 11.0, 6.0, 4.0, 4.0, 2.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91796875, -3.783935546875, -3.64990234375, -3.515869140625, -3.3818359375, -3.247802734375, -3.11376953125, -2.979736328125, -2.845703125, -2.711669921875, -2.57763671875, -2.443603515625, -2.3095703125, -2.175537109375, -2.04150390625, -1.907470703125, -1.7734375, -1.639404296875, -1.50537109375, -1.371337890625, -1.2373046875, -1.103271484375, -0.96923828125, -0.835205078125, -0.701171875, -0.567138671875, -0.43310546875, -0.299072265625, -0.1650390625, -0.031005859375, 0.10302734375, 0.237060546875, 0.37109375, 0.505126953125, 0.63916015625, 0.773193359375, 0.9072265625, 1.041259765625, 1.17529296875, 1.309326171875, 1.443359375, 1.577392578125, 1.71142578125, 1.845458984375, 1.9794921875, 2.113525390625, 2.24755859375, 2.381591796875, 2.515625, 2.649658203125, 2.78369140625, 2.917724609375, 3.0517578125, 3.185791015625, 3.31982421875, 3.453857421875, 3.587890625, 3.721923828125, 3.85595703125, 3.989990234375, 4.1240234375, 4.258056640625, 4.39208984375, 4.526123046875, 4.66015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 16.0, 12.0, 13.0, 17.0, 26.0, 34.0, 38.0, 85.0, 114.0, 161.0, 208.0, 327.0, 454.0, 746.0, 1208.0, 2242.0, 4430.0, 9498.0, 26059.0, 104286.0, 3612036.0, 352300.0, 49885.0, 15682.0, 6571.0, 3183.0, 1684.0, 986.0, 642.0, 410.0, 274.0, 181.0, 134.0, 107.0, 70.0, 42.0, 48.0, 17.0, 15.0, 7.0, 15.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.5484619140625, -13.042236328125, -12.5360107421875, -12.02978515625, -11.5235595703125, -11.017333984375, -10.5111083984375, -10.0048828125, -9.4986572265625, -8.992431640625, -8.4862060546875, -7.97998046875, -7.4737548828125, -6.967529296875, -6.4613037109375, -5.955078125, -5.4488525390625, -4.942626953125, -4.4364013671875, -3.93017578125, -3.4239501953125, -2.917724609375, -2.4114990234375, -1.9052734375, -1.3990478515625, -0.892822265625, -0.3865966796875, 0.11962890625, 0.6258544921875, 1.132080078125, 1.6383056640625, 2.14453125, 2.6507568359375, 3.156982421875, 3.6632080078125, 4.16943359375, 4.6756591796875, 5.181884765625, 5.6881103515625, 6.1943359375, 6.7005615234375, 7.206787109375, 7.7130126953125, 8.21923828125, 8.7254638671875, 9.231689453125, 9.7379150390625, 10.244140625, 10.7503662109375, 11.256591796875, 11.7628173828125, 12.26904296875, 12.7752685546875, 13.281494140625, 13.7877197265625, 14.2939453125, 14.8001708984375, 15.306396484375, 15.8126220703125, 16.31884765625, 16.8250732421875, 17.331298828125, 17.8375244140625, 18.34375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 13.0, 12.0, 15.0, 30.0, 30.0, 69.0, 130.0, 267.0, 2630.0, 468.0, 170.0, 66.0, 49.0, 29.0, 18.0, 8.0, 13.0, 10.0, 9.0, 5.0, 3.0, 1.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.156341552734375, -4.04315185546875, -3.929962158203125, -3.8167724609375, -3.703582763671875, -3.59039306640625, -3.477203369140625, -3.364013671875, -3.250823974609375, -3.13763427734375, -3.024444580078125, -2.9112548828125, -2.798065185546875, -2.68487548828125, -2.571685791015625, -2.45849609375, -2.345306396484375, -2.23211669921875, -2.118927001953125, -2.0057373046875, -1.892547607421875, -1.77935791015625, -1.666168212890625, -1.552978515625, -1.439788818359375, -1.32659912109375, -1.213409423828125, -1.1002197265625, -0.987030029296875, -0.87384033203125, -0.760650634765625, -0.6474609375, -0.534271240234375, -0.42108154296875, -0.307891845703125, -0.1947021484375, -0.081512451171875, 0.03167724609375, 0.144866943359375, 0.258056640625, 0.371246337890625, 0.48443603515625, 0.597625732421875, 0.7108154296875, 0.824005126953125, 0.93719482421875, 1.050384521484375, 1.16357421875, 1.276763916015625, 1.38995361328125, 1.503143310546875, 1.6163330078125, 1.729522705078125, 1.84271240234375, 1.955902099609375, 2.069091796875, 2.182281494140625, 2.29547119140625, 2.408660888671875, 2.5218505859375, 2.635040283203125, 2.74822998046875, 2.861419677734375, 2.974609375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 9.0, 11.0, 11.0, 19.0, 16.0, 28.0, 28.0, 31.0, 50.0, 67.0, 72.0, 82.0, 72.0, 73.0, 79.0, 80.0, 65.0, 50.0, 39.0, 30.0, 28.0, 21.0, 13.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.861871719360352, -11.460796356201172, -11.059720993041992, -10.658645629882812, -10.257570266723633, -9.856494903564453, -9.45542049407959, -9.05434513092041, -8.65326976776123, -8.25219440460205, -7.851119041442871, -7.45004415512085, -7.04896879196167, -6.64789342880249, -6.246818542480469, -5.845743179321289, -5.444667816162109, -5.04359245300293, -4.64251708984375, -4.2414422035217285, -3.840366840362549, -3.439291477203369, -3.0382163524627686, -2.637141227722168, -2.2360658645629883, -1.8349906206130981, -1.433915376663208, -1.0328401327133179, -0.6317648887634277, -0.23068952560424805, 0.17038559913635254, 0.5714607238769531, 0.9725360870361328, 1.373611330986023, 1.774686574935913, 2.1757616996765137, 2.5768370628356934, 2.977912425994873, 3.3789875507354736, 3.780062675476074, 4.181138038635254, 4.582213401794434, 4.983288764953613, 5.384363651275635, 5.7854390144348145, 6.186514377593994, 6.587589263916016, 6.988664627075195, 7.389739990234375, 7.790815353393555, 8.191890716552734, 8.592966079711914, 8.994041442871094, 9.395116806030273, 9.796191215515137, 10.197266578674316, 10.598341941833496, 10.999417304992676, 11.400492668151855, 11.801568031311035, 12.202642440795898, 12.603717803955078, 13.004793167114258, 13.405868530273438, 13.806943893432617]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 8.0, 4.0, 5.0, 5.0, 9.0, 10.0, 7.0, 16.0, 16.0, 29.0, 27.0, 24.0, 34.0, 39.0, 37.0, 39.0, 31.0, 46.0, 48.0, 37.0, 56.0, 45.0, 53.0, 52.0, 54.0, 41.0, 39.0, 32.0, 24.0, 31.0, 26.0, 10.0, 10.0, 8.0, 15.0, 9.0, 6.0, 4.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.728302955627441, -8.423388481140137, -8.118474006652832, -7.813559055328369, -7.5086445808410645, -7.20373010635376, -6.898815155029297, -6.593900680541992, -6.2889862060546875, -5.984071731567383, -5.679157257080078, -5.374242305755615, -5.0693278312683105, -4.764413356781006, -4.459498405456543, -4.154583930969238, -3.8496694564819336, -3.544754981994629, -3.239840269088745, -2.9349255561828613, -2.6300110816955566, -2.325096607208252, -2.020181894302368, -1.7152671813964844, -1.4103527069091797, -1.1054381132125854, -0.8005235195159912, -0.495608925819397, -0.19069433212280273, 0.1142202615737915, 0.41913485527038574, 0.7240495681762695, 1.0289630889892578, 1.333877682685852, 1.6387922763824463, 1.9437068700790405, 2.2486214637756348, 2.5535359382629395, 2.8584506511688232, 3.163365364074707, 3.4682798385620117, 3.7731943130493164, 4.078108787536621, 4.383023738861084, 4.687938213348389, 4.992852687835693, 5.297767639160156, 5.602682113647461, 5.907596588134766, 6.21251106262207, 6.517425537109375, 6.822340488433838, 7.127254962921143, 7.432169437408447, 7.73708438873291, 8.041998863220215, 8.34691333770752, 8.651827812194824, 8.956742286682129, 9.261656761169434, 9.566572189331055, 9.87148666381836, 10.176401138305664, 10.481315612792969, 10.786230087280273]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 13.0, 12.0, 18.0, 32.0, 39.0, 58.0, 103.0, 136.0, 213.0, 411.0, 654.0, 1123.0, 2011.0, 4014.0, 7756.0, 16571.0, 35815.0, 77533.0, 153954.0, 239985.0, 231307.0, 142797.0, 70560.0, 32981.0, 15201.0, 7037.0, 3635.0, 1935.0, 1070.0, 608.0, 316.0, 229.0, 139.0, 89.0, 66.0, 45.0, 23.0, 17.0, 12.0, 7.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3551025390625, -10.975830078125, -10.5965576171875, -10.21728515625, -9.8380126953125, -9.458740234375, -9.0794677734375, -8.7001953125, -8.3209228515625, -7.941650390625, -7.5623779296875, -7.18310546875, -6.8038330078125, -6.424560546875, -6.0452880859375, -5.666015625, -5.2867431640625, -4.907470703125, -4.5281982421875, -4.14892578125, -3.7696533203125, -3.390380859375, -3.0111083984375, -2.6318359375, -2.2525634765625, -1.873291015625, -1.4940185546875, -1.11474609375, -0.7354736328125, -0.356201171875, 0.0230712890625, 0.40234375, 0.7816162109375, 1.160888671875, 1.5401611328125, 1.91943359375, 2.2987060546875, 2.677978515625, 3.0572509765625, 3.4365234375, 3.8157958984375, 4.195068359375, 4.5743408203125, 4.95361328125, 5.3328857421875, 5.712158203125, 6.0914306640625, 6.470703125, 6.8499755859375, 7.229248046875, 7.6085205078125, 7.98779296875, 8.3670654296875, 8.746337890625, 9.1256103515625, 9.5048828125, 9.8841552734375, 10.263427734375, 10.6427001953125, 11.02197265625, 11.4012451171875, 11.780517578125, 12.1597900390625, 12.5390625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 9.0, 7.0, 6.0, 10.0, 14.0, 19.0, 23.0, 19.0, 26.0, 16.0, 41.0, 37.0, 41.0, 47.0, 46.0, 46.0, 44.0, 53.0, 35.0, 48.0, 52.0, 38.0, 41.0, 36.0, 41.0, 29.0, 37.0, 29.0, 28.0, 19.0, 11.0, 7.0, 10.0, 5.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.27239990234375, -4.1307373046875, -3.98907470703125, -3.847412109375, -3.70574951171875, -3.5640869140625, -3.42242431640625, -3.28076171875, -3.13909912109375, -2.9974365234375, -2.85577392578125, -2.714111328125, -2.57244873046875, -2.4307861328125, -2.28912353515625, -2.1474609375, -2.00579833984375, -1.8641357421875, -1.72247314453125, -1.580810546875, -1.43914794921875, -1.2974853515625, -1.15582275390625, -1.01416015625, -0.87249755859375, -0.7308349609375, -0.58917236328125, -0.447509765625, -0.30584716796875, -0.1641845703125, -0.02252197265625, 0.119140625, 0.26080322265625, 0.4024658203125, 0.54412841796875, 0.685791015625, 0.82745361328125, 0.9691162109375, 1.11077880859375, 1.25244140625, 1.39410400390625, 1.5357666015625, 1.67742919921875, 1.819091796875, 1.96075439453125, 2.1024169921875, 2.24407958984375, 2.3857421875, 2.52740478515625, 2.6690673828125, 2.81072998046875, 2.952392578125, 3.09405517578125, 3.2357177734375, 3.37738037109375, 3.51904296875, 3.66070556640625, 3.8023681640625, 3.94403076171875, 4.085693359375, 4.22735595703125, 4.3690185546875, 4.51068115234375, 4.65234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 9.0, 8.0, 22.0, 13.0, 18.0, 30.0, 50.0, 65.0, 73.0, 107.0, 140.0, 214.0, 240.0, 319.0, 509.0, 792.0, 1201.0, 2366.0, 9063.0, 74688.0, 631130.0, 290679.0, 27531.0, 4454.0, 1621.0, 881.0, 638.0, 458.0, 334.0, 233.0, 163.0, 134.0, 89.0, 71.0, 54.0, 33.0, 29.0, 27.0, 15.0, 13.0, 5.0, 7.0, 7.0, 7.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.96875, -28.027587890625, -27.08642578125, -26.145263671875, -25.2041015625, -24.262939453125, -23.32177734375, -22.380615234375, -21.439453125, -20.498291015625, -19.55712890625, -18.615966796875, -17.6748046875, -16.733642578125, -15.79248046875, -14.851318359375, -13.91015625, -12.968994140625, -12.02783203125, -11.086669921875, -10.1455078125, -9.204345703125, -8.26318359375, -7.322021484375, -6.380859375, -5.439697265625, -4.49853515625, -3.557373046875, -2.6162109375, -1.675048828125, -0.73388671875, 0.207275390625, 1.1484375, 2.089599609375, 3.03076171875, 3.971923828125, 4.9130859375, 5.854248046875, 6.79541015625, 7.736572265625, 8.677734375, 9.618896484375, 10.56005859375, 11.501220703125, 12.4423828125, 13.383544921875, 14.32470703125, 15.265869140625, 16.20703125, 17.148193359375, 18.08935546875, 19.030517578125, 19.9716796875, 20.912841796875, 21.85400390625, 22.795166015625, 23.736328125, 24.677490234375, 25.61865234375, 26.559814453125, 27.5009765625, 28.442138671875, 29.38330078125, 30.324462890625, 31.265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 10.0, 19.0, 16.0, 22.0, 24.0, 30.0, 45.0, 50.0, 57.0, 60.0, 65.0, 68.0, 68.0, 67.0, 56.0, 63.0, 58.0, 46.0, 26.0, 37.0, 32.0, 27.0, 21.0, 10.0, 9.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.59375, -38.689697265625, -37.78564453125, -36.881591796875, -35.9775390625, -35.073486328125, -34.16943359375, -33.265380859375, -32.361328125, -31.457275390625, -30.55322265625, -29.649169921875, -28.7451171875, -27.841064453125, -26.93701171875, -26.032958984375, -25.12890625, -24.224853515625, -23.32080078125, -22.416748046875, -21.5126953125, -20.608642578125, -19.70458984375, -18.800537109375, -17.896484375, -16.992431640625, -16.08837890625, -15.184326171875, -14.2802734375, -13.376220703125, -12.47216796875, -11.568115234375, -10.6640625, -9.760009765625, -8.85595703125, -7.951904296875, -7.0478515625, -6.143798828125, -5.23974609375, -4.335693359375, -3.431640625, -2.527587890625, -1.62353515625, -0.719482421875, 0.1845703125, 1.088623046875, 1.99267578125, 2.896728515625, 3.80078125, 4.704833984375, 5.60888671875, 6.512939453125, 7.4169921875, 8.321044921875, 9.22509765625, 10.129150390625, 11.033203125, 11.937255859375, 12.84130859375, 13.745361328125, 14.6494140625, 15.553466796875, 16.45751953125, 17.361572265625, 18.265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 4.0, 8.0, 17.0, 19.0, 32.0, 30.0, 46.0, 64.0, 118.0, 172.0, 299.0, 549.0, 1125.0, 2232.0, 6220.0, 20764.0, 106445.0, 574049.0, 274360.0, 44071.0, 10883.0, 3623.0, 1571.0, 738.0, 396.0, 237.0, 146.0, 95.0, 61.0, 50.0, 38.0, 16.0, 14.0, 12.0, 9.0, 9.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.96875, -11.56640625, -11.1640625, -10.76171875, -10.359375, -9.95703125, -9.5546875, -9.15234375, -8.75, -8.34765625, -7.9453125, -7.54296875, -7.140625, -6.73828125, -6.3359375, -5.93359375, -5.53125, -5.12890625, -4.7265625, -4.32421875, -3.921875, -3.51953125, -3.1171875, -2.71484375, -2.3125, -1.91015625, -1.5078125, -1.10546875, -0.703125, -0.30078125, 0.1015625, 0.50390625, 0.90625, 1.30859375, 1.7109375, 2.11328125, 2.515625, 2.91796875, 3.3203125, 3.72265625, 4.125, 4.52734375, 4.9296875, 5.33203125, 5.734375, 6.13671875, 6.5390625, 6.94140625, 7.34375, 7.74609375, 8.1484375, 8.55078125, 8.953125, 9.35546875, 9.7578125, 10.16015625, 10.5625, 10.96484375, 11.3671875, 11.76953125, 12.171875, 12.57421875, 12.9765625, 13.37890625, 13.78125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 10.0, 8.0, 20.0, 19.0, 29.0, 43.0, 52.0, 54.0, 86.0, 87.0, 106.0, 95.0, 87.0, 89.0, 53.0, 39.0, 39.0, 25.0, 10.0, 8.0, 5.0, 3.0, 2.0, 7.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00232696533203125, -0.0022652000188827515, -0.002203434705734253, -0.0021416693925857544, -0.002079904079437256, -0.0020181387662887573, -0.001956373453140259, -0.0018946081399917603, -0.0018328428268432617, -0.0017710775136947632, -0.0017093122005462646, -0.0016475468873977661, -0.0015857815742492676, -0.001524016261100769, -0.0014622509479522705, -0.001400485634803772, -0.0013387203216552734, -0.001276955008506775, -0.0012151896953582764, -0.0011534243822097778, -0.0010916590690612793, -0.0010298937559127808, -0.0009681284427642822, -0.0009063631296157837, -0.0008445978164672852, -0.0007828325033187866, -0.0007210671901702881, -0.0006593018770217896, -0.000597536563873291, -0.0005357712507247925, -0.00047400593757629395, -0.0004122406244277954, -0.0003504753112792969, -0.00028870999813079834, -0.0002269446849822998, -0.00016517937183380127, -0.00010341405868530273, -4.16487455368042e-05, 2.0116567611694336e-05, 8.188188076019287e-05, 0.0001436471939086914, 0.00020541250705718994, 0.0002671778202056885, 0.000328943133354187, 0.00039070844650268555, 0.0004524737596511841, 0.0005142390727996826, 0.0005760043859481812, 0.0006377696990966797, 0.0006995350122451782, 0.0007613003253936768, 0.0008230656385421753, 0.0008848309516906738, 0.0009465962648391724, 0.001008361577987671, 0.0010701268911361694, 0.001131892204284668, 0.0011936575174331665, 0.001255422830581665, 0.0013171881437301636, 0.0013789534568786621, 0.0014407187700271606, 0.0015024840831756592, 0.0015642493963241577, 0.0016260147094726562]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 14.0, 13.0, 16.0, 32.0, 55.0, 94.0, 240.0, 500.0, 1552.0, 7867.0, 184862.0, 826295.0, 22564.0, 2976.0, 817.0, 302.0, 160.0, 85.0, 39.0, 21.0, 10.0, 10.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.40625, -33.456298828125, -32.50634765625, -31.556396484375, -30.6064453125, -29.656494140625, -28.70654296875, -27.756591796875, -26.806640625, -25.856689453125, -24.90673828125, -23.956787109375, -23.0068359375, -22.056884765625, -21.10693359375, -20.156982421875, -19.20703125, -18.257080078125, -17.30712890625, -16.357177734375, -15.4072265625, -14.457275390625, -13.50732421875, -12.557373046875, -11.607421875, -10.657470703125, -9.70751953125, -8.757568359375, -7.8076171875, -6.857666015625, -5.90771484375, -4.957763671875, -4.0078125, -3.057861328125, -2.10791015625, -1.157958984375, -0.2080078125, 0.741943359375, 1.69189453125, 2.641845703125, 3.591796875, 4.541748046875, 5.49169921875, 6.441650390625, 7.3916015625, 8.341552734375, 9.29150390625, 10.241455078125, 11.19140625, 12.141357421875, 13.09130859375, 14.041259765625, 14.9912109375, 15.941162109375, 16.89111328125, 17.841064453125, 18.791015625, 19.740966796875, 20.69091796875, 21.640869140625, 22.5908203125, 23.540771484375, 24.49072265625, 25.440673828125, 26.390625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 11.0, 12.0, 27.0, 43.0, 59.0, 72.0, 103.0, 134.0, 131.0, 128.0, 92.0, 55.0, 44.0, 22.0, 16.0, 17.0, 15.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.78125, -13.210205078125, -12.63916015625, -12.068115234375, -11.4970703125, -10.926025390625, -10.35498046875, -9.783935546875, -9.212890625, -8.641845703125, -8.07080078125, -7.499755859375, -6.9287109375, -6.357666015625, -5.78662109375, -5.215576171875, -4.64453125, -4.073486328125, -3.50244140625, -2.931396484375, -2.3603515625, -1.789306640625, -1.21826171875, -0.647216796875, -0.076171875, 0.494873046875, 1.06591796875, 1.636962890625, 2.2080078125, 2.779052734375, 3.35009765625, 3.921142578125, 4.4921875, 5.063232421875, 5.63427734375, 6.205322265625, 6.7763671875, 7.347412109375, 7.91845703125, 8.489501953125, 9.060546875, 9.631591796875, 10.20263671875, 10.773681640625, 11.3447265625, 11.915771484375, 12.48681640625, 13.057861328125, 13.62890625, 14.199951171875, 14.77099609375, 15.342041015625, 15.9130859375, 16.484130859375, 17.05517578125, 17.626220703125, 18.197265625, 18.768310546875, 19.33935546875, 19.910400390625, 20.4814453125, 21.052490234375, 21.62353515625, 22.194580078125, 22.765625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 36.0, 165.0, 378.0, 283.0, 105.0, 26.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-695.87353515625, -679.59033203125, -663.3070678710938, -647.0238647460938, -630.7406005859375, -614.4573974609375, -598.1741943359375, -581.8909301757812, -565.6077270507812, -549.3245239257812, -533.041259765625, -516.758056640625, -500.4748229980469, -484.19158935546875, -467.90838623046875, -451.6251525878906, -435.3419189453125, -419.0586853027344, -402.77545166015625, -386.49224853515625, -370.2090148925781, -353.92578125, -337.642578125, -321.3593444824219, -305.07611083984375, -288.7928771972656, -272.5096435546875, -256.2264404296875, -239.94320678710938, -223.65997314453125, -207.3767547607422, -191.09353637695312, -174.81024169921875, -158.52700805664062, -142.24378967285156, -125.96056365966797, -109.67733764648438, -93.39411163330078, -77.11088562011719, -60.827659606933594, -44.54443359375, -28.261207580566406, -11.977981567382812, 4.305244445800781, 20.588470458984375, 36.87169647216797, 53.15492248535156, 69.43814849853516, 85.72137451171875, 102.00460052490234, 118.28782653808594, 134.571044921875, 150.85427856445312, 167.13751220703125, 183.4207305908203, 199.70394897460938, 215.9871826171875, 232.27041625976562, 248.5536346435547, 264.83685302734375, 281.1200866699219, 297.4033203125, 313.6865234375, 329.9697570800781, 346.25299072265625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 4.0, 4.0, 9.0, 10.0, 6.0, 15.0, 12.0, 13.0, 22.0, 16.0, 25.0, 25.0, 52.0, 29.0, 42.0, 41.0, 47.0, 45.0, 48.0, 49.0, 67.0, 34.0, 35.0, 45.0, 42.0, 41.0, 27.0, 32.0, 23.0, 16.0, 30.0, 12.0, 12.0, 13.0, 11.0, 6.0, 10.0, 9.0, 6.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-104.74134826660156, -101.6285171508789, -98.51568603515625, -95.40284729003906, -92.2900161743164, -89.17718505859375, -86.06434631347656, -82.9515151977539, -79.83868408203125, -76.7258529663086, -73.61302185058594, -70.50018310546875, -67.3873519897461, -64.27452087402344, -61.161685943603516, -58.048851013183594, -54.93601989746094, -51.82318878173828, -48.71035385131836, -45.59751892089844, -42.48468780517578, -39.371856689453125, -36.2590217590332, -33.14618682861328, -30.033355712890625, -26.920522689819336, -23.807689666748047, -20.694856643676758, -17.58202362060547, -14.46919059753418, -11.35635757446289, -8.243524551391602, -5.1306915283203125, -2.0178585052490234, 1.0949745178222656, 4.207807540893555, 7.320640563964844, 10.433473587036133, 13.546306610107422, 16.65913963317871, 19.77197265625, 22.88480567932129, 25.997638702392578, 29.110471725463867, 32.223304748535156, 35.33613586425781, 38.448970794677734, 41.561805725097656, 44.67463684082031, 47.78746795654297, 50.90030288696289, 54.01313781738281, 57.12596893310547, 60.238800048828125, 63.35163497924805, 66.46446990966797, 69.57730102539062, 72.69013214111328, 75.80296325683594, 78.91580200195312, 82.02863311767578, 85.14146423339844, 88.25430297851562, 91.36713409423828, 94.47996520996094]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 10.0, 10.0, 9.0, 21.0, 35.0, 41.0, 60.0, 105.0, 210.0, 361.0, 784.0, 1935.0, 5577.0, 24944.0, 465784.0, 3650697.0, 32645.0, 6889.0, 2220.0, 914.0, 388.0, 244.0, 132.0, 72.0, 62.0, 46.0, 21.0, 15.0, 12.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.125, -33.02685546875, -31.9287109375, -30.83056640625, -29.732421875, -28.63427734375, -27.5361328125, -26.43798828125, -25.33984375, -24.24169921875, -23.1435546875, -22.04541015625, -20.947265625, -19.84912109375, -18.7509765625, -17.65283203125, -16.5546875, -15.45654296875, -14.3583984375, -13.26025390625, -12.162109375, -11.06396484375, -9.9658203125, -8.86767578125, -7.76953125, -6.67138671875, -5.5732421875, -4.47509765625, -3.376953125, -2.27880859375, -1.1806640625, -0.08251953125, 1.015625, 2.11376953125, 3.2119140625, 4.31005859375, 5.408203125, 6.50634765625, 7.6044921875, 8.70263671875, 9.80078125, 10.89892578125, 11.9970703125, 13.09521484375, 14.193359375, 15.29150390625, 16.3896484375, 17.48779296875, 18.5859375, 19.68408203125, 20.7822265625, 21.88037109375, 22.978515625, 24.07666015625, 25.1748046875, 26.27294921875, 27.37109375, 28.46923828125, 29.5673828125, 30.66552734375, 31.763671875, 32.86181640625, 33.9599609375, 35.05810546875, 36.15625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 3.0, 7.0, 10.0, 14.0, 8.0, 14.0, 13.0, 17.0, 19.0, 31.0, 41.0, 40.0, 32.0, 40.0, 35.0, 50.0, 60.0, 51.0, 51.0, 43.0, 47.0, 43.0, 39.0, 42.0, 37.0, 35.0, 28.0, 27.0, 22.0, 18.0, 9.0, 8.0, 12.0, 14.0, 10.0, 4.0, 4.0, 2.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.978515625, -3.843414306640625, -3.70831298828125, -3.573211669921875, -3.4381103515625, -3.303009033203125, -3.16790771484375, -3.032806396484375, -2.897705078125, -2.762603759765625, -2.62750244140625, -2.492401123046875, -2.3572998046875, -2.222198486328125, -2.08709716796875, -1.951995849609375, -1.81689453125, -1.681793212890625, -1.54669189453125, -1.411590576171875, -1.2764892578125, -1.141387939453125, -1.00628662109375, -0.871185302734375, -0.736083984375, -0.600982666015625, -0.46588134765625, -0.330780029296875, -0.1956787109375, -0.060577392578125, 0.07452392578125, 0.209625244140625, 0.3447265625, 0.479827880859375, 0.61492919921875, 0.750030517578125, 0.8851318359375, 1.020233154296875, 1.15533447265625, 1.290435791015625, 1.425537109375, 1.560638427734375, 1.69573974609375, 1.830841064453125, 1.9659423828125, 2.101043701171875, 2.23614501953125, 2.371246337890625, 2.50634765625, 2.641448974609375, 2.77655029296875, 2.911651611328125, 3.0467529296875, 3.181854248046875, 3.31695556640625, 3.452056884765625, 3.587158203125, 3.722259521484375, 3.85736083984375, 3.992462158203125, 4.1275634765625, 4.262664794921875, 4.39776611328125, 4.532867431640625, 4.66796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 6.0, 17.0, 27.0, 31.0, 47.0, 65.0, 99.0, 156.0, 210.0, 277.0, 427.0, 660.0, 996.0, 1423.0, 2486.0, 4067.0, 7324.0, 15124.0, 38313.0, 141681.0, 3428633.0, 433769.0, 69858.0, 23873.0, 10347.0, 5655.0, 3080.0, 1902.0, 1228.0, 872.0, 478.0, 341.0, 217.0, 174.0, 138.0, 84.0, 60.0, 34.0, 29.0, 23.0, 13.0, 11.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -11.9818115234375, -11.565185546875, -11.1485595703125, -10.73193359375, -10.3153076171875, -9.898681640625, -9.4820556640625, -9.0654296875, -8.6488037109375, -8.232177734375, -7.8155517578125, -7.39892578125, -6.9822998046875, -6.565673828125, -6.1490478515625, -5.732421875, -5.3157958984375, -4.899169921875, -4.4825439453125, -4.06591796875, -3.6492919921875, -3.232666015625, -2.8160400390625, -2.3994140625, -1.9827880859375, -1.566162109375, -1.1495361328125, -0.73291015625, -0.3162841796875, 0.100341796875, 0.5169677734375, 0.93359375, 1.3502197265625, 1.766845703125, 2.1834716796875, 2.60009765625, 3.0167236328125, 3.433349609375, 3.8499755859375, 4.2666015625, 4.6832275390625, 5.099853515625, 5.5164794921875, 5.93310546875, 6.3497314453125, 6.766357421875, 7.1829833984375, 7.599609375, 8.0162353515625, 8.432861328125, 8.8494873046875, 9.26611328125, 9.6827392578125, 10.099365234375, 10.5159912109375, 10.9326171875, 11.3492431640625, 11.765869140625, 12.1824951171875, 12.59912109375, 13.0157470703125, 13.432373046875, 13.8489990234375, 14.265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 6.0, 11.0, 11.0, 14.0, 23.0, 39.0, 46.0, 75.0, 151.0, 323.0, 2387.0, 478.0, 199.0, 95.0, 58.0, 41.0, 26.0, 16.0, 13.0, 8.0, 10.0, 4.0, 8.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.01446533203125, -2.8922119140625, -2.76995849609375, -2.647705078125, -2.52545166015625, -2.4031982421875, -2.28094482421875, -2.15869140625, -2.03643798828125, -1.9141845703125, -1.79193115234375, -1.669677734375, -1.54742431640625, -1.4251708984375, -1.30291748046875, -1.1806640625, -1.05841064453125, -0.9361572265625, -0.81390380859375, -0.691650390625, -0.56939697265625, -0.4471435546875, -0.32489013671875, -0.20263671875, -0.08038330078125, 0.0418701171875, 0.16412353515625, 0.286376953125, 0.40863037109375, 0.5308837890625, 0.65313720703125, 0.775390625, 0.89764404296875, 1.0198974609375, 1.14215087890625, 1.264404296875, 1.38665771484375, 1.5089111328125, 1.63116455078125, 1.75341796875, 1.87567138671875, 1.9979248046875, 2.12017822265625, 2.242431640625, 2.36468505859375, 2.4869384765625, 2.60919189453125, 2.7314453125, 2.85369873046875, 2.9759521484375, 3.09820556640625, 3.220458984375, 3.34271240234375, 3.4649658203125, 3.58721923828125, 3.70947265625, 3.83172607421875, 3.9539794921875, 4.07623291015625, 4.198486328125, 4.32073974609375, 4.4429931640625, 4.56524658203125, 4.6875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 36.0, 125.0, 266.0, 280.0, 190.0, 66.0, 24.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.20384216308594, -31.24742317199707, -29.291004180908203, -27.334583282470703, -25.378164291381836, -23.42174530029297, -21.46532440185547, -19.5089054107666, -17.552486419677734, -15.596067428588867, -13.639647483825684, -11.6832275390625, -9.726808547973633, -7.770389556884766, -5.813969612121582, -3.8575496673583984, -1.9011306762695312, 0.05528879165649414, 2.0117082595825195, 3.968127727508545, 5.92454719543457, 7.8809661865234375, 9.837386131286621, 11.793806076049805, 13.750225067138672, 15.706644058227539, 17.663063049316406, 19.619483947753906, 21.575902938842773, 23.53232192993164, 25.48874282836914, 27.445161819458008, 29.401580810546875, 31.357999801635742, 33.31441879272461, 35.27083969116211, 37.227256774902344, 39.183677673339844, 41.140098571777344, 43.096519470214844, 45.05293655395508, 47.00935745239258, 48.96577453613281, 50.92219543457031, 52.87861633300781, 54.83503341674805, 56.79145431518555, 58.74787139892578, 60.70429229736328, 62.66071319580078, 64.61713409423828, 66.57354736328125, 68.52996826171875, 70.48638916015625, 72.44281005859375, 74.39923095703125, 76.35565185546875, 78.31207275390625, 80.26849365234375, 82.22490692138672, 84.18132781982422, 86.13774871826172, 88.09416961669922, 90.05059051513672, 92.00700378417969]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 1.0, 1.0, 6.0, 4.0, 8.0, 7.0, 10.0, 9.0, 19.0, 19.0, 20.0, 23.0, 21.0, 33.0, 31.0, 27.0, 37.0, 29.0, 35.0, 43.0, 42.0, 30.0, 47.0, 44.0, 46.0, 49.0, 34.0, 32.0, 22.0, 35.0, 31.0, 17.0, 38.0, 21.0, 19.0, 19.0, 13.0, 16.0, 16.0, 11.0, 9.0, 7.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.307706832885742, -10.970895767211914, -10.634084701538086, -10.297273635864258, -9.960461616516113, -9.623650550842285, -9.286839485168457, -8.950028419494629, -8.613216400146484, -8.276405334472656, -7.93959379196167, -7.602782726287842, -7.2659711837768555, -6.929160118103027, -6.592349052429199, -6.255537986755371, -5.918726921081543, -5.581915855407715, -5.2451043128967285, -4.9082932472229, -4.571481704711914, -4.234670639038086, -3.897859573364258, -3.5610482692718506, -3.2242369651794434, -2.887425661087036, -2.550614356994629, -2.213803291320801, -1.8769919872283936, -1.5401806831359863, -1.2033696174621582, -0.866558313369751, -0.5297470092773438, -0.1929357647895813, 0.14387547969818115, 0.48068666458129883, 0.817497968673706, 1.1543092727661133, 1.4911203384399414, 1.8279316425323486, 2.164742946624756, 2.501554250717163, 2.8383655548095703, 3.1751766204833984, 3.5119879245758057, 3.848799228668213, 4.185610294342041, 4.522421836853027, 4.8592329025268555, 5.196043968200684, 5.53285551071167, 5.869666576385498, 6.206478118896484, 6.5432891845703125, 6.880100250244141, 7.216911315917969, 7.553722858428955, 7.890533924102783, 8.22734546661377, 8.564156532287598, 8.900967597961426, 9.23777961730957, 9.574590682983398, 9.911401748657227, 10.248212814331055]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 8.0, 16.0, 26.0, 39.0, 39.0, 73.0, 107.0, 170.0, 249.0, 385.0, 564.0, 959.0, 1681.0, 2932.0, 5498.0, 10842.0, 22879.0, 49054.0, 103132.0, 191439.0, 251251.0, 198055.0, 108452.0, 51971.0, 24042.0, 11424.0, 5673.0, 3116.0, 1691.0, 1032.0, 662.0, 348.0, 260.0, 153.0, 108.0, 79.0, 50.0, 31.0, 18.0, 5.0, 3.0, 13.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.390625, -9.110595703125, -8.83056640625, -8.550537109375, -8.2705078125, -7.990478515625, -7.71044921875, -7.430419921875, -7.150390625, -6.870361328125, -6.59033203125, -6.310302734375, -6.0302734375, -5.750244140625, -5.47021484375, -5.190185546875, -4.91015625, -4.630126953125, -4.35009765625, -4.070068359375, -3.7900390625, -3.510009765625, -3.22998046875, -2.949951171875, -2.669921875, -2.389892578125, -2.10986328125, -1.829833984375, -1.5498046875, -1.269775390625, -0.98974609375, -0.709716796875, -0.4296875, -0.149658203125, 0.13037109375, 0.410400390625, 0.6904296875, 0.970458984375, 1.25048828125, 1.530517578125, 1.810546875, 2.090576171875, 2.37060546875, 2.650634765625, 2.9306640625, 3.210693359375, 3.49072265625, 3.770751953125, 4.05078125, 4.330810546875, 4.61083984375, 4.890869140625, 5.1708984375, 5.450927734375, 5.73095703125, 6.010986328125, 6.291015625, 6.571044921875, 6.85107421875, 7.131103515625, 7.4111328125, 7.691162109375, 7.97119140625, 8.251220703125, 8.53125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 9.0, 12.0, 12.0, 16.0, 16.0, 17.0, 24.0, 23.0, 34.0, 31.0, 33.0, 38.0, 35.0, 32.0, 50.0, 55.0, 56.0, 59.0, 39.0, 38.0, 49.0, 34.0, 35.0, 37.0, 28.0, 28.0, 21.0, 16.0, 16.0, 16.0, 12.0, 16.0, 11.0, 8.0, 6.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.994140625, -3.856597900390625, -3.71905517578125, -3.581512451171875, -3.4439697265625, -3.306427001953125, -3.16888427734375, -3.031341552734375, -2.893798828125, -2.756256103515625, -2.61871337890625, -2.481170654296875, -2.3436279296875, -2.206085205078125, -2.06854248046875, -1.930999755859375, -1.79345703125, -1.655914306640625, -1.51837158203125, -1.380828857421875, -1.2432861328125, -1.105743408203125, -0.96820068359375, -0.830657958984375, -0.693115234375, -0.555572509765625, -0.41802978515625, -0.280487060546875, -0.1429443359375, -0.005401611328125, 0.13214111328125, 0.269683837890625, 0.4072265625, 0.544769287109375, 0.68231201171875, 0.819854736328125, 0.9573974609375, 1.094940185546875, 1.23248291015625, 1.370025634765625, 1.507568359375, 1.645111083984375, 1.78265380859375, 1.920196533203125, 2.0577392578125, 2.195281982421875, 2.33282470703125, 2.470367431640625, 2.60791015625, 2.745452880859375, 2.88299560546875, 3.020538330078125, 3.1580810546875, 3.295623779296875, 3.43316650390625, 3.570709228515625, 3.708251953125, 3.845794677734375, 3.98333740234375, 4.120880126953125, 4.2584228515625, 4.395965576171875, 4.53350830078125, 4.671051025390625, 4.80859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 6.0, 16.0, 11.0, 14.0, 30.0, 29.0, 39.0, 69.0, 77.0, 107.0, 146.0, 196.0, 283.0, 333.0, 484.0, 697.0, 1107.0, 1845.0, 5059.0, 31541.0, 387526.0, 557290.0, 48966.0, 6628.0, 2050.0, 1191.0, 719.0, 532.0, 382.0, 273.0, 231.0, 174.0, 136.0, 98.0, 69.0, 58.0, 32.0, 28.0, 16.0, 17.0, 13.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-23.84375, -23.076904296875, -22.31005859375, -21.543212890625, -20.7763671875, -20.009521484375, -19.24267578125, -18.475830078125, -17.708984375, -16.942138671875, -16.17529296875, -15.408447265625, -14.6416015625, -13.874755859375, -13.10791015625, -12.341064453125, -11.57421875, -10.807373046875, -10.04052734375, -9.273681640625, -8.5068359375, -7.739990234375, -6.97314453125, -6.206298828125, -5.439453125, -4.672607421875, -3.90576171875, -3.138916015625, -2.3720703125, -1.605224609375, -0.83837890625, -0.071533203125, 0.6953125, 1.462158203125, 2.22900390625, 2.995849609375, 3.7626953125, 4.529541015625, 5.29638671875, 6.063232421875, 6.830078125, 7.596923828125, 8.36376953125, 9.130615234375, 9.8974609375, 10.664306640625, 11.43115234375, 12.197998046875, 12.96484375, 13.731689453125, 14.49853515625, 15.265380859375, 16.0322265625, 16.799072265625, 17.56591796875, 18.332763671875, 19.099609375, 19.866455078125, 20.63330078125, 21.400146484375, 22.1669921875, 22.933837890625, 23.70068359375, 24.467529296875, 25.234375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 6.0, 11.0, 14.0, 14.0, 11.0, 17.0, 17.0, 14.0, 23.0, 19.0, 24.0, 32.0, 42.0, 34.0, 32.0, 42.0, 48.0, 41.0, 49.0, 39.0, 57.0, 40.0, 44.0, 40.0, 38.0, 28.0, 37.0, 26.0, 23.0, 20.0, 16.0, 20.0, 13.0, 13.0, 7.0, 5.0, 4.0, 5.0, 6.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.4375, -19.834228515625, -19.23095703125, -18.627685546875, -18.0244140625, -17.421142578125, -16.81787109375, -16.214599609375, -15.611328125, -15.008056640625, -14.40478515625, -13.801513671875, -13.1982421875, -12.594970703125, -11.99169921875, -11.388427734375, -10.78515625, -10.181884765625, -9.57861328125, -8.975341796875, -8.3720703125, -7.768798828125, -7.16552734375, -6.562255859375, -5.958984375, -5.355712890625, -4.75244140625, -4.149169921875, -3.5458984375, -2.942626953125, -2.33935546875, -1.736083984375, -1.1328125, -0.529541015625, 0.07373046875, 0.677001953125, 1.2802734375, 1.883544921875, 2.48681640625, 3.090087890625, 3.693359375, 4.296630859375, 4.89990234375, 5.503173828125, 6.1064453125, 6.709716796875, 7.31298828125, 7.916259765625, 8.51953125, 9.122802734375, 9.72607421875, 10.329345703125, 10.9326171875, 11.535888671875, 12.13916015625, 12.742431640625, 13.345703125, 13.948974609375, 14.55224609375, 15.155517578125, 15.7587890625, 16.362060546875, 16.96533203125, 17.568603515625, 18.171875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 8.0, 18.0, 32.0, 55.0, 105.0, 183.0, 374.0, 1083.0, 7161.0, 727211.0, 306399.0, 4311.0, 865.0, 378.0, 179.0, 68.0, 44.0, 25.0, 20.0, 5.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.555419921875, -31.67333984375, -30.791259765625, -29.9091796875, -29.027099609375, -28.14501953125, -27.262939453125, -26.380859375, -25.498779296875, -24.61669921875, -23.734619140625, -22.8525390625, -21.970458984375, -21.08837890625, -20.206298828125, -19.32421875, -18.442138671875, -17.56005859375, -16.677978515625, -15.7958984375, -14.913818359375, -14.03173828125, -13.149658203125, -12.267578125, -11.385498046875, -10.50341796875, -9.621337890625, -8.7392578125, -7.857177734375, -6.97509765625, -6.093017578125, -5.2109375, -4.328857421875, -3.44677734375, -2.564697265625, -1.6826171875, -0.800537109375, 0.08154296875, 0.963623046875, 1.845703125, 2.727783203125, 3.60986328125, 4.491943359375, 5.3740234375, 6.256103515625, 7.13818359375, 8.020263671875, 8.90234375, 9.784423828125, 10.66650390625, 11.548583984375, 12.4306640625, 13.312744140625, 14.19482421875, 15.076904296875, 15.958984375, 16.841064453125, 17.72314453125, 18.605224609375, 19.4873046875, 20.369384765625, 21.25146484375, 22.133544921875, 23.015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 5.0, 4.0, 8.0, 13.0, 19.0, 21.0, 40.0, 64.0, 68.0, 119.0, 119.0, 153.0, 88.0, 82.0, 62.0, 43.0, 26.0, 21.0, 12.0, 6.0, 8.0, 6.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.002300262451171875, -0.0022467374801635742, -0.0021932125091552734, -0.0021396875381469727, -0.002086162567138672, -0.002032637596130371, -0.0019791126251220703, -0.0019255876541137695, -0.0018720626831054688, -0.001818537712097168, -0.0017650127410888672, -0.0017114877700805664, -0.0016579627990722656, -0.0016044378280639648, -0.001550912857055664, -0.0014973878860473633, -0.0014438629150390625, -0.0013903379440307617, -0.001336812973022461, -0.0012832880020141602, -0.0012297630310058594, -0.0011762380599975586, -0.0011227130889892578, -0.001069188117980957, -0.0010156631469726562, -0.0009621381759643555, -0.0009086132049560547, -0.0008550882339477539, -0.0008015632629394531, -0.0007480382919311523, -0.0006945133209228516, -0.0006409883499145508, -0.00058746337890625, -0.0005339384078979492, -0.00048041343688964844, -0.00042688846588134766, -0.0003733634948730469, -0.0003198385238647461, -0.0002663135528564453, -0.00021278858184814453, -0.00015926361083984375, -0.00010573863983154297, -5.221366882324219e-05, 1.3113021850585938e-06, 5.4836273193359375e-05, 0.00010836124420166016, 0.00016188621520996094, 0.00021541118621826172, 0.0002689361572265625, 0.0003224611282348633, 0.00037598609924316406, 0.00042951107025146484, 0.0004830360412597656, 0.0005365610122680664, 0.0005900859832763672, 0.000643610954284668, 0.0006971359252929688, 0.0007506608963012695, 0.0008041858673095703, 0.0008577108383178711, 0.0009112358093261719, 0.0009647607803344727, 0.0010182857513427734, 0.0010718107223510742, 0.001125335693359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 19.0, 21.0, 40.0, 99.0, 228.0, 806.0, 5583.0, 932535.0, 106097.0, 2314.0, 447.0, 178.0, 91.0, 39.0, 19.0, 18.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.625, -42.208984375, -40.79296875, -39.376953125, -37.9609375, -36.544921875, -35.12890625, -33.712890625, -32.296875, -30.880859375, -29.46484375, -28.048828125, -26.6328125, -25.216796875, -23.80078125, -22.384765625, -20.96875, -19.552734375, -18.13671875, -16.720703125, -15.3046875, -13.888671875, -12.47265625, -11.056640625, -9.640625, -8.224609375, -6.80859375, -5.392578125, -3.9765625, -2.560546875, -1.14453125, 0.271484375, 1.6875, 3.103515625, 4.51953125, 5.935546875, 7.3515625, 8.767578125, 10.18359375, 11.599609375, 13.015625, 14.431640625, 15.84765625, 17.263671875, 18.6796875, 20.095703125, 21.51171875, 22.927734375, 24.34375, 25.759765625, 27.17578125, 28.591796875, 30.0078125, 31.423828125, 32.83984375, 34.255859375, 35.671875, 37.087890625, 38.50390625, 39.919921875, 41.3359375, 42.751953125, 44.16796875, 45.583984375, 47.0]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 20.0, 25.0, 55.0, 87.0, 160.0, 209.0, 211.0, 117.0, 53.0, 27.0, 13.0, 9.0, 6.0, 5.0, 2.0, 2.0], "bins": [-41.21875, -40.4508056640625, -39.682861328125, -38.9149169921875, -38.14697265625, -37.3790283203125, -36.611083984375, -35.8431396484375, -35.0751953125, -34.3072509765625, -33.539306640625, -32.7713623046875, -32.00341796875, -31.2354736328125, -30.467529296875, -29.6995849609375, -28.931640625, -28.1636962890625, -27.395751953125, -26.6278076171875, -25.85986328125, -25.0919189453125, -24.323974609375, -23.5560302734375, -22.7880859375, -22.0201416015625, -21.252197265625, -20.4842529296875, -19.71630859375, -18.9483642578125, -18.180419921875, -17.4124755859375, -16.64453125, -15.8765869140625, -15.108642578125, -14.3406982421875, -13.57275390625, -12.8048095703125, -12.036865234375, -11.2689208984375, -10.5009765625, -9.7330322265625, -8.965087890625, -8.1971435546875, -7.42919921875, -6.6612548828125, -5.893310546875, -5.1253662109375, -4.357421875, -3.5894775390625, -2.821533203125, -2.0535888671875, -1.28564453125, -0.5177001953125, 0.250244140625, 1.0181884765625, 1.7861328125, 2.5540771484375, 3.322021484375, 4.0899658203125, 4.85791015625, 5.6258544921875, 6.393798828125, 7.1617431640625, 7.9296875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 23.0, 112.0, 613.0, 233.0, 23.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-711.9569702148438, -688.7424926757812, -665.5280151367188, -642.3134765625, -619.0989990234375, -595.884521484375, -572.6700439453125, -549.45556640625, -526.2410888671875, -503.026611328125, -479.8121032714844, -456.5976257324219, -433.38311767578125, -410.16864013671875, -386.95416259765625, -363.73968505859375, -340.525146484375, -317.3106689453125, -294.0961608886719, -270.8816833496094, -247.6671905517578, -224.45269775390625, -201.23822021484375, -178.0237274169922, -154.80923461914062, -131.59474182128906, -108.38025665283203, -85.165771484375, -61.95127868652344, -38.736785888671875, -15.522308349609375, 7.6921844482421875, 30.9066162109375, 54.1211051940918, 77.3355941772461, 100.55007934570312, 123.76457214355469, 146.97906494140625, 170.19354248046875, 193.4080352783203, 216.62252807617188, 239.83702087402344, 263.051513671875, 286.2659912109375, 309.48046875, 332.6949768066406, 355.9094543457031, 379.12396240234375, 402.33843994140625, 425.55291748046875, 448.7674255371094, 471.9819030761719, 495.1964111328125, 518.410888671875, 541.6253662109375, 564.83984375, 588.0543212890625, 611.268798828125, 634.4832763671875, 657.69775390625, 680.9122924804688, 704.1267700195312, 727.3412475585938, 750.5557250976562, 773.770263671875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 2.0, 6.0, 3.0, 6.0, 12.0, 11.0, 13.0, 16.0, 12.0, 19.0, 22.0, 23.0, 26.0, 28.0, 42.0, 41.0, 45.0, 46.0, 50.0, 52.0, 54.0, 52.0, 56.0, 44.0, 40.0, 46.0, 36.0, 34.0, 20.0, 29.0, 28.0, 18.0, 13.0, 13.0, 12.0, 5.0, 4.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-121.19415283203125, -117.8420181274414, -114.48988342285156, -111.13775634765625, -107.7856216430664, -104.43348693847656, -101.08135223388672, -97.72921752929688, -94.37709045410156, -91.02495574951172, -87.67282104492188, -84.32069396972656, -80.96855926513672, -77.61642456054688, -74.26428985595703, -70.91215515136719, -67.56002044677734, -64.2078857421875, -60.85575485229492, -57.50362014770508, -54.1514892578125, -50.799354553222656, -47.44721984863281, -44.09508514404297, -40.74295425415039, -37.39081954956055, -34.03868865966797, -30.686553955078125, -27.334421157836914, -23.982288360595703, -20.63015365600586, -17.27802085876465, -13.925888061523438, -10.573755264282227, -7.221621513366699, -3.869487762451172, -0.5173549652099609, 2.83477783203125, 6.186912536621094, 9.539045333862305, 12.891178131103516, 16.243310928344727, 19.595443725585938, 22.94757843017578, 26.299711227416992, 29.651844024658203, 33.00397872924805, 36.356109619140625, 39.70824432373047, 43.06037902832031, 46.41250991821289, 49.764644622802734, 53.11677551269531, 56.468910217285156, 59.821044921875, 63.173179626464844, 66.52531433105469, 69.87744903564453, 73.22958374023438, 76.58171081542969, 79.93384552001953, 83.28598022460938, 86.63811492919922, 89.99024963378906, 93.34237670898438]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 6.0, 13.0, 19.0, 35.0, 60.0, 94.0, 129.0, 197.0, 376.0, 664.0, 1215.0, 2896.0, 8312.0, 40211.0, 4025306.0, 93984.0, 13036.0, 4050.0, 1685.0, 797.0, 481.0, 254.0, 179.0, 102.0, 57.0, 43.0, 28.0, 10.0, 12.0, 10.0, 3.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.1875, -26.271240234375, -25.35498046875, -24.438720703125, -23.5224609375, -22.606201171875, -21.68994140625, -20.773681640625, -19.857421875, -18.941162109375, -18.02490234375, -17.108642578125, -16.1923828125, -15.276123046875, -14.35986328125, -13.443603515625, -12.52734375, -11.611083984375, -10.69482421875, -9.778564453125, -8.8623046875, -7.946044921875, -7.02978515625, -6.113525390625, -5.197265625, -4.281005859375, -3.36474609375, -2.448486328125, -1.5322265625, -0.615966796875, 0.30029296875, 1.216552734375, 2.1328125, 3.049072265625, 3.96533203125, 4.881591796875, 5.7978515625, 6.714111328125, 7.63037109375, 8.546630859375, 9.462890625, 10.379150390625, 11.29541015625, 12.211669921875, 13.1279296875, 14.044189453125, 14.96044921875, 15.876708984375, 16.79296875, 17.709228515625, 18.62548828125, 19.541748046875, 20.4580078125, 21.374267578125, 22.29052734375, 23.206787109375, 24.123046875, 25.039306640625, 25.95556640625, 26.871826171875, 27.7880859375, 28.704345703125, 29.62060546875, 30.536865234375, 31.453125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 5.0, 4.0, 3.0, 13.0, 12.0, 22.0, 16.0, 30.0, 27.0, 49.0, 27.0, 48.0, 45.0, 53.0, 57.0, 69.0, 60.0, 54.0, 58.0, 40.0, 41.0, 44.0, 35.0, 34.0, 30.0, 26.0, 21.0, 13.0, 14.0, 9.0, 12.0, 5.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.4453125, -6.26812744140625, -6.0909423828125, -5.91375732421875, -5.736572265625, -5.55938720703125, -5.3822021484375, -5.20501708984375, -5.02783203125, -4.85064697265625, -4.6734619140625, -4.49627685546875, -4.319091796875, -4.14190673828125, -3.9647216796875, -3.78753662109375, -3.6103515625, -3.43316650390625, -3.2559814453125, -3.07879638671875, -2.901611328125, -2.72442626953125, -2.5472412109375, -2.37005615234375, -2.19287109375, -2.01568603515625, -1.8385009765625, -1.66131591796875, -1.484130859375, -1.30694580078125, -1.1297607421875, -0.95257568359375, -0.775390625, -0.59820556640625, -0.4210205078125, -0.24383544921875, -0.066650390625, 0.11053466796875, 0.2877197265625, 0.46490478515625, 0.64208984375, 0.81927490234375, 0.9964599609375, 1.17364501953125, 1.350830078125, 1.52801513671875, 1.7052001953125, 1.88238525390625, 2.0595703125, 2.23675537109375, 2.4139404296875, 2.59112548828125, 2.768310546875, 2.94549560546875, 3.1226806640625, 3.29986572265625, 3.47705078125, 3.65423583984375, 3.8314208984375, 4.00860595703125, 4.185791015625, 4.36297607421875, 4.5401611328125, 4.71734619140625, 4.89453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 9.0, 13.0, 16.0, 18.0, 22.0, 49.0, 48.0, 73.0, 87.0, 135.0, 174.0, 232.0, 339.0, 476.0, 742.0, 1121.0, 1824.0, 3351.0, 6936.0, 20008.0, 106971.0, 3938167.0, 82046.0, 17133.0, 6257.0, 3034.0, 1644.0, 1018.0, 716.0, 486.0, 314.0, 241.0, 159.0, 119.0, 86.0, 62.0, 51.0, 39.0, 20.0, 13.0, 13.0, 7.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.546875, -16.970458984375, -16.39404296875, -15.817626953125, -15.2412109375, -14.664794921875, -14.08837890625, -13.511962890625, -12.935546875, -12.359130859375, -11.78271484375, -11.206298828125, -10.6298828125, -10.053466796875, -9.47705078125, -8.900634765625, -8.32421875, -7.747802734375, -7.17138671875, -6.594970703125, -6.0185546875, -5.442138671875, -4.86572265625, -4.289306640625, -3.712890625, -3.136474609375, -2.56005859375, -1.983642578125, -1.4072265625, -0.830810546875, -0.25439453125, 0.322021484375, 0.8984375, 1.474853515625, 2.05126953125, 2.627685546875, 3.2041015625, 3.780517578125, 4.35693359375, 4.933349609375, 5.509765625, 6.086181640625, 6.66259765625, 7.239013671875, 7.8154296875, 8.391845703125, 8.96826171875, 9.544677734375, 10.12109375, 10.697509765625, 11.27392578125, 11.850341796875, 12.4267578125, 13.003173828125, 13.57958984375, 14.156005859375, 14.732421875, 15.308837890625, 15.88525390625, 16.461669921875, 17.0380859375, 17.614501953125, 18.19091796875, 18.767333984375, 19.34375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 4.0, 8.0, 7.0, 16.0, 19.0, 35.0, 79.0, 253.0, 3338.0, 169.0, 69.0, 28.0, 23.0, 9.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76171875, -5.578125, -5.39453125, -5.2109375, -5.02734375, -4.84375, -4.66015625, -4.4765625, -4.29296875, -4.109375, -3.92578125, -3.7421875, -3.55859375, -3.375, -3.19140625, -3.0078125, -2.82421875, -2.640625, -2.45703125, -2.2734375, -2.08984375, -1.90625, -1.72265625, -1.5390625, -1.35546875, -1.171875, -0.98828125, -0.8046875, -0.62109375, -0.4375, -0.25390625, -0.0703125, 0.11328125, 0.296875, 0.48046875, 0.6640625, 0.84765625, 1.03125, 1.21484375, 1.3984375, 1.58203125, 1.765625, 1.94921875, 2.1328125, 2.31640625, 2.5, 2.68359375, 2.8671875, 3.05078125, 3.234375, 3.41796875, 3.6015625, 3.78515625, 3.96875, 4.15234375, 4.3359375, 4.51953125, 4.703125, 4.88671875, 5.0703125, 5.25390625, 5.4375, 5.62109375, 5.8046875, 5.98828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 10.0, 35.0, 78.0, 192.0, 302.0, 229.0, 112.0, 23.0, 12.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.132436752319336, -24.480453491210938, -22.828472137451172, -21.176488876342773, -19.524505615234375, -17.872522354125977, -16.220539093017578, -14.568557739257812, -12.916574478149414, -11.264591217041016, -9.612608909606934, -7.960626125335693, -6.308643341064453, -4.656660079956055, -3.0046777725219727, -1.3526954650878906, 0.2992877960205078, 1.951270580291748, 3.6032533645629883, 5.2552361488342285, 6.907218933105469, 8.559202194213867, 10.21118450164795, 11.863166809082031, 13.51515007019043, 15.167133331298828, 16.819114685058594, 18.471097946166992, 20.12308120727539, 21.77506446838379, 23.427047729492188, 25.079029083251953, 26.73101043701172, 28.382993698120117, 30.034976959228516, 31.68695831298828, 33.33894348144531, 34.99092483520508, 36.642906188964844, 38.294891357421875, 39.94687271118164, 41.598854064941406, 43.25083923339844, 44.9028205871582, 46.55480194091797, 48.206787109375, 49.858768463134766, 51.51074981689453, 53.16273498535156, 54.81471633911133, 56.46670150756836, 58.118682861328125, 59.770668029785156, 61.42264938354492, 63.07463073730469, 64.72661590576172, 66.37860107421875, 68.03058624267578, 69.68256378173828, 71.33454895019531, 72.98653411865234, 74.63851928710938, 76.29049682617188, 77.9424819946289, 79.5944595336914]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 11.0, 16.0, 14.0, 12.0, 23.0, 9.0, 14.0, 16.0, 23.0, 21.0, 24.0, 22.0, 29.0, 36.0, 37.0, 45.0, 41.0, 42.0, 44.0, 38.0, 33.0, 55.0, 39.0, 35.0, 27.0, 29.0, 38.0, 32.0, 20.0, 21.0, 26.0, 14.0, 25.0, 25.0, 15.0, 12.0, 13.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.527572631835938, -11.191959381103516, -10.856346130371094, -10.520732879638672, -10.18511962890625, -9.849506378173828, -9.513893127441406, -9.178279876708984, -8.842666625976562, -8.50705337524414, -8.171440124511719, -7.835826873779297, -7.500213623046875, -7.164600372314453, -6.828987121582031, -6.493373870849609, -6.157760143280029, -5.822146892547607, -5.4865336418151855, -5.150920391082764, -4.815307140350342, -4.47969388961792, -4.14408016204834, -3.808467149734497, -3.472853899002075, -3.1372406482696533, -2.8016273975372314, -2.4660139083862305, -2.1304006576538086, -1.7947875261306763, -1.4591741561889648, -1.123560905456543, -0.7879476547241211, -0.45233437418937683, -0.11672109365463257, 0.21889221668243408, 0.554505467414856, 0.8901187181472778, 1.2257320880889893, 1.5613453388214111, 1.896958589553833, 2.232571840286255, 2.5681850910186768, 2.9037985801696777, 3.2394118309020996, 3.5750250816345215, 3.9106383323669434, 4.246251583099365, 4.581864833831787, 4.917478084564209, 5.253091335296631, 5.588704586029053, 5.924317836761475, 6.2599310874938965, 6.595544815063477, 6.931158065795898, 7.26677131652832, 7.602384567260742, 7.937997817993164, 8.273611068725586, 8.609224319458008, 8.94483757019043, 9.280450820922852, 9.616064071655273, 9.951677322387695]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 7.0, 4.0, 17.0, 21.0, 41.0, 47.0, 81.0, 160.0, 251.0, 461.0, 1019.0, 2788.0, 8815.0, 33563.0, 142130.0, 447799.0, 307244.0, 76930.0, 18460.0, 5159.0, 1854.0, 809.0, 357.0, 196.0, 108.0, 66.0, 41.0, 38.0, 31.0, 22.0, 5.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.6474609375, -14.138671875, -13.6298828125, -13.12109375, -12.6123046875, -12.103515625, -11.5947265625, -11.0859375, -10.5771484375, -10.068359375, -9.5595703125, -9.05078125, -8.5419921875, -8.033203125, -7.5244140625, -7.015625, -6.5068359375, -5.998046875, -5.4892578125, -4.98046875, -4.4716796875, -3.962890625, -3.4541015625, -2.9453125, -2.4365234375, -1.927734375, -1.4189453125, -0.91015625, -0.4013671875, 0.107421875, 0.6162109375, 1.125, 1.6337890625, 2.142578125, 2.6513671875, 3.16015625, 3.6689453125, 4.177734375, 4.6865234375, 5.1953125, 5.7041015625, 6.212890625, 6.7216796875, 7.23046875, 7.7392578125, 8.248046875, 8.7568359375, 9.265625, 9.7744140625, 10.283203125, 10.7919921875, 11.30078125, 11.8095703125, 12.318359375, 12.8271484375, 13.3359375, 13.8447265625, 14.353515625, 14.8623046875, 15.37109375, 15.8798828125, 16.388671875, 16.8974609375, 17.40625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 8.0, 7.0, 3.0, 7.0, 13.0, 6.0, 19.0, 19.0, 33.0, 37.0, 30.0, 42.0, 33.0, 45.0, 61.0, 47.0, 55.0, 59.0, 57.0, 48.0, 45.0, 37.0, 45.0, 43.0, 33.0, 23.0, 33.0, 18.0, 22.0, 15.0, 16.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0], "bins": [-6.5546875, -6.37615966796875, -6.1976318359375, -6.01910400390625, -5.840576171875, -5.66204833984375, -5.4835205078125, -5.30499267578125, -5.12646484375, -4.94793701171875, -4.7694091796875, -4.59088134765625, -4.412353515625, -4.23382568359375, -4.0552978515625, -3.87677001953125, -3.6982421875, -3.51971435546875, -3.3411865234375, -3.16265869140625, -2.984130859375, -2.80560302734375, -2.6270751953125, -2.44854736328125, -2.27001953125, -2.09149169921875, -1.9129638671875, -1.73443603515625, -1.555908203125, -1.37738037109375, -1.1988525390625, -1.02032470703125, -0.841796875, -0.66326904296875, -0.4847412109375, -0.30621337890625, -0.127685546875, 0.05084228515625, 0.2293701171875, 0.40789794921875, 0.58642578125, 0.76495361328125, 0.9434814453125, 1.12200927734375, 1.300537109375, 1.47906494140625, 1.6575927734375, 1.83612060546875, 2.0146484375, 2.19317626953125, 2.3717041015625, 2.55023193359375, 2.728759765625, 2.90728759765625, 3.0858154296875, 3.26434326171875, 3.44287109375, 3.62139892578125, 3.7999267578125, 3.97845458984375, 4.156982421875, 4.33551025390625, 4.5140380859375, 4.69256591796875, 4.87109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 6.0, 10.0, 16.0, 17.0, 19.0, 42.0, 52.0, 79.0, 117.0, 161.0, 216.0, 286.0, 452.0, 664.0, 1201.0, 2790.0, 13694.0, 189636.0, 769256.0, 58729.0, 6528.0, 1866.0, 899.0, 590.0, 357.0, 252.0, 162.0, 143.0, 89.0, 69.0, 43.0, 38.0, 25.0, 11.0, 17.0, 10.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.125, -21.25048828125, -20.3759765625, -19.50146484375, -18.626953125, -17.75244140625, -16.8779296875, -16.00341796875, -15.12890625, -14.25439453125, -13.3798828125, -12.50537109375, -11.630859375, -10.75634765625, -9.8818359375, -9.00732421875, -8.1328125, -7.25830078125, -6.3837890625, -5.50927734375, -4.634765625, -3.76025390625, -2.8857421875, -2.01123046875, -1.13671875, -0.26220703125, 0.6123046875, 1.48681640625, 2.361328125, 3.23583984375, 4.1103515625, 4.98486328125, 5.859375, 6.73388671875, 7.6083984375, 8.48291015625, 9.357421875, 10.23193359375, 11.1064453125, 11.98095703125, 12.85546875, 13.72998046875, 14.6044921875, 15.47900390625, 16.353515625, 17.22802734375, 18.1025390625, 18.97705078125, 19.8515625, 20.72607421875, 21.6005859375, 22.47509765625, 23.349609375, 24.22412109375, 25.0986328125, 25.97314453125, 26.84765625, 27.72216796875, 28.5966796875, 29.47119140625, 30.345703125, 31.22021484375, 32.0947265625, 32.96923828125, 33.84375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 3.0, 5.0, 9.0, 17.0, 14.0, 22.0, 23.0, 16.0, 28.0, 29.0, 36.0, 38.0, 44.0, 43.0, 64.0, 40.0, 46.0, 42.0, 51.0, 52.0, 44.0, 38.0, 43.0, 38.0, 25.0, 30.0, 27.0, 22.0, 14.0, 17.0, 16.0, 13.0, 8.0, 6.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-23.515625, -22.7724609375, -22.029296875, -21.2861328125, -20.54296875, -19.7998046875, -19.056640625, -18.3134765625, -17.5703125, -16.8271484375, -16.083984375, -15.3408203125, -14.59765625, -13.8544921875, -13.111328125, -12.3681640625, -11.625, -10.8818359375, -10.138671875, -9.3955078125, -8.65234375, -7.9091796875, -7.166015625, -6.4228515625, -5.6796875, -4.9365234375, -4.193359375, -3.4501953125, -2.70703125, -1.9638671875, -1.220703125, -0.4775390625, 0.265625, 1.0087890625, 1.751953125, 2.4951171875, 3.23828125, 3.9814453125, 4.724609375, 5.4677734375, 6.2109375, 6.9541015625, 7.697265625, 8.4404296875, 9.18359375, 9.9267578125, 10.669921875, 11.4130859375, 12.15625, 12.8994140625, 13.642578125, 14.3857421875, 15.12890625, 15.8720703125, 16.615234375, 17.3583984375, 18.1015625, 18.8447265625, 19.587890625, 20.3310546875, 21.07421875, 21.8173828125, 22.560546875, 23.3037109375, 24.046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 6.0, 3.0, 3.0, 10.0, 9.0, 7.0, 8.0, 9.0, 16.0, 16.0, 17.0, 20.0, 38.0, 56.0, 104.0, 185.0, 357.0, 803.0, 4056.0, 126993.0, 897667.0, 15387.0, 1637.0, 526.0, 209.0, 123.0, 79.0, 56.0, 38.0, 30.0, 14.0, 14.0, 16.0, 10.0, 4.0, 6.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.484375, -24.694091796875, -23.90380859375, -23.113525390625, -22.3232421875, -21.532958984375, -20.74267578125, -19.952392578125, -19.162109375, -18.371826171875, -17.58154296875, -16.791259765625, -16.0009765625, -15.210693359375, -14.42041015625, -13.630126953125, -12.83984375, -12.049560546875, -11.25927734375, -10.468994140625, -9.6787109375, -8.888427734375, -8.09814453125, -7.307861328125, -6.517578125, -5.727294921875, -4.93701171875, -4.146728515625, -3.3564453125, -2.566162109375, -1.77587890625, -0.985595703125, -0.1953125, 0.594970703125, 1.38525390625, 2.175537109375, 2.9658203125, 3.756103515625, 4.54638671875, 5.336669921875, 6.126953125, 6.917236328125, 7.70751953125, 8.497802734375, 9.2880859375, 10.078369140625, 10.86865234375, 11.658935546875, 12.44921875, 13.239501953125, 14.02978515625, 14.820068359375, 15.6103515625, 16.400634765625, 17.19091796875, 17.981201171875, 18.771484375, 19.561767578125, 20.35205078125, 21.142333984375, 21.9326171875, 22.722900390625, 23.51318359375, 24.303466796875, 25.09375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 9.0, 4.0, 3.0, 21.0, 19.0, 27.0, 24.0, 30.0, 40.0, 57.0, 71.0, 100.0, 93.0, 89.0, 75.0, 61.0, 39.0, 35.0, 31.0, 31.0, 18.0, 19.0, 13.0, 20.0, 10.0, 12.0, 1.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.0012960433959960938, -0.0012586414813995361, -0.0012212395668029785, -0.001183837652206421, -0.0011464357376098633, -0.0011090338230133057, -0.001071631908416748, -0.0010342299938201904, -0.0009968280792236328, -0.0009594261646270752, -0.0009220242500305176, -0.00088462233543396, -0.0008472204208374023, -0.0008098185062408447, -0.0007724165916442871, -0.0007350146770477295, -0.0006976127624511719, -0.0006602108478546143, -0.0006228089332580566, -0.000585407018661499, -0.0005480051040649414, -0.0005106031894683838, -0.00047320127487182617, -0.00043579936027526855, -0.00039839744567871094, -0.0003609955310821533, -0.0003235936164855957, -0.0002861917018890381, -0.00024878978729248047, -0.00021138787269592285, -0.00017398595809936523, -0.00013658404350280762, -9.918212890625e-05, -6.178021430969238e-05, -2.4378299713134766e-05, 1.3023614883422852e-05, 5.042552947998047e-05, 8.782744407653809e-05, 0.0001252293586730957, 0.00016263127326965332, 0.00020003318786621094, 0.00023743510246276855, 0.00027483701705932617, 0.0003122389316558838, 0.0003496408462524414, 0.000387042760848999, 0.00042444467544555664, 0.00046184659004211426, 0.0004992485046386719, 0.0005366504192352295, 0.0005740523338317871, 0.0006114542484283447, 0.0006488561630249023, 0.00068625807762146, 0.0007236599922180176, 0.0007610619068145752, 0.0007984638214111328, 0.0008358657360076904, 0.000873267650604248, 0.0009106695652008057, 0.0009480714797973633, 0.000985473394393921, 0.0010228753089904785, 0.0010602772235870361, 0.0010976791381835938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 3.0, 10.0, 14.0, 25.0, 36.0, 46.0, 98.0, 165.0, 297.0, 562.0, 1311.0, 4644.0, 43848.0, 851379.0, 133982.0, 8484.0, 1951.0, 804.0, 367.0, 200.0, 117.0, 76.0, 36.0, 22.0, 15.0, 12.0, 12.0, 6.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.734375, -21.125, -20.515625, -19.90625, -19.296875, -18.6875, -18.078125, -17.46875, -16.859375, -16.25, -15.640625, -15.03125, -14.421875, -13.8125, -13.203125, -12.59375, -11.984375, -11.375, -10.765625, -10.15625, -9.546875, -8.9375, -8.328125, -7.71875, -7.109375, -6.5, -5.890625, -5.28125, -4.671875, -4.0625, -3.453125, -2.84375, -2.234375, -1.625, -1.015625, -0.40625, 0.203125, 0.8125, 1.421875, 2.03125, 2.640625, 3.25, 3.859375, 4.46875, 5.078125, 5.6875, 6.296875, 6.90625, 7.515625, 8.125, 8.734375, 9.34375, 9.953125, 10.5625, 11.171875, 11.78125, 12.390625, 13.0, 13.609375, 14.21875, 14.828125, 15.4375, 16.046875, 16.65625, 17.265625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 10.0, 16.0, 27.0, 34.0, 51.0, 60.0, 123.0, 158.0, 168.0, 124.0, 78.0, 47.0, 36.0, 23.0, 16.0, 11.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.59375, -13.053466796875, -12.51318359375, -11.972900390625, -11.4326171875, -10.892333984375, -10.35205078125, -9.811767578125, -9.271484375, -8.731201171875, -8.19091796875, -7.650634765625, -7.1103515625, -6.570068359375, -6.02978515625, -5.489501953125, -4.94921875, -4.408935546875, -3.86865234375, -3.328369140625, -2.7880859375, -2.247802734375, -1.70751953125, -1.167236328125, -0.626953125, -0.086669921875, 0.45361328125, 0.993896484375, 1.5341796875, 2.074462890625, 2.61474609375, 3.155029296875, 3.6953125, 4.235595703125, 4.77587890625, 5.316162109375, 5.8564453125, 6.396728515625, 6.93701171875, 7.477294921875, 8.017578125, 8.557861328125, 9.09814453125, 9.638427734375, 10.1787109375, 10.718994140625, 11.25927734375, 11.799560546875, 12.33984375, 12.880126953125, 13.42041015625, 13.960693359375, 14.5009765625, 15.041259765625, 15.58154296875, 16.121826171875, 16.662109375, 17.202392578125, 17.74267578125, 18.282958984375, 18.8232421875, 19.363525390625, 19.90380859375, 20.444091796875, 20.984375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 42.0, 196.0, 406.0, 268.0, 63.0, 9.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-594.6671142578125, -580.3751831054688, -566.083251953125, -551.791259765625, -537.4993286132812, -523.2073974609375, -508.91546630859375, -494.6235046386719, -480.33154296875, -466.03961181640625, -451.7476501464844, -437.4557189941406, -423.16375732421875, -408.871826171875, -394.57989501953125, -380.2879333496094, -365.9960021972656, -351.7040710449219, -337.412109375, -323.12017822265625, -308.8282165527344, -294.5362854003906, -280.24432373046875, -265.952392578125, -251.6604461669922, -237.36849975585938, -223.07655334472656, -208.78460693359375, -194.49267578125, -180.20071411132812, -165.90878295898438, -151.61683654785156, -137.32485961914062, -123.03291320800781, -108.740966796875, -94.44902801513672, -80.1570816040039, -65.8651351928711, -51.57319641113281, -37.28125, -22.989303588867188, -8.697359085083008, 5.594585418701172, 19.88652801513672, 34.17847442626953, 48.470420837402344, 62.762359619140625, 77.05430603027344, 91.34625244140625, 105.63819885253906, 119.93014526367188, 134.22207641601562, 148.5140380859375, 162.80596923828125, 177.09791564941406, 191.38986206054688, 205.6818084716797, 219.9737548828125, 234.2657012939453, 248.55764770507812, 262.8495788574219, 277.14154052734375, 291.4334716796875, 305.72540283203125, 320.0173645019531]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 12.0, 16.0, 17.0, 12.0, 13.0, 25.0, 20.0, 31.0, 35.0, 24.0, 40.0, 44.0, 41.0, 38.0, 45.0, 41.0, 52.0, 50.0, 36.0, 48.0, 33.0, 43.0, 43.0, 32.0, 25.0, 23.0, 25.0, 21.0, 20.0, 13.0, 9.0, 8.0, 12.0, 3.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.62222290039062, -95.3524169921875, -92.08261108398438, -88.81279754638672, -85.5429916381836, -82.27318572998047, -79.00337982177734, -75.73356628417969, -72.46376037597656, -69.19395446777344, -65.92414855957031, -62.65433883666992, -59.38452911376953, -56.114723205566406, -52.84491729736328, -49.57510757446289, -46.305301666259766, -43.03549575805664, -39.76568603515625, -36.495880126953125, -33.226070404052734, -29.95626449584961, -26.68645668029785, -23.416648864746094, -20.146841049194336, -16.877033233642578, -13.60722541809082, -10.337418556213379, -7.067610740661621, -3.7978038787841797, -0.5279960632324219, 2.741811752319336, 6.011619567871094, 9.281427383422852, 12.55123519897461, 15.82104206085205, 19.090850830078125, 22.36065673828125, 25.630464553833008, 28.900272369384766, 32.170082092285156, 35.43988800048828, 38.70969772338867, 41.9795036315918, 45.24931335449219, 48.51911926269531, 51.78892517089844, 55.05873489379883, 58.32854080200195, 61.59834671020508, 64.86815643310547, 68.1379623413086, 71.40776824951172, 74.67758178710938, 77.9473876953125, 81.21719360351562, 84.48699951171875, 87.75680541992188, 91.026611328125, 94.29642486572266, 97.56623077392578, 100.8360366821289, 104.10584259033203, 107.37565612792969, 110.64546203613281]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 11.0, 13.0, 16.0, 31.0, 44.0, 73.0, 123.0, 208.0, 368.0, 684.0, 1526.0, 3486.0, 9732.0, 43435.0, 3771377.0, 324038.0, 26608.0, 7176.0, 2696.0, 1208.0, 591.0, 317.0, 203.0, 104.0, 69.0, 44.0, 31.0, 13.0, 15.0, 12.0, 9.0, 2.0, 6.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.078125, -24.31494140625, -23.5517578125, -22.78857421875, -22.025390625, -21.26220703125, -20.4990234375, -19.73583984375, -18.97265625, -18.20947265625, -17.4462890625, -16.68310546875, -15.919921875, -15.15673828125, -14.3935546875, -13.63037109375, -12.8671875, -12.10400390625, -11.3408203125, -10.57763671875, -9.814453125, -9.05126953125, -8.2880859375, -7.52490234375, -6.76171875, -5.99853515625, -5.2353515625, -4.47216796875, -3.708984375, -2.94580078125, -2.1826171875, -1.41943359375, -0.65625, 0.10693359375, 0.8701171875, 1.63330078125, 2.396484375, 3.15966796875, 3.9228515625, 4.68603515625, 5.44921875, 6.21240234375, 6.9755859375, 7.73876953125, 8.501953125, 9.26513671875, 10.0283203125, 10.79150390625, 11.5546875, 12.31787109375, 13.0810546875, 13.84423828125, 14.607421875, 15.37060546875, 16.1337890625, 16.89697265625, 17.66015625, 18.42333984375, 19.1865234375, 19.94970703125, 20.712890625, 21.47607421875, 22.2392578125, 23.00244140625, 23.765625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 11.0, 10.0, 14.0, 18.0, 30.0, 37.0, 53.0, 50.0, 62.0, 72.0, 74.0, 82.0, 72.0, 78.0, 65.0, 53.0, 49.0, 47.0, 26.0, 17.0, 22.0, 12.0, 12.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.36566162109375, -7.1180419921875, -6.87042236328125, -6.622802734375, -6.37518310546875, -6.1275634765625, -5.87994384765625, -5.63232421875, -5.38470458984375, -5.1370849609375, -4.88946533203125, -4.641845703125, -4.39422607421875, -4.1466064453125, -3.89898681640625, -3.6513671875, -3.40374755859375, -3.1561279296875, -2.90850830078125, -2.660888671875, -2.41326904296875, -2.1656494140625, -1.91802978515625, -1.67041015625, -1.42279052734375, -1.1751708984375, -0.92755126953125, -0.679931640625, -0.43231201171875, -0.1846923828125, 0.06292724609375, 0.310546875, 0.55816650390625, 0.8057861328125, 1.05340576171875, 1.301025390625, 1.54864501953125, 1.7962646484375, 2.04388427734375, 2.29150390625, 2.53912353515625, 2.7867431640625, 3.03436279296875, 3.281982421875, 3.52960205078125, 3.7772216796875, 4.02484130859375, 4.2724609375, 4.52008056640625, 4.7677001953125, 5.01531982421875, 5.262939453125, 5.51055908203125, 5.7581787109375, 6.00579833984375, 6.25341796875, 6.50103759765625, 6.7486572265625, 6.99627685546875, 7.243896484375, 7.49151611328125, 7.7391357421875, 7.98675537109375, 8.234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 11.0, 12.0, 13.0, 10.0, 33.0, 37.0, 63.0, 98.0, 124.0, 202.0, 324.0, 470.0, 725.0, 1270.0, 2251.0, 4501.0, 9980.0, 27988.0, 131674.0, 3771402.0, 187312.0, 33414.0, 11329.0, 4914.0, 2395.0, 1456.0, 829.0, 488.0, 324.0, 203.0, 113.0, 89.0, 74.0, 46.0, 28.0, 25.0, 13.0, 11.0, 13.0, 10.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.46142578125, -12.0400390625, -11.61865234375, -11.197265625, -10.77587890625, -10.3544921875, -9.93310546875, -9.51171875, -9.09033203125, -8.6689453125, -8.24755859375, -7.826171875, -7.40478515625, -6.9833984375, -6.56201171875, -6.140625, -5.71923828125, -5.2978515625, -4.87646484375, -4.455078125, -4.03369140625, -3.6123046875, -3.19091796875, -2.76953125, -2.34814453125, -1.9267578125, -1.50537109375, -1.083984375, -0.66259765625, -0.2412109375, 0.18017578125, 0.6015625, 1.02294921875, 1.4443359375, 1.86572265625, 2.287109375, 2.70849609375, 3.1298828125, 3.55126953125, 3.97265625, 4.39404296875, 4.8154296875, 5.23681640625, 5.658203125, 6.07958984375, 6.5009765625, 6.92236328125, 7.34375, 7.76513671875, 8.1865234375, 8.60791015625, 9.029296875, 9.45068359375, 9.8720703125, 10.29345703125, 10.71484375, 11.13623046875, 11.5576171875, 11.97900390625, 12.400390625, 12.82177734375, 13.2431640625, 13.66455078125, 14.0859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 13.0, 19.0, 28.0, 33.0, 87.0, 248.0, 2590.0, 675.0, 168.0, 63.0, 52.0, 26.0, 21.0, 14.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.00390625, -6.76104736328125, -6.5181884765625, -6.27532958984375, -6.032470703125, -5.78961181640625, -5.5467529296875, -5.30389404296875, -5.06103515625, -4.81817626953125, -4.5753173828125, -4.33245849609375, -4.089599609375, -3.84674072265625, -3.6038818359375, -3.36102294921875, -3.1181640625, -2.87530517578125, -2.6324462890625, -2.38958740234375, -2.146728515625, -1.90386962890625, -1.6610107421875, -1.41815185546875, -1.17529296875, -0.93243408203125, -0.6895751953125, -0.44671630859375, -0.203857421875, 0.03900146484375, 0.2818603515625, 0.52471923828125, 0.767578125, 1.01043701171875, 1.2532958984375, 1.49615478515625, 1.739013671875, 1.98187255859375, 2.2247314453125, 2.46759033203125, 2.71044921875, 2.95330810546875, 3.1961669921875, 3.43902587890625, 3.681884765625, 3.92474365234375, 4.1676025390625, 4.41046142578125, 4.6533203125, 4.89617919921875, 5.1390380859375, 5.38189697265625, 5.624755859375, 5.86761474609375, 6.1104736328125, 6.35333251953125, 6.59619140625, 6.83905029296875, 7.0819091796875, 7.32476806640625, 7.567626953125, 7.81048583984375, 8.0533447265625, 8.29620361328125, 8.5390625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 7.0, 4.0, 5.0, 13.0, 23.0, 37.0, 68.0, 82.0, 101.0, 127.0, 153.0, 100.0, 101.0, 59.0, 39.0, 30.0, 21.0, 14.0, 6.0, 9.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.00275421142578, -17.037540435791016, -16.07232666015625, -15.1071138381958, -14.141900062561035, -13.17668628692627, -12.21147346496582, -11.246259689331055, -10.281045913696289, -9.315832138061523, -8.350618362426758, -7.385405540466309, -6.420191764831543, -5.454977989196777, -4.48976469039917, -3.5245513916015625, -2.559337615966797, -1.5941240787506104, -0.6289105415344238, 0.3363029956817627, 1.3015165328979492, 2.266730308532715, 3.2319436073303223, 4.19715690612793, 5.162370681762695, 6.127584457397461, 7.092797756195068, 8.058011054992676, 9.023224830627441, 9.988438606262207, 10.953651428222656, 11.918865203857422, 12.884078979492188, 13.849292755126953, 14.814506530761719, 15.779719352722168, 16.74493408203125, 17.710147857666016, 18.67535972595215, 19.640573501586914, 20.60578727722168, 21.571001052856445, 22.53621482849121, 23.501428604125977, 24.46664047241211, 25.431854248046875, 26.39706802368164, 27.362281799316406, 28.327495574951172, 29.292709350585938, 30.257923126220703, 31.22313690185547, 32.188350677490234, 33.153564453125, 34.118778228759766, 35.08399200439453, 36.04920196533203, 37.0144157409668, 37.97962951660156, 38.94484329223633, 39.910057067871094, 40.87527084350586, 41.840484619140625, 42.805694580078125, 43.770912170410156]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 2.0, 5.0, 9.0, 4.0, 9.0, 13.0, 23.0, 18.0, 24.0, 15.0, 33.0, 25.0, 33.0, 30.0, 37.0, 32.0, 30.0, 25.0, 40.0, 53.0, 56.0, 50.0, 42.0, 41.0, 48.0, 35.0, 29.0, 21.0, 24.0, 24.0, 24.0, 27.0, 21.0, 23.0, 13.0, 17.0, 10.0, 7.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.932306289672852, -12.515914916992188, -12.099523544311523, -11.68313217163086, -11.266739845275879, -10.850348472595215, -10.43395709991455, -10.017565727233887, -9.601173400878906, -9.184782028198242, -8.768390655517578, -8.351999282836914, -7.935606956481934, -7.5192155838012695, -7.1028242111206055, -6.686432838439941, -6.270041465759277, -5.853650093078613, -5.437258243560791, -5.020866870880127, -4.604475021362305, -4.188083648681641, -3.7716922760009766, -3.3553006649017334, -2.9389090538024902, -2.522517442703247, -2.106125831604004, -1.6897344589233398, -1.2733428478240967, -0.8569512367248535, -0.44055986404418945, -0.02416825294494629, 0.3922233581542969, 0.8086149096488953, 1.2250064611434937, 1.6413979530334473, 2.0577895641326904, 2.4741811752319336, 2.8905725479125977, 3.306964159011841, 3.723355770111084, 4.139747142791748, 4.55613899230957, 4.972530364990234, 5.388921737670898, 5.805313587188721, 6.221704959869385, 6.638096809387207, 7.054488182067871, 7.470879554748535, 7.887271404266357, 8.30366325378418, 8.720054626464844, 9.136445999145508, 9.552837371826172, 9.969228744506836, 10.3856201171875, 10.802011489868164, 11.218402862548828, 11.634794235229492, 12.051186561584473, 12.467577934265137, 12.8839693069458, 13.300360679626465, 13.716753005981445]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 10.0, 11.0, 15.0, 18.0, 20.0, 51.0, 90.0, 121.0, 244.0, 411.0, 792.0, 1816.0, 4240.0, 11600.0, 37067.0, 129310.0, 406521.0, 319418.0, 94755.0, 27179.0, 8660.0, 3298.0, 1367.0, 682.0, 372.0, 192.0, 104.0, 73.0, 42.0, 30.0, 13.0, 7.0, 11.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4140625, -14.8404541015625, -14.266845703125, -13.6932373046875, -13.11962890625, -12.5460205078125, -11.972412109375, -11.3988037109375, -10.8251953125, -10.2515869140625, -9.677978515625, -9.1043701171875, -8.53076171875, -7.9571533203125, -7.383544921875, -6.8099365234375, -6.236328125, -5.6627197265625, -5.089111328125, -4.5155029296875, -3.94189453125, -3.3682861328125, -2.794677734375, -2.2210693359375, -1.6474609375, -1.0738525390625, -0.500244140625, 0.0733642578125, 0.64697265625, 1.2205810546875, 1.794189453125, 2.3677978515625, 2.94140625, 3.5150146484375, 4.088623046875, 4.6622314453125, 5.23583984375, 5.8094482421875, 6.383056640625, 6.9566650390625, 7.5302734375, 8.1038818359375, 8.677490234375, 9.2510986328125, 9.82470703125, 10.3983154296875, 10.971923828125, 11.5455322265625, 12.119140625, 12.6927490234375, 13.266357421875, 13.8399658203125, 14.41357421875, 14.9871826171875, 15.560791015625, 16.1343994140625, 16.7080078125, 17.2816162109375, 17.855224609375, 18.4288330078125, 19.00244140625, 19.5760498046875, 20.149658203125, 20.7232666015625, 21.296875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 2.0, 8.0, 10.0, 6.0, 17.0, 33.0, 34.0, 51.0, 47.0, 51.0, 82.0, 75.0, 80.0, 71.0, 76.0, 73.0, 59.0, 47.0, 43.0, 31.0, 31.0, 20.0, 16.0, 9.0, 10.0, 4.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.9854736328125, -7.728759765625, -7.4720458984375, -7.21533203125, -6.9586181640625, -6.701904296875, -6.4451904296875, -6.1884765625, -5.9317626953125, -5.675048828125, -5.4183349609375, -5.16162109375, -4.9049072265625, -4.648193359375, -4.3914794921875, -4.134765625, -3.8780517578125, -3.621337890625, -3.3646240234375, -3.10791015625, -2.8511962890625, -2.594482421875, -2.3377685546875, -2.0810546875, -1.8243408203125, -1.567626953125, -1.3109130859375, -1.05419921875, -0.7974853515625, -0.540771484375, -0.2840576171875, -0.02734375, 0.2293701171875, 0.486083984375, 0.7427978515625, 0.99951171875, 1.2562255859375, 1.512939453125, 1.7696533203125, 2.0263671875, 2.2830810546875, 2.539794921875, 2.7965087890625, 3.05322265625, 3.3099365234375, 3.566650390625, 3.8233642578125, 4.080078125, 4.3367919921875, 4.593505859375, 4.8502197265625, 5.10693359375, 5.3636474609375, 5.620361328125, 5.8770751953125, 6.1337890625, 6.3905029296875, 6.647216796875, 6.9039306640625, 7.16064453125, 7.4173583984375, 7.674072265625, 7.9307861328125, 8.1875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 18.0, 11.0, 28.0, 41.0, 69.0, 89.0, 137.0, 285.0, 615.0, 1597.0, 7916.0, 354026.0, 669276.0, 11116.0, 1836.0, 685.0, 337.0, 200.0, 92.0, 67.0, 22.0, 26.0, 17.0, 14.0, 7.0, 6.0, 3.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.25, -65.57177734375, -63.8935546875, -62.21533203125, -60.537109375, -58.85888671875, -57.1806640625, -55.50244140625, -53.82421875, -52.14599609375, -50.4677734375, -48.78955078125, -47.111328125, -45.43310546875, -43.7548828125, -42.07666015625, -40.3984375, -38.72021484375, -37.0419921875, -35.36376953125, -33.685546875, -32.00732421875, -30.3291015625, -28.65087890625, -26.97265625, -25.29443359375, -23.6162109375, -21.93798828125, -20.259765625, -18.58154296875, -16.9033203125, -15.22509765625, -13.546875, -11.86865234375, -10.1904296875, -8.51220703125, -6.833984375, -5.15576171875, -3.4775390625, -1.79931640625, -0.12109375, 1.55712890625, 3.2353515625, 4.91357421875, 6.591796875, 8.27001953125, 9.9482421875, 11.62646484375, 13.3046875, 14.98291015625, 16.6611328125, 18.33935546875, 20.017578125, 21.69580078125, 23.3740234375, 25.05224609375, 26.73046875, 28.40869140625, 30.0869140625, 31.76513671875, 33.443359375, 35.12158203125, 36.7998046875, 38.47802734375, 40.15625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 9.0, 10.0, 7.0, 10.0, 11.0, 15.0, 18.0, 27.0, 22.0, 45.0, 40.0, 52.0, 46.0, 58.0, 61.0, 59.0, 45.0, 62.0, 46.0, 64.0, 44.0, 47.0, 31.0, 38.0, 32.0, 18.0, 20.0, 10.0, 13.0, 8.0, 11.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.390625, -24.551513671875, -23.71240234375, -22.873291015625, -22.0341796875, -21.195068359375, -20.35595703125, -19.516845703125, -18.677734375, -17.838623046875, -16.99951171875, -16.160400390625, -15.3212890625, -14.482177734375, -13.64306640625, -12.803955078125, -11.96484375, -11.125732421875, -10.28662109375, -9.447509765625, -8.6083984375, -7.769287109375, -6.93017578125, -6.091064453125, -5.251953125, -4.412841796875, -3.57373046875, -2.734619140625, -1.8955078125, -1.056396484375, -0.21728515625, 0.621826171875, 1.4609375, 2.300048828125, 3.13916015625, 3.978271484375, 4.8173828125, 5.656494140625, 6.49560546875, 7.334716796875, 8.173828125, 9.012939453125, 9.85205078125, 10.691162109375, 11.5302734375, 12.369384765625, 13.20849609375, 14.047607421875, 14.88671875, 15.725830078125, 16.56494140625, 17.404052734375, 18.2431640625, 19.082275390625, 19.92138671875, 20.760498046875, 21.599609375, 22.438720703125, 23.27783203125, 24.116943359375, 24.9560546875, 25.795166015625, 26.63427734375, 27.473388671875, 28.3125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 9.0, 17.0, 24.0, 55.0, 95.0, 227.0, 520.0, 1627.0, 8040.0, 118375.0, 861153.0, 51678.0, 4831.0, 1169.0, 385.0, 171.0, 75.0, 42.0, 29.0, 15.0, 14.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.625, -9.128173828125, -8.63134765625, -8.134521484375, -7.6376953125, -7.140869140625, -6.64404296875, -6.147216796875, -5.650390625, -5.153564453125, -4.65673828125, -4.159912109375, -3.6630859375, -3.166259765625, -2.66943359375, -2.172607421875, -1.67578125, -1.178955078125, -0.68212890625, -0.185302734375, 0.3115234375, 0.808349609375, 1.30517578125, 1.802001953125, 2.298828125, 2.795654296875, 3.29248046875, 3.789306640625, 4.2861328125, 4.782958984375, 5.27978515625, 5.776611328125, 6.2734375, 6.770263671875, 7.26708984375, 7.763916015625, 8.2607421875, 8.757568359375, 9.25439453125, 9.751220703125, 10.248046875, 10.744873046875, 11.24169921875, 11.738525390625, 12.2353515625, 12.732177734375, 13.22900390625, 13.725830078125, 14.22265625, 14.719482421875, 15.21630859375, 15.713134765625, 16.2099609375, 16.706787109375, 17.20361328125, 17.700439453125, 18.197265625, 18.694091796875, 19.19091796875, 19.687744140625, 20.1845703125, 20.681396484375, 21.17822265625, 21.675048828125, 22.171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 22.0, 25.0, 30.0, 65.0, 92.0, 168.0, 220.0, 142.0, 96.0, 50.0, 29.0, 17.0, 14.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002590179443359375, -0.0024915337562561035, -0.002392888069152832, -0.0022942423820495605, -0.002195596694946289, -0.0020969510078430176, -0.001998305320739746, -0.0018996596336364746, -0.0018010139465332031, -0.0017023682594299316, -0.0016037225723266602, -0.0015050768852233887, -0.0014064311981201172, -0.0013077855110168457, -0.0012091398239135742, -0.0011104941368103027, -0.0010118484497070312, -0.0009132027626037598, -0.0008145570755004883, -0.0007159113883972168, -0.0006172657012939453, -0.0005186200141906738, -0.00041997432708740234, -0.00032132863998413086, -0.00022268295288085938, -0.0001240372657775879, -2.5391578674316406e-05, 7.325410842895508e-05, 0.00017189979553222656, 0.00027054548263549805, 0.00036919116973876953, 0.000467836856842041, 0.0005664825439453125, 0.000665128231048584, 0.0007637739181518555, 0.000862419605255127, 0.0009610652923583984, 0.00105971097946167, 0.0011583566665649414, 0.0012570023536682129, 0.0013556480407714844, 0.0014542937278747559, 0.0015529394149780273, 0.0016515851020812988, 0.0017502307891845703, 0.0018488764762878418, 0.0019475221633911133, 0.0020461678504943848, 0.0021448135375976562, 0.0022434592247009277, 0.0023421049118041992, 0.0024407505989074707, 0.002539396286010742, 0.0026380419731140137, 0.002736687660217285, 0.0028353333473205566, 0.002933979034423828, 0.0030326247215270996, 0.003131270408630371, 0.0032299160957336426, 0.003328561782836914, 0.0034272074699401855, 0.003525853157043457, 0.0036244988441467285, 0.00372314453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 0.0, 2.0, 6.0, 13.0, 16.0, 9.0, 23.0, 42.0, 50.0, 90.0, 118.0, 227.0, 410.0, 876.0, 2545.0, 12340.0, 151381.0, 808073.0, 61994.0, 6967.0, 1810.0, 711.0, 326.0, 176.0, 102.0, 70.0, 59.0, 39.0, 20.0, 12.0, 10.0, 7.0, 8.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0703125, -12.625, -12.1796875, -11.734375, -11.2890625, -10.84375, -10.3984375, -9.953125, -9.5078125, -9.0625, -8.6171875, -8.171875, -7.7265625, -7.28125, -6.8359375, -6.390625, -5.9453125, -5.5, -5.0546875, -4.609375, -4.1640625, -3.71875, -3.2734375, -2.828125, -2.3828125, -1.9375, -1.4921875, -1.046875, -0.6015625, -0.15625, 0.2890625, 0.734375, 1.1796875, 1.625, 2.0703125, 2.515625, 2.9609375, 3.40625, 3.8515625, 4.296875, 4.7421875, 5.1875, 5.6328125, 6.078125, 6.5234375, 6.96875, 7.4140625, 7.859375, 8.3046875, 8.75, 9.1953125, 9.640625, 10.0859375, 10.53125, 10.9765625, 11.421875, 11.8671875, 12.3125, 12.7578125, 13.203125, 13.6484375, 14.09375, 14.5390625, 14.984375, 15.4296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 7.0, 4.0, 3.0, 4.0, 7.0, 14.0, 12.0, 11.0, 17.0, 27.0, 21.0, 37.0, 41.0, 42.0, 67.0, 96.0, 90.0, 103.0, 80.0, 73.0, 49.0, 41.0, 30.0, 26.0, 24.0, 17.0, 11.0, 13.0, 5.0, 9.0, 12.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.68731689453125, -5.4410400390625, -5.19476318359375, -4.948486328125, -4.70220947265625, -4.4559326171875, -4.20965576171875, -3.96337890625, -3.71710205078125, -3.4708251953125, -3.22454833984375, -2.978271484375, -2.73199462890625, -2.4857177734375, -2.23944091796875, -1.9931640625, -1.74688720703125, -1.5006103515625, -1.25433349609375, -1.008056640625, -0.76177978515625, -0.5155029296875, -0.26922607421875, -0.02294921875, 0.22332763671875, 0.4696044921875, 0.71588134765625, 0.962158203125, 1.20843505859375, 1.4547119140625, 1.70098876953125, 1.947265625, 2.19354248046875, 2.4398193359375, 2.68609619140625, 2.932373046875, 3.17864990234375, 3.4249267578125, 3.67120361328125, 3.91748046875, 4.16375732421875, 4.4100341796875, 4.65631103515625, 4.902587890625, 5.14886474609375, 5.3951416015625, 5.64141845703125, 5.8876953125, 6.13397216796875, 6.3802490234375, 6.62652587890625, 6.872802734375, 7.11907958984375, 7.3653564453125, 7.61163330078125, 7.85791015625, 8.10418701171875, 8.3504638671875, 8.59674072265625, 8.843017578125, 9.08929443359375, 9.3355712890625, 9.58184814453125, 9.828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 7.0, 12.0, 16.0, 36.0, 60.0, 111.0, 159.0, 161.0, 157.0, 129.0, 74.0, 28.0, 20.0, 17.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.7603759765625, -159.92202758789062, -154.08367919921875, -148.24534606933594, -142.40699768066406, -136.5686492919922, -130.7303009033203, -124.89196014404297, -119.05361938476562, -113.21527099609375, -107.3769302368164, -101.53858184814453, -95.70024108886719, -89.86189270019531, -84.02354431152344, -78.1852035522461, -72.34685516357422, -66.50850677490234, -60.670166015625, -54.831817626953125, -48.99347686767578, -43.155128479003906, -37.3167839050293, -31.478439331054688, -25.640094757080078, -19.80175018310547, -13.963404655456543, -8.125059127807617, -2.286714553833008, 3.5516300201416016, 9.389976501464844, 15.228321075439453, 21.066665649414062, 26.905010223388672, 32.74335479736328, 38.581703186035156, 44.4200439453125, 50.258392333984375, 56.096736907958984, 61.935081481933594, 67.77342224121094, 73.61177062988281, 79.45011138916016, 85.28845977783203, 91.12680053710938, 96.96514892578125, 102.80349731445312, 108.64183807373047, 114.48018646240234, 120.31853485107422, 126.15687561035156, 131.99522399902344, 137.8335723876953, 143.67190551757812, 149.51025390625, 155.34860229492188, 161.18695068359375, 167.02529907226562, 172.8636474609375, 178.7019805908203, 184.5403289794922, 190.37867736816406, 196.21702575683594, 202.05535888671875, 207.89370727539062]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 7.0, 13.0, 8.0, 17.0, 18.0, 14.0, 14.0, 15.0, 36.0, 23.0, 31.0, 33.0, 42.0, 27.0, 37.0, 61.0, 44.0, 48.0, 59.0, 39.0, 48.0, 46.0, 42.0, 31.0, 36.0, 26.0, 26.0, 21.0, 21.0, 23.0, 14.0, 8.0, 8.0, 10.0, 8.0, 9.0, 9.0, 5.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.928466796875, -86.89380645751953, -83.85914611816406, -80.8244857788086, -77.78982543945312, -74.75516510009766, -71.72050476074219, -68.68584442138672, -65.65118408203125, -62.61652374267578, -59.58186340332031, -56.547203063964844, -53.512542724609375, -50.477882385253906, -47.44322204589844, -44.40856170654297, -41.373905181884766, -38.3392448425293, -35.30458450317383, -32.26992416381836, -29.23526382446289, -26.200603485107422, -23.165945053100586, -20.131284713745117, -17.09662437438965, -14.06196403503418, -11.027303695678711, -7.992644309997559, -4.95798397064209, -1.923323631286621, 1.1113357543945312, 4.14599609375, 7.180656433105469, 10.215316772460938, 13.249977111816406, 16.284637451171875, 19.319297790527344, 22.353958129882812, 25.38861656188965, 28.423276901245117, 31.457937240600586, 34.49259567260742, 37.52725601196289, 40.56191635131836, 43.59657669067383, 46.6312370300293, 49.665897369384766, 52.700557708740234, 55.7352180480957, 58.76987838745117, 61.80453872680664, 64.83919525146484, 67.87385559082031, 70.90851593017578, 73.94317626953125, 76.97783660888672, 80.01249694824219, 83.04715728759766, 86.08181762695312, 89.1164779663086, 92.15113830566406, 95.18579864501953, 98.220458984375, 101.25511932373047, 104.28977966308594]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 6.0, 7.0, 9.0, 16.0, 23.0, 32.0, 41.0, 59.0, 77.0, 141.0, 210.0, 358.0, 592.0, 998.0, 1724.0, 3194.0, 6415.0, 14281.0, 36363.0, 120781.0, 807056.0, 2760203.0, 326489.0, 70209.0, 24095.0, 10104.0, 4705.0, 2523.0, 1371.0, 788.0, 488.0, 311.0, 191.0, 119.0, 86.0, 59.0, 38.0, 32.0, 20.0, 13.0, 6.0, 15.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-9.390625, -9.0806884765625, -8.770751953125, -8.4608154296875, -8.15087890625, -7.8409423828125, -7.531005859375, -7.2210693359375, -6.9111328125, -6.6011962890625, -6.291259765625, -5.9813232421875, -5.67138671875, -5.3614501953125, -5.051513671875, -4.7415771484375, -4.431640625, -4.1217041015625, -3.811767578125, -3.5018310546875, -3.19189453125, -2.8819580078125, -2.572021484375, -2.2620849609375, -1.9521484375, -1.6422119140625, -1.332275390625, -1.0223388671875, -0.71240234375, -0.4024658203125, -0.092529296875, 0.2174072265625, 0.52734375, 0.8372802734375, 1.147216796875, 1.4571533203125, 1.76708984375, 2.0770263671875, 2.386962890625, 2.6968994140625, 3.0068359375, 3.3167724609375, 3.626708984375, 3.9366455078125, 4.24658203125, 4.5565185546875, 4.866455078125, 5.1763916015625, 5.486328125, 5.7962646484375, 6.106201171875, 6.4161376953125, 6.72607421875, 7.0360107421875, 7.345947265625, 7.6558837890625, 7.9658203125, 8.2757568359375, 8.585693359375, 8.8956298828125, 9.20556640625, 9.5155029296875, 9.825439453125, 10.1353759765625, 10.4453125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 12.0, 7.0, 8.0, 10.0, 20.0, 22.0, 23.0, 27.0, 31.0, 49.0, 56.0, 44.0, 52.0, 58.0, 62.0, 62.0, 69.0, 47.0, 56.0, 42.0, 35.0, 36.0, 32.0, 24.0, 29.0, 15.0, 15.0, 8.0, 10.0, 4.0, 8.0, 9.0, 7.0, 0.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.88671875, -5.6990966796875, -5.511474609375, -5.3238525390625, -5.13623046875, -4.9486083984375, -4.760986328125, -4.5733642578125, -4.3857421875, -4.1981201171875, -4.010498046875, -3.8228759765625, -3.63525390625, -3.4476318359375, -3.260009765625, -3.0723876953125, -2.884765625, -2.6971435546875, -2.509521484375, -2.3218994140625, -2.13427734375, -1.9466552734375, -1.759033203125, -1.5714111328125, -1.3837890625, -1.1961669921875, -1.008544921875, -0.8209228515625, -0.63330078125, -0.4456787109375, -0.258056640625, -0.0704345703125, 0.1171875, 0.3048095703125, 0.492431640625, 0.6800537109375, 0.86767578125, 1.0552978515625, 1.242919921875, 1.4305419921875, 1.6181640625, 1.8057861328125, 1.993408203125, 2.1810302734375, 2.36865234375, 2.5562744140625, 2.743896484375, 2.9315185546875, 3.119140625, 3.3067626953125, 3.494384765625, 3.6820068359375, 3.86962890625, 4.0572509765625, 4.244873046875, 4.4324951171875, 4.6201171875, 4.8077392578125, 4.995361328125, 5.1829833984375, 5.37060546875, 5.5582275390625, 5.745849609375, 5.9334716796875, 6.12109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 7.0, 8.0, 8.0, 15.0, 17.0, 44.0, 53.0, 90.0, 190.0, 421.0, 1279.0, 4323.0, 18795.0, 142568.0, 3637602.0, 346968.0, 32064.0, 6854.0, 1888.0, 591.0, 237.0, 99.0, 64.0, 38.0, 15.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1875, -18.517578125, -17.84765625, -17.177734375, -16.5078125, -15.837890625, -15.16796875, -14.498046875, -13.828125, -13.158203125, -12.48828125, -11.818359375, -11.1484375, -10.478515625, -9.80859375, -9.138671875, -8.46875, -7.798828125, -7.12890625, -6.458984375, -5.7890625, -5.119140625, -4.44921875, -3.779296875, -3.109375, -2.439453125, -1.76953125, -1.099609375, -0.4296875, 0.240234375, 0.91015625, 1.580078125, 2.25, 2.919921875, 3.58984375, 4.259765625, 4.9296875, 5.599609375, 6.26953125, 6.939453125, 7.609375, 8.279296875, 8.94921875, 9.619140625, 10.2890625, 10.958984375, 11.62890625, 12.298828125, 12.96875, 13.638671875, 14.30859375, 14.978515625, 15.6484375, 16.318359375, 16.98828125, 17.658203125, 18.328125, 18.998046875, 19.66796875, 20.337890625, 21.0078125, 21.677734375, 22.34765625, 23.017578125, 23.6875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 5.0, 15.0, 13.0, 12.0, 27.0, 29.0, 52.0, 72.0, 123.0, 203.0, 354.0, 658.0, 875.0, 596.0, 342.0, 200.0, 141.0, 90.0, 46.0, 49.0, 29.0, 25.0, 22.0, 11.0, 13.0, 12.0, 6.0, 3.0, 9.0, 7.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-13.953125, -13.5479736328125, -13.142822265625, -12.7376708984375, -12.33251953125, -11.9273681640625, -11.522216796875, -11.1170654296875, -10.7119140625, -10.3067626953125, -9.901611328125, -9.4964599609375, -9.09130859375, -8.6861572265625, -8.281005859375, -7.8758544921875, -7.470703125, -7.0655517578125, -6.660400390625, -6.2552490234375, -5.85009765625, -5.4449462890625, -5.039794921875, -4.6346435546875, -4.2294921875, -3.8243408203125, -3.419189453125, -3.0140380859375, -2.60888671875, -2.2037353515625, -1.798583984375, -1.3934326171875, -0.98828125, -0.5831298828125, -0.177978515625, 0.2271728515625, 0.63232421875, 1.0374755859375, 1.442626953125, 1.8477783203125, 2.2529296875, 2.6580810546875, 3.063232421875, 3.4683837890625, 3.87353515625, 4.2786865234375, 4.683837890625, 5.0889892578125, 5.494140625, 5.8992919921875, 6.304443359375, 6.7095947265625, 7.11474609375, 7.5198974609375, 7.925048828125, 8.3302001953125, 8.7353515625, 9.1405029296875, 9.545654296875, 9.9508056640625, 10.35595703125, 10.7611083984375, 11.166259765625, 11.5714111328125, 11.9765625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 23.0, 86.0, 251.0, 318.0, 187.0, 79.0, 24.0, 14.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.29956817626953, -98.4058609008789, -89.51216125488281, -80.61845397949219, -71.72474670410156, -62.83104705810547, -53.937339782714844, -45.043636322021484, -36.149932861328125, -27.256229400634766, -18.362524032592773, -9.468818664550781, -0.5751152038574219, 8.318588256835938, 17.212295532226562, 26.105998992919922, 34.99970245361328, 43.89340591430664, 52.787109375, 61.680816650390625, 70.57452392578125, 79.46822357177734, 88.36193084716797, 97.25563049316406, 106.14933776855469, 115.04304504394531, 123.9367446899414, 132.8304443359375, 141.72415161132812, 150.61785888671875, 159.51156616210938, 168.4052734375, 177.29898071289062, 186.19268798828125, 195.08639526367188, 203.9801025390625, 212.87379455566406, 221.7675018310547, 230.6612091064453, 239.55491638183594, 248.4486083984375, 257.3423156738281, 266.23602294921875, 275.1297302246094, 284.0234375, 292.9171142578125, 301.81085205078125, 310.70452880859375, 319.5982666015625, 328.4919738769531, 337.38568115234375, 346.2793884277344, 355.173095703125, 364.0667724609375, 372.96051025390625, 381.85418701171875, 390.7478942871094, 399.6416015625, 408.5353088378906, 417.42901611328125, 426.3227233886719, 435.2164306640625, 444.110107421875, 453.0038146972656, 461.89752197265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 7.0, 2.0, 9.0, 15.0, 30.0, 24.0, 29.0, 29.0, 45.0, 44.0, 43.0, 42.0, 53.0, 43.0, 65.0, 54.0, 57.0, 58.0, 48.0, 46.0, 48.0, 34.0, 36.0, 29.0, 18.0, 17.0, 16.0, 20.0, 8.0, 7.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.30931091308594, -65.72479248046875, -63.14027404785156, -60.555755615234375, -57.97124099731445, -55.386722564697266, -52.80220413208008, -50.217689514160156, -47.63317108154297, -45.04865264892578, -42.464134216308594, -39.879615783691406, -37.295101165771484, -34.7105827331543, -32.12606430053711, -29.541547775268555, -26.957027435302734, -24.372509002685547, -21.787992477416992, -19.203474044799805, -16.61895751953125, -14.034439086914062, -11.449920654296875, -8.86540412902832, -6.280885696411133, -3.6963679790496826, -1.1118502616882324, 1.4726676940917969, 4.057185173034668, 6.641702651977539, 9.226221084594727, 11.810737609863281, 14.395256042480469, 16.979774475097656, 19.56429100036621, 22.1488094329834, 24.733325958251953, 27.31784439086914, 29.902362823486328, 32.48687744140625, 35.07139587402344, 37.655914306640625, 40.24043273925781, 42.824951171875, 45.40946578979492, 47.99398422241211, 50.5785026550293, 53.16301727294922, 55.74753952026367, 58.33205795288086, 60.91657638549805, 63.50109100341797, 66.08560943603516, 68.67012786865234, 71.25464630126953, 73.83916473388672, 76.4236831665039, 79.0082015991211, 81.59272003173828, 84.17723846435547, 86.76175689697266, 89.34626770019531, 91.9307861328125, 94.51530456542969, 97.09982299804688]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 8.0, 8.0, 19.0, 25.0, 26.0, 33.0, 75.0, 129.0, 174.0, 277.0, 428.0, 704.0, 998.0, 1930.0, 3369.0, 6166.0, 12047.0, 24929.0, 52666.0, 121172.0, 296287.0, 299336.0, 123068.0, 53084.0, 24996.0, 12180.0, 6215.0, 3347.0, 1846.0, 1122.0, 701.0, 416.0, 276.0, 164.0, 114.0, 64.0, 41.0, 32.0, 33.0, 8.0, 14.0, 11.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.765625, -9.428955078125, -9.09228515625, -8.755615234375, -8.4189453125, -8.082275390625, -7.74560546875, -7.408935546875, -7.072265625, -6.735595703125, -6.39892578125, -6.062255859375, -5.7255859375, -5.388916015625, -5.05224609375, -4.715576171875, -4.37890625, -4.042236328125, -3.70556640625, -3.368896484375, -3.0322265625, -2.695556640625, -2.35888671875, -2.022216796875, -1.685546875, -1.348876953125, -1.01220703125, -0.675537109375, -0.3388671875, -0.002197265625, 0.33447265625, 0.671142578125, 1.0078125, 1.344482421875, 1.68115234375, 2.017822265625, 2.3544921875, 2.691162109375, 3.02783203125, 3.364501953125, 3.701171875, 4.037841796875, 4.37451171875, 4.711181640625, 5.0478515625, 5.384521484375, 5.72119140625, 6.057861328125, 6.39453125, 6.731201171875, 7.06787109375, 7.404541015625, 7.7412109375, 8.077880859375, 8.41455078125, 8.751220703125, 9.087890625, 9.424560546875, 9.76123046875, 10.097900390625, 10.4345703125, 10.771240234375, 11.10791015625, 11.444580078125, 11.78125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 2.0, 2.0, 14.0, 6.0, 11.0, 19.0, 17.0, 25.0, 32.0, 30.0, 31.0, 39.0, 54.0, 43.0, 46.0, 46.0, 53.0, 53.0, 37.0, 47.0, 51.0, 44.0, 31.0, 55.0, 23.0, 36.0, 22.0, 21.0, 25.0, 20.0, 10.0, 5.0, 11.0, 9.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.828125, -4.65985107421875, -4.4915771484375, -4.32330322265625, -4.155029296875, -3.98675537109375, -3.8184814453125, -3.65020751953125, -3.48193359375, -3.31365966796875, -3.1453857421875, -2.97711181640625, -2.808837890625, -2.64056396484375, -2.4722900390625, -2.30401611328125, -2.1357421875, -1.96746826171875, -1.7991943359375, -1.63092041015625, -1.462646484375, -1.29437255859375, -1.1260986328125, -0.95782470703125, -0.78955078125, -0.62127685546875, -0.4530029296875, -0.28472900390625, -0.116455078125, 0.05181884765625, 0.2200927734375, 0.38836669921875, 0.556640625, 0.72491455078125, 0.8931884765625, 1.06146240234375, 1.229736328125, 1.39801025390625, 1.5662841796875, 1.73455810546875, 1.90283203125, 2.07110595703125, 2.2393798828125, 2.40765380859375, 2.575927734375, 2.74420166015625, 2.9124755859375, 3.08074951171875, 3.2490234375, 3.41729736328125, 3.5855712890625, 3.75384521484375, 3.922119140625, 4.09039306640625, 4.2586669921875, 4.42694091796875, 4.59521484375, 4.76348876953125, 4.9317626953125, 5.10003662109375, 5.268310546875, 5.43658447265625, 5.6048583984375, 5.77313232421875, 5.94140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 9.0, 8.0, 11.0, 12.0, 28.0, 36.0, 57.0, 64.0, 108.0, 185.0, 351.0, 688.0, 1750.0, 8350.0, 168364.0, 837132.0, 25841.0, 3349.0, 1076.0, 476.0, 239.0, 165.0, 71.0, 50.0, 30.0, 31.0, 19.0, 14.0, 7.0, 5.0, 9.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-43.0625, -41.68359375, -40.3046875, -38.92578125, -37.546875, -36.16796875, -34.7890625, -33.41015625, -32.03125, -30.65234375, -29.2734375, -27.89453125, -26.515625, -25.13671875, -23.7578125, -22.37890625, -21.0, -19.62109375, -18.2421875, -16.86328125, -15.484375, -14.10546875, -12.7265625, -11.34765625, -9.96875, -8.58984375, -7.2109375, -5.83203125, -4.453125, -3.07421875, -1.6953125, -0.31640625, 1.0625, 2.44140625, 3.8203125, 5.19921875, 6.578125, 7.95703125, 9.3359375, 10.71484375, 12.09375, 13.47265625, 14.8515625, 16.23046875, 17.609375, 18.98828125, 20.3671875, 21.74609375, 23.125, 24.50390625, 25.8828125, 27.26171875, 28.640625, 30.01953125, 31.3984375, 32.77734375, 34.15625, 35.53515625, 36.9140625, 38.29296875, 39.671875, 41.05078125, 42.4296875, 43.80859375, 45.1875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 1.0, 7.0, 8.0, 11.0, 15.0, 12.0, 16.0, 18.0, 25.0, 25.0, 23.0, 39.0, 32.0, 51.0, 50.0, 63.0, 58.0, 58.0, 63.0, 71.0, 48.0, 49.0, 47.0, 38.0, 25.0, 30.0, 25.0, 20.0, 8.0, 12.0, 15.0, 8.0, 1.0, 8.0, 0.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-24.09375, -23.235107421875, -22.37646484375, -21.517822265625, -20.6591796875, -19.800537109375, -18.94189453125, -18.083251953125, -17.224609375, -16.365966796875, -15.50732421875, -14.648681640625, -13.7900390625, -12.931396484375, -12.07275390625, -11.214111328125, -10.35546875, -9.496826171875, -8.63818359375, -7.779541015625, -6.9208984375, -6.062255859375, -5.20361328125, -4.344970703125, -3.486328125, -2.627685546875, -1.76904296875, -0.910400390625, -0.0517578125, 0.806884765625, 1.66552734375, 2.524169921875, 3.3828125, 4.241455078125, 5.10009765625, 5.958740234375, 6.8173828125, 7.676025390625, 8.53466796875, 9.393310546875, 10.251953125, 11.110595703125, 11.96923828125, 12.827880859375, 13.6865234375, 14.545166015625, 15.40380859375, 16.262451171875, 17.12109375, 17.979736328125, 18.83837890625, 19.697021484375, 20.5556640625, 21.414306640625, 22.27294921875, 23.131591796875, 23.990234375, 24.848876953125, 25.70751953125, 26.566162109375, 27.4248046875, 28.283447265625, 29.14208984375, 30.000732421875, 30.859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 14.0, 14.0, 15.0, 29.0, 33.0, 45.0, 69.0, 109.0, 197.0, 387.0, 917.0, 2615.0, 13813.0, 205774.0, 780736.0, 36310.0, 4888.0, 1325.0, 535.0, 276.0, 126.0, 108.0, 54.0, 36.0, 26.0, 21.0, 21.0, 9.0, 5.0, 3.0, 6.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.1875, -12.7509765625, -12.314453125, -11.8779296875, -11.44140625, -11.0048828125, -10.568359375, -10.1318359375, -9.6953125, -9.2587890625, -8.822265625, -8.3857421875, -7.94921875, -7.5126953125, -7.076171875, -6.6396484375, -6.203125, -5.7666015625, -5.330078125, -4.8935546875, -4.45703125, -4.0205078125, -3.583984375, -3.1474609375, -2.7109375, -2.2744140625, -1.837890625, -1.4013671875, -0.96484375, -0.5283203125, -0.091796875, 0.3447265625, 0.78125, 1.2177734375, 1.654296875, 2.0908203125, 2.52734375, 2.9638671875, 3.400390625, 3.8369140625, 4.2734375, 4.7099609375, 5.146484375, 5.5830078125, 6.01953125, 6.4560546875, 6.892578125, 7.3291015625, 7.765625, 8.2021484375, 8.638671875, 9.0751953125, 9.51171875, 9.9482421875, 10.384765625, 10.8212890625, 11.2578125, 11.6943359375, 12.130859375, 12.5673828125, 13.00390625, 13.4404296875, 13.876953125, 14.3134765625, 14.75]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 12.0, 12.0, 15.0, 23.0, 23.0, 31.0, 55.0, 95.0, 136.0, 183.0, 125.0, 80.0, 59.0, 28.0, 35.0, 20.0, 21.0, 10.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00276947021484375, -0.0026991814374923706, -0.002628892660140991, -0.002558603882789612, -0.0024883151054382324, -0.002418026328086853, -0.0023477375507354736, -0.0022774487733840942, -0.002207159996032715, -0.0021368712186813354, -0.002066582441329956, -0.0019962936639785767, -0.0019260048866271973, -0.0018557161092758179, -0.0017854273319244385, -0.001715138554573059, -0.0016448497772216797, -0.0015745609998703003, -0.001504272222518921, -0.0014339834451675415, -0.0013636946678161621, -0.0012934058904647827, -0.0012231171131134033, -0.001152828335762024, -0.0010825395584106445, -0.0010122507810592651, -0.0009419620037078857, -0.0008716732263565063, -0.000801384449005127, -0.0007310956716537476, -0.0006608068943023682, -0.0005905181169509888, -0.0005202293395996094, -0.00044994056224823, -0.0003796517848968506, -0.0003093630075454712, -0.0002390742301940918, -0.0001687854528427124, -9.849667549133301e-05, -2.8207898139953613e-05, 4.208087921142578e-05, 0.00011236965656280518, 0.00018265843391418457, 0.00025294721126556396, 0.00032323598861694336, 0.00039352476596832275, 0.00046381354331970215, 0.0005341023206710815, 0.0006043910980224609, 0.0006746798753738403, 0.0007449686527252197, 0.0008152574300765991, 0.0008855462074279785, 0.0009558349847793579, 0.0010261237621307373, 0.0010964125394821167, 0.001166701316833496, 0.0012369900941848755, 0.0013072788715362549, 0.0013775676488876343, 0.0014478564262390137, 0.001518145203590393, 0.0015884339809417725, 0.0016587227582931519, 0.0017290115356445312]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 7.0, 8.0, 15.0, 16.0, 9.0, 22.0, 30.0, 33.0, 82.0, 107.0, 147.0, 276.0, 480.0, 1009.0, 2084.0, 6492.0, 35878.0, 579863.0, 384504.0, 28029.0, 5598.0, 1877.0, 809.0, 420.0, 261.0, 150.0, 108.0, 60.0, 39.0, 26.0, 25.0, 18.0, 14.0, 12.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.796875, -10.423828125, -10.05078125, -9.677734375, -9.3046875, -8.931640625, -8.55859375, -8.185546875, -7.8125, -7.439453125, -7.06640625, -6.693359375, -6.3203125, -5.947265625, -5.57421875, -5.201171875, -4.828125, -4.455078125, -4.08203125, -3.708984375, -3.3359375, -2.962890625, -2.58984375, -2.216796875, -1.84375, -1.470703125, -1.09765625, -0.724609375, -0.3515625, 0.021484375, 0.39453125, 0.767578125, 1.140625, 1.513671875, 1.88671875, 2.259765625, 2.6328125, 3.005859375, 3.37890625, 3.751953125, 4.125, 4.498046875, 4.87109375, 5.244140625, 5.6171875, 5.990234375, 6.36328125, 6.736328125, 7.109375, 7.482421875, 7.85546875, 8.228515625, 8.6015625, 8.974609375, 9.34765625, 9.720703125, 10.09375, 10.466796875, 10.83984375, 11.212890625, 11.5859375, 11.958984375, 12.33203125, 12.705078125, 13.078125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 6.0, 7.0, 2.0, 6.0, 4.0, 5.0, 5.0, 17.0, 17.0, 23.0, 21.0, 29.0, 32.0, 42.0, 69.0, 88.0, 101.0, 105.0, 79.0, 80.0, 47.0, 46.0, 42.0, 22.0, 20.0, 21.0, 13.0, 7.0, 7.0, 5.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.51708984375, -8.2685546875, -8.02001953125, -7.771484375, -7.52294921875, -7.2744140625, -7.02587890625, -6.77734375, -6.52880859375, -6.2802734375, -6.03173828125, -5.783203125, -5.53466796875, -5.2861328125, -5.03759765625, -4.7890625, -4.54052734375, -4.2919921875, -4.04345703125, -3.794921875, -3.54638671875, -3.2978515625, -3.04931640625, -2.80078125, -2.55224609375, -2.3037109375, -2.05517578125, -1.806640625, -1.55810546875, -1.3095703125, -1.06103515625, -0.8125, -0.56396484375, -0.3154296875, -0.06689453125, 0.181640625, 0.43017578125, 0.6787109375, 0.92724609375, 1.17578125, 1.42431640625, 1.6728515625, 1.92138671875, 2.169921875, 2.41845703125, 2.6669921875, 2.91552734375, 3.1640625, 3.41259765625, 3.6611328125, 3.90966796875, 4.158203125, 4.40673828125, 4.6552734375, 4.90380859375, 5.15234375, 5.40087890625, 5.6494140625, 5.89794921875, 6.146484375, 6.39501953125, 6.6435546875, 6.89208984375, 7.140625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 21.0, 72.0, 228.0, 357.0, 209.0, 64.0, 23.0, 7.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-225.30621337890625, -214.85260009765625, -204.39898681640625, -193.94537353515625, -183.49176025390625, -173.03814697265625, -162.58453369140625, -152.13092041015625, -141.67730712890625, -131.22369384765625, -120.77008056640625, -110.31646728515625, -99.86285400390625, -89.40924072265625, -78.95561981201172, -68.50200653076172, -58.04838562011719, -47.59477233886719, -37.14115905761719, -26.687541961669922, -16.233928680419922, -5.780315399169922, 4.673301696777344, 15.126914978027344, 25.580528259277344, 36.034141540527344, 46.487754821777344, 56.94137191772461, 67.39498901367188, 77.84860229492188, 88.30221557617188, 98.75582885742188, 109.20944213867188, 119.66305541992188, 130.11666870117188, 140.57028198242188, 151.02389526367188, 161.47750854492188, 171.93112182617188, 182.38473510742188, 192.83834838867188, 203.29196166992188, 213.74557495117188, 224.19918823242188, 234.65280151367188, 245.10641479492188, 255.56002807617188, 266.0136413574219, 276.46728515625, 286.9208984375, 297.37451171875, 307.828125, 318.28173828125, 328.7353515625, 339.18896484375, 349.642578125, 360.09619140625, 370.5498046875, 381.00341796875, 391.45703125, 401.91064453125, 412.3642578125, 422.81787109375, 433.271484375, 443.72509765625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 8.0, 9.0, 9.0, 10.0, 15.0, 18.0, 18.0, 11.0, 23.0, 25.0, 18.0, 36.0, 29.0, 32.0, 35.0, 41.0, 54.0, 56.0, 52.0, 54.0, 57.0, 50.0, 39.0, 37.0, 30.0, 29.0, 25.0, 32.0, 27.0, 26.0, 15.0, 17.0, 17.0, 14.0, 8.0, 13.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-100.84375, -97.78082275390625, -94.7178955078125, -91.65496826171875, -88.592041015625, -85.52912139892578, -82.46619415283203, -79.40326690673828, -76.34033966064453, -73.27741241455078, -70.21448516845703, -67.15155792236328, -64.08863830566406, -61.02570724487305, -57.96278381347656, -54.89985656738281, -51.83692932128906, -48.77400207519531, -45.71107482910156, -42.64815139770508, -39.58522415161133, -36.52229690551758, -33.459373474121094, -30.396446228027344, -27.333518981933594, -24.270591735839844, -21.207666397094727, -18.14474105834961, -15.08181381225586, -12.018887519836426, -8.955961227416992, -5.893035888671875, -2.8301162719726562, 0.23281002044677734, 3.295736312866211, 6.3586626052856445, 9.421588897705078, 12.484515190124512, 15.547441482543945, 18.610366821289062, 21.673294067382812, 24.736221313476562, 27.79914665222168, 30.862071990966797, 33.92499923706055, 36.9879264831543, 40.05084991455078, 43.11377716064453, 46.17670440673828, 49.23963165283203, 52.30255889892578, 55.365482330322266, 58.428409576416016, 61.491336822509766, 64.55426025390625, 67.6171875, 70.68011474609375, 73.7430419921875, 76.80596923828125, 79.868896484375, 82.93182373046875, 85.99474334716797, 89.05767059326172, 92.12059783935547, 95.18352508544922]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 17.0, 33.0, 47.0, 75.0, 134.0, 276.0, 1533.0, 4142497.0, 48625.0, 548.0, 206.0, 109.0, 80.0, 42.0, 12.0, 14.0, 9.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.9375, -85.73828125, -82.5390625, -79.33984375, -76.140625, -72.94140625, -69.7421875, -66.54296875, -63.34375, -60.14453125, -56.9453125, -53.74609375, -50.546875, -47.34765625, -44.1484375, -40.94921875, -37.75, -34.55078125, -31.3515625, -28.15234375, -24.953125, -21.75390625, -18.5546875, -15.35546875, -12.15625, -8.95703125, -5.7578125, -2.55859375, 0.640625, 3.83984375, 7.0390625, 10.23828125, 13.4375, 16.63671875, 19.8359375, 23.03515625, 26.234375, 29.43359375, 32.6328125, 35.83203125, 39.03125, 42.23046875, 45.4296875, 48.62890625, 51.828125, 55.02734375, 58.2265625, 61.42578125, 64.625, 67.82421875, 71.0234375, 74.22265625, 77.421875, 80.62109375, 83.8203125, 87.01953125, 90.21875, 93.41796875, 96.6171875, 99.81640625, 103.015625, 106.21484375, 109.4140625, 112.61328125, 115.8125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 14.0, 6.0, 23.0, 32.0, 27.0, 39.0, 60.0, 61.0, 71.0, 83.0, 75.0, 76.0, 73.0, 79.0, 56.0, 53.0, 40.0, 33.0, 24.0, 23.0, 14.0, 11.0, 8.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.87994384765625, -7.6348876953125, -7.38983154296875, -7.144775390625, -6.89971923828125, -6.6546630859375, -6.40960693359375, -6.16455078125, -5.91949462890625, -5.6744384765625, -5.42938232421875, -5.184326171875, -4.93927001953125, -4.6942138671875, -4.44915771484375, -4.2041015625, -3.95904541015625, -3.7139892578125, -3.46893310546875, -3.223876953125, -2.97882080078125, -2.7337646484375, -2.48870849609375, -2.24365234375, -1.99859619140625, -1.7535400390625, -1.50848388671875, -1.263427734375, -1.01837158203125, -0.7733154296875, -0.52825927734375, -0.283203125, -0.03814697265625, 0.2069091796875, 0.45196533203125, 0.697021484375, 0.94207763671875, 1.1871337890625, 1.43218994140625, 1.67724609375, 1.92230224609375, 2.1673583984375, 2.41241455078125, 2.657470703125, 2.90252685546875, 3.1475830078125, 3.39263916015625, 3.6376953125, 3.88275146484375, 4.1278076171875, 4.37286376953125, 4.617919921875, 4.86297607421875, 5.1080322265625, 5.35308837890625, 5.59814453125, 5.84320068359375, 6.0882568359375, 6.33331298828125, 6.578369140625, 6.82342529296875, 7.0684814453125, 7.31353759765625, 7.55859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 6.0, 8.0, 17.0, 17.0, 18.0, 61.0, 89.0, 187.0, 339.0, 746.0, 1488.0, 3316.0, 7818.0, 20905.0, 78085.0, 738732.0, 3063094.0, 213607.0, 41030.0, 13418.0, 5756.0, 2690.0, 1338.0, 704.0, 396.0, 184.0, 96.0, 52.0, 35.0, 21.0, 8.0, 5.0, 8.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.015625, -10.6517333984375, -10.287841796875, -9.9239501953125, -9.56005859375, -9.1961669921875, -8.832275390625, -8.4683837890625, -8.1044921875, -7.7406005859375, -7.376708984375, -7.0128173828125, -6.64892578125, -6.2850341796875, -5.921142578125, -5.5572509765625, -5.193359375, -4.8294677734375, -4.465576171875, -4.1016845703125, -3.73779296875, -3.3739013671875, -3.010009765625, -2.6461181640625, -2.2822265625, -1.9183349609375, -1.554443359375, -1.1905517578125, -0.82666015625, -0.4627685546875, -0.098876953125, 0.2650146484375, 0.62890625, 0.9927978515625, 1.356689453125, 1.7205810546875, 2.08447265625, 2.4483642578125, 2.812255859375, 3.1761474609375, 3.5400390625, 3.9039306640625, 4.267822265625, 4.6317138671875, 4.99560546875, 5.3594970703125, 5.723388671875, 6.0872802734375, 6.451171875, 6.8150634765625, 7.178955078125, 7.5428466796875, 7.90673828125, 8.2706298828125, 8.634521484375, 8.9984130859375, 9.3623046875, 9.7261962890625, 10.090087890625, 10.4539794921875, 10.81787109375, 11.1817626953125, 11.545654296875, 11.9095458984375, 12.2734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 12.0, 11.0, 15.0, 26.0, 24.0, 37.0, 72.0, 91.0, 142.0, 243.0, 469.0, 799.0, 800.0, 503.0, 292.0, 159.0, 98.0, 67.0, 42.0, 33.0, 24.0, 18.0, 18.0, 13.0, 8.0, 5.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-9.390625, -9.0677490234375, -8.744873046875, -8.4219970703125, -8.09912109375, -7.7762451171875, -7.453369140625, -7.1304931640625, -6.8076171875, -6.4847412109375, -6.161865234375, -5.8389892578125, -5.51611328125, -5.1932373046875, -4.870361328125, -4.5474853515625, -4.224609375, -3.9017333984375, -3.578857421875, -3.2559814453125, -2.93310546875, -2.6102294921875, -2.287353515625, -1.9644775390625, -1.6416015625, -1.3187255859375, -0.995849609375, -0.6729736328125, -0.35009765625, -0.0272216796875, 0.295654296875, 0.6185302734375, 0.94140625, 1.2642822265625, 1.587158203125, 1.9100341796875, 2.23291015625, 2.5557861328125, 2.878662109375, 3.2015380859375, 3.5244140625, 3.8472900390625, 4.170166015625, 4.4930419921875, 4.81591796875, 5.1387939453125, 5.461669921875, 5.7845458984375, 6.107421875, 6.4302978515625, 6.753173828125, 7.0760498046875, 7.39892578125, 7.7218017578125, 8.044677734375, 8.3675537109375, 8.6904296875, 9.0133056640625, 9.336181640625, 9.6590576171875, 9.98193359375, 10.3048095703125, 10.627685546875, 10.9505615234375, 11.2734375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 11.0, 14.0, 20.0, 48.0, 68.0, 133.0, 169.0, 163.0, 130.0, 96.0, 53.0, 27.0, 16.0, 17.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.15904235839844, -59.059532165527344, -55.96002197265625, -52.860511779785156, -49.76100158691406, -46.66149139404297, -43.56197738647461, -40.462467193603516, -37.36295700073242, -34.26344680786133, -31.163936614990234, -28.064424514770508, -24.964914321899414, -21.86540412902832, -18.765892028808594, -15.6663818359375, -12.566871643066406, -9.467361450195312, -6.367850303649902, -3.268339157104492, -0.16882896423339844, 2.9306812286376953, 6.030193328857422, 9.129703521728516, 12.22921371459961, 15.328723907470703, 18.428234100341797, 21.527746200561523, 24.627256393432617, 27.72676658630371, 30.826278686523438, 33.92578887939453, 37.025299072265625, 40.12480926513672, 43.22431945800781, 46.323829650878906, 49.42333984375, 52.522850036621094, 55.62236404418945, 58.72187423706055, 61.82138442993164, 64.9208984375, 68.0204086303711, 71.11991882324219, 74.21942901611328, 77.31893920898438, 80.41844940185547, 83.51795959472656, 86.61746978759766, 89.71697998046875, 92.81649017333984, 95.91600036621094, 99.01551055908203, 102.11502075195312, 105.21453857421875, 108.31404113769531, 111.41355895996094, 114.51306915283203, 117.61257934570312, 120.71208953857422, 123.81159973144531, 126.9111099243164, 130.0106201171875, 133.11013793945312, 136.2096405029297]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 11.0, 9.0, 8.0, 17.0, 25.0, 37.0, 38.0, 32.0, 41.0, 38.0, 41.0, 61.0, 66.0, 68.0, 56.0, 42.0, 51.0, 45.0, 38.0, 39.0, 43.0, 40.0, 26.0, 20.0, 17.0, 19.0, 15.0, 14.0, 10.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.64141082763672, -45.89904022216797, -44.15666961669922, -42.41429901123047, -40.67192840576172, -38.92955780029297, -37.18718338012695, -35.4448127746582, -33.70244216918945, -31.960071563720703, -30.217700958251953, -28.47532844543457, -26.73295783996582, -24.99058723449707, -23.248214721679688, -21.505844116210938, -19.763473510742188, -18.021102905273438, -16.278732299804688, -14.536359786987305, -12.793989181518555, -11.051618576049805, -9.309247016906738, -7.566875457763672, -5.824504852294922, -4.082133769989014, -2.3397626876831055, -0.5973916053771973, 1.144979476928711, 2.887350082397461, 4.629721641540527, 6.372093200683594, 8.114459991455078, 9.856830596923828, 11.599202156066895, 13.341573715209961, 15.083944320678711, 16.82631492614746, 18.568687438964844, 20.311058044433594, 22.053428649902344, 23.795799255371094, 25.538169860839844, 27.280542373657227, 29.022912979125977, 30.765283584594727, 32.50765609741211, 34.25002670288086, 35.99239730834961, 37.73476791381836, 39.47713851928711, 41.21950912475586, 42.961883544921875, 44.704254150390625, 46.446624755859375, 48.188995361328125, 49.931365966796875, 51.673736572265625, 53.416107177734375, 55.158477783203125, 56.900848388671875, 58.643218994140625, 60.38559341430664, 62.12796401977539, 63.87033462524414]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 13.0, 21.0, 30.0, 44.0, 66.0, 126.0, 204.0, 342.0, 646.0, 1353.0, 2779.0, 6186.0, 14034.0, 34194.0, 91336.0, 291574.0, 396674.0, 129155.0, 46125.0, 18544.0, 8131.0, 3516.0, 1657.0, 821.0, 370.0, 251.0, 131.0, 79.0, 58.0, 24.0, 24.0, 14.0, 6.0, 3.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-13.3046875, -12.92626953125, -12.5478515625, -12.16943359375, -11.791015625, -11.41259765625, -11.0341796875, -10.65576171875, -10.27734375, -9.89892578125, -9.5205078125, -9.14208984375, -8.763671875, -8.38525390625, -8.0068359375, -7.62841796875, -7.25, -6.87158203125, -6.4931640625, -6.11474609375, -5.736328125, -5.35791015625, -4.9794921875, -4.60107421875, -4.22265625, -3.84423828125, -3.4658203125, -3.08740234375, -2.708984375, -2.33056640625, -1.9521484375, -1.57373046875, -1.1953125, -0.81689453125, -0.4384765625, -0.06005859375, 0.318359375, 0.69677734375, 1.0751953125, 1.45361328125, 1.83203125, 2.21044921875, 2.5888671875, 2.96728515625, 3.345703125, 3.72412109375, 4.1025390625, 4.48095703125, 4.859375, 5.23779296875, 5.6162109375, 5.99462890625, 6.373046875, 6.75146484375, 7.1298828125, 7.50830078125, 7.88671875, 8.26513671875, 8.6435546875, 9.02197265625, 9.400390625, 9.77880859375, 10.1572265625, 10.53564453125, 10.9140625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 12.0, 9.0, 14.0, 14.0, 16.0, 27.0, 33.0, 41.0, 50.0, 54.0, 50.0, 64.0, 57.0, 78.0, 66.0, 73.0, 58.0, 61.0, 37.0, 43.0, 31.0, 27.0, 19.0, 21.0, 17.0, 12.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0859375, -7.87176513671875, -7.6575927734375, -7.44342041015625, -7.229248046875, -7.01507568359375, -6.8009033203125, -6.58673095703125, -6.37255859375, -6.15838623046875, -5.9442138671875, -5.73004150390625, -5.515869140625, -5.30169677734375, -5.0875244140625, -4.87335205078125, -4.6591796875, -4.44500732421875, -4.2308349609375, -4.01666259765625, -3.802490234375, -3.58831787109375, -3.3741455078125, -3.15997314453125, -2.94580078125, -2.73162841796875, -2.5174560546875, -2.30328369140625, -2.089111328125, -1.87493896484375, -1.6607666015625, -1.44659423828125, -1.232421875, -1.01824951171875, -0.8040771484375, -0.58990478515625, -0.375732421875, -0.16156005859375, 0.0526123046875, 0.26678466796875, 0.48095703125, 0.69512939453125, 0.9093017578125, 1.12347412109375, 1.337646484375, 1.55181884765625, 1.7659912109375, 1.98016357421875, 2.1943359375, 2.40850830078125, 2.6226806640625, 2.83685302734375, 3.051025390625, 3.26519775390625, 3.4793701171875, 3.69354248046875, 3.90771484375, 4.12188720703125, 4.3360595703125, 4.55023193359375, 4.764404296875, 4.97857666015625, 5.1927490234375, 5.40692138671875, 5.62109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 11.0, 16.0, 28.0, 40.0, 59.0, 101.0, 174.0, 305.0, 632.0, 1518.0, 5438.0, 34976.0, 545917.0, 420516.0, 31123.0, 5023.0, 1423.0, 556.0, 274.0, 146.0, 84.0, 60.0, 42.0, 35.0, 17.0, 15.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.234375, -25.413818359375, -24.59326171875, -23.772705078125, -22.9521484375, -22.131591796875, -21.31103515625, -20.490478515625, -19.669921875, -18.849365234375, -18.02880859375, -17.208251953125, -16.3876953125, -15.567138671875, -14.74658203125, -13.926025390625, -13.10546875, -12.284912109375, -11.46435546875, -10.643798828125, -9.8232421875, -9.002685546875, -8.18212890625, -7.361572265625, -6.541015625, -5.720458984375, -4.89990234375, -4.079345703125, -3.2587890625, -2.438232421875, -1.61767578125, -0.797119140625, 0.0234375, 0.843994140625, 1.66455078125, 2.485107421875, 3.3056640625, 4.126220703125, 4.94677734375, 5.767333984375, 6.587890625, 7.408447265625, 8.22900390625, 9.049560546875, 9.8701171875, 10.690673828125, 11.51123046875, 12.331787109375, 13.15234375, 13.972900390625, 14.79345703125, 15.614013671875, 16.4345703125, 17.255126953125, 18.07568359375, 18.896240234375, 19.716796875, 20.537353515625, 21.35791015625, 22.178466796875, 22.9990234375, 23.819580078125, 24.64013671875, 25.460693359375, 26.28125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 9.0, 13.0, 13.0, 15.0, 29.0, 33.0, 30.0, 34.0, 39.0, 49.0, 46.0, 57.0, 51.0, 59.0, 55.0, 60.0, 62.0, 58.0, 28.0, 39.0, 35.0, 26.0, 28.0, 27.0, 10.0, 18.0, 12.0, 12.0, 10.0, 9.0, 5.0, 1.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.109375, -19.44091796875, -18.7724609375, -18.10400390625, -17.435546875, -16.76708984375, -16.0986328125, -15.43017578125, -14.76171875, -14.09326171875, -13.4248046875, -12.75634765625, -12.087890625, -11.41943359375, -10.7509765625, -10.08251953125, -9.4140625, -8.74560546875, -8.0771484375, -7.40869140625, -6.740234375, -6.07177734375, -5.4033203125, -4.73486328125, -4.06640625, -3.39794921875, -2.7294921875, -2.06103515625, -1.392578125, -0.72412109375, -0.0556640625, 0.61279296875, 1.28125, 1.94970703125, 2.6181640625, 3.28662109375, 3.955078125, 4.62353515625, 5.2919921875, 5.96044921875, 6.62890625, 7.29736328125, 7.9658203125, 8.63427734375, 9.302734375, 9.97119140625, 10.6396484375, 11.30810546875, 11.9765625, 12.64501953125, 13.3134765625, 13.98193359375, 14.650390625, 15.31884765625, 15.9873046875, 16.65576171875, 17.32421875, 17.99267578125, 18.6611328125, 19.32958984375, 19.998046875, 20.66650390625, 21.3349609375, 22.00341796875, 22.671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 7.0, 8.0, 14.0, 17.0, 23.0, 45.0, 83.0, 165.0, 330.0, 1036.0, 5303.0, 173858.0, 852774.0, 12304.0, 1694.0, 469.0, 183.0, 89.0, 54.0, 29.0, 19.0, 13.0, 4.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.8125, -23.135498046875, -22.45849609375, -21.781494140625, -21.1044921875, -20.427490234375, -19.75048828125, -19.073486328125, -18.396484375, -17.719482421875, -17.04248046875, -16.365478515625, -15.6884765625, -15.011474609375, -14.33447265625, -13.657470703125, -12.98046875, -12.303466796875, -11.62646484375, -10.949462890625, -10.2724609375, -9.595458984375, -8.91845703125, -8.241455078125, -7.564453125, -6.887451171875, -6.21044921875, -5.533447265625, -4.8564453125, -4.179443359375, -3.50244140625, -2.825439453125, -2.1484375, -1.471435546875, -0.79443359375, -0.117431640625, 0.5595703125, 1.236572265625, 1.91357421875, 2.590576171875, 3.267578125, 3.944580078125, 4.62158203125, 5.298583984375, 5.9755859375, 6.652587890625, 7.32958984375, 8.006591796875, 8.68359375, 9.360595703125, 10.03759765625, 10.714599609375, 11.3916015625, 12.068603515625, 12.74560546875, 13.422607421875, 14.099609375, 14.776611328125, 15.45361328125, 16.130615234375, 16.8076171875, 17.484619140625, 18.16162109375, 18.838623046875, 19.515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 11.0, 5.0, 14.0, 7.0, 11.0, 7.0, 12.0, 19.0, 22.0, 14.0, 40.0, 34.0, 56.0, 64.0, 83.0, 118.0, 112.0, 82.0, 49.0, 48.0, 33.0, 28.0, 35.0, 20.0, 17.0, 7.0, 7.0, 6.0, 7.0, 5.0, 4.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0013256072998046875, -0.0012864917516708374, -0.0012473762035369873, -0.0012082606554031372, -0.0011691451072692871, -0.001130029559135437, -0.001090914011001587, -0.0010517984628677368, -0.0010126829147338867, -0.0009735673666000366, -0.0009344518184661865, -0.0008953362703323364, -0.0008562207221984863, -0.0008171051740646362, -0.0007779896259307861, -0.000738874077796936, -0.0006997585296630859, -0.0006606429815292358, -0.0006215274333953857, -0.0005824118852615356, -0.0005432963371276855, -0.0005041807889938354, -0.00046506524085998535, -0.00042594969272613525, -0.00038683414459228516, -0.00034771859645843506, -0.00030860304832458496, -0.00026948750019073486, -0.00023037195205688477, -0.00019125640392303467, -0.00015214085578918457, -0.00011302530765533447, -7.390975952148438e-05, -3.479421138763428e-05, 4.32133674621582e-06, 4.343688488006592e-05, 8.255243301391602e-05, 0.00012166798114776611, 0.0001607835292816162, 0.0001998990774154663, 0.0002390146255493164, 0.0002781301736831665, 0.0003172457218170166, 0.0003563612699508667, 0.0003954768180847168, 0.0004345923662185669, 0.000473707914352417, 0.0005128234624862671, 0.0005519390106201172, 0.0005910545587539673, 0.0006301701068878174, 0.0006692856550216675, 0.0007084012031555176, 0.0007475167512893677, 0.0007866322994232178, 0.0008257478475570679, 0.000864863395690918, 0.0009039789438247681, 0.0009430944919586182, 0.0009822100400924683, 0.0010213255882263184, 0.0010604411363601685, 0.0010995566844940186, 0.0011386722326278687, 0.0011777877807617188]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 9.0, 17.0, 20.0, 42.0, 74.0, 167.0, 387.0, 1019.0, 4143.0, 47402.0, 914051.0, 73900.0, 5253.0, 1256.0, 404.0, 179.0, 104.0, 39.0, 26.0, 19.0, 9.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7578125, -13.2398681640625, -12.721923828125, -12.2039794921875, -11.68603515625, -11.1680908203125, -10.650146484375, -10.1322021484375, -9.6142578125, -9.0963134765625, -8.578369140625, -8.0604248046875, -7.54248046875, -7.0245361328125, -6.506591796875, -5.9886474609375, -5.470703125, -4.9527587890625, -4.434814453125, -3.9168701171875, -3.39892578125, -2.8809814453125, -2.363037109375, -1.8450927734375, -1.3271484375, -0.8092041015625, -0.291259765625, 0.2266845703125, 0.74462890625, 1.2625732421875, 1.780517578125, 2.2984619140625, 2.81640625, 3.3343505859375, 3.852294921875, 4.3702392578125, 4.88818359375, 5.4061279296875, 5.924072265625, 6.4420166015625, 6.9599609375, 7.4779052734375, 7.995849609375, 8.5137939453125, 9.03173828125, 9.5496826171875, 10.067626953125, 10.5855712890625, 11.103515625, 11.6214599609375, 12.139404296875, 12.6573486328125, 13.17529296875, 13.6932373046875, 14.211181640625, 14.7291259765625, 15.2470703125, 15.7650146484375, 16.282958984375, 16.8009033203125, 17.31884765625, 17.8367919921875, 18.354736328125, 18.8726806640625, 19.390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 12.0, 15.0, 27.0, 32.0, 41.0, 53.0, 73.0, 81.0, 116.0, 116.0, 104.0, 84.0, 74.0, 38.0, 33.0, 28.0, 14.0, 11.0, 7.0, 9.0, 3.0, 9.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7109375, -5.4442138671875, -5.177490234375, -4.9107666015625, -4.64404296875, -4.3773193359375, -4.110595703125, -3.8438720703125, -3.5771484375, -3.3104248046875, -3.043701171875, -2.7769775390625, -2.51025390625, -2.2435302734375, -1.976806640625, -1.7100830078125, -1.443359375, -1.1766357421875, -0.909912109375, -0.6431884765625, -0.37646484375, -0.1097412109375, 0.156982421875, 0.4237060546875, 0.6904296875, 0.9571533203125, 1.223876953125, 1.4906005859375, 1.75732421875, 2.0240478515625, 2.290771484375, 2.5574951171875, 2.82421875, 3.0909423828125, 3.357666015625, 3.6243896484375, 3.89111328125, 4.1578369140625, 4.424560546875, 4.6912841796875, 4.9580078125, 5.2247314453125, 5.491455078125, 5.7581787109375, 6.02490234375, 6.2916259765625, 6.558349609375, 6.8250732421875, 7.091796875, 7.3585205078125, 7.625244140625, 7.8919677734375, 8.15869140625, 8.4254150390625, 8.692138671875, 8.9588623046875, 9.2255859375, 9.4923095703125, 9.759033203125, 10.0257568359375, 10.29248046875, 10.5592041015625, 10.825927734375, 11.0926513671875, 11.359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 12.0, 17.0, 49.0, 104.0, 149.0, 250.0, 207.0, 108.0, 45.0, 26.0, 14.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.82061767578125, -161.58380126953125, -156.3470001220703, -151.1101837158203, -145.8733673095703, -140.63656616210938, -135.39974975585938, -130.16293334960938, -124.9261245727539, -119.68931579589844, -114.45249938964844, -109.21569061279297, -103.9788818359375, -98.7420654296875, -93.50525665283203, -88.26844787597656, -83.03163146972656, -77.7948226928711, -72.5580062866211, -67.32119750976562, -62.08438491821289, -56.847572326660156, -51.61076354980469, -46.37395095825195, -41.13713836669922, -35.900325775146484, -30.663515090942383, -25.42670440673828, -20.189891815185547, -14.953079223632812, -9.716268539428711, -4.479457855224609, 0.757354736328125, 5.994166374206543, 11.230978012084961, 16.467788696289062, 21.704601287841797, 26.94141387939453, 32.17822265625, 37.415035247802734, 42.65184783935547, 47.8886604309082, 53.12547302246094, 58.362281799316406, 63.59909439086914, 68.83590698242188, 74.07271575927734, 79.30952453613281, 84.54634094238281, 89.78314971923828, 95.01996612548828, 100.25677490234375, 105.49359130859375, 110.73040008544922, 115.96720886230469, 121.20402526855469, 126.44083404541016, 131.67764282226562, 136.91445922851562, 142.15127563476562, 147.38807678222656, 152.62489318847656, 157.86170959472656, 163.0985107421875, 168.3353271484375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 7.0, 17.0, 13.0, 18.0, 22.0, 21.0, 35.0, 41.0, 45.0, 43.0, 66.0, 79.0, 79.0, 101.0, 82.0, 57.0, 60.0, 30.0, 47.0, 36.0, 19.0, 21.0, 20.0, 15.0, 9.0, 11.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-160.51768493652344, -156.69285583496094, -152.8680419921875, -149.043212890625, -145.21839904785156, -141.39356994628906, -137.56875610351562, -133.74392700195312, -129.91909790039062, -126.09427642822266, -122.26945495605469, -118.44462585449219, -114.61980438232422, -110.79498291015625, -106.97016143798828, -103.14533996582031, -99.32052612304688, -95.4957046508789, -91.67088317871094, -87.84605407714844, -84.02123260498047, -80.1964111328125, -76.37158966064453, -72.54676818847656, -68.72193908691406, -64.8971176147461, -61.07229232788086, -57.24747085571289, -53.42264938354492, -49.59782409667969, -45.77300262451172, -41.94818115234375, -38.12335968017578, -34.29853820800781, -30.47371482849121, -26.64889144897461, -22.82406997680664, -18.99924659729004, -15.174423217773438, -11.349601745605469, -7.524778366088867, -3.699955701828003, 0.12486696243286133, 3.9496898651123047, 7.77451229095459, 11.599334716796875, 15.424158096313477, 19.248979568481445, 23.073802947998047, 26.89862632751465, 30.723447799682617, 34.54827117919922, 38.37309265136719, 42.197914123535156, 46.02273941040039, 49.84756088256836, 53.672386169433594, 57.49720764160156, 61.3220329284668, 65.1468505859375, 68.9716796875, 72.79650115966797, 76.62132263183594, 80.4461441040039, 84.27096557617188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 26.0, 26.0, 41.0, 99.0, 174.0, 365.0, 1067.0, 3576.0, 24636.0, 1001600.0, 3099298.0, 55508.0, 5590.0, 1374.0, 479.0, 210.0, 85.0, 48.0, 25.0, 16.0, 5.0, 8.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.28125, -19.6083984375, -18.935546875, -18.2626953125, -17.58984375, -16.9169921875, -16.244140625, -15.5712890625, -14.8984375, -14.2255859375, -13.552734375, -12.8798828125, -12.20703125, -11.5341796875, -10.861328125, -10.1884765625, -9.515625, -8.8427734375, -8.169921875, -7.4970703125, -6.82421875, -6.1513671875, -5.478515625, -4.8056640625, -4.1328125, -3.4599609375, -2.787109375, -2.1142578125, -1.44140625, -0.7685546875, -0.095703125, 0.5771484375, 1.25, 1.9228515625, 2.595703125, 3.2685546875, 3.94140625, 4.6142578125, 5.287109375, 5.9599609375, 6.6328125, 7.3056640625, 7.978515625, 8.6513671875, 9.32421875, 9.9970703125, 10.669921875, 11.3427734375, 12.015625, 12.6884765625, 13.361328125, 14.0341796875, 14.70703125, 15.3798828125, 16.052734375, 16.7255859375, 17.3984375, 18.0712890625, 18.744140625, 19.4169921875, 20.08984375, 20.7626953125, 21.435546875, 22.1083984375, 22.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 8.0, 2.0, 8.0, 10.0, 12.0, 13.0, 14.0, 24.0, 25.0, 36.0, 47.0, 51.0, 38.0, 49.0, 50.0, 61.0, 67.0, 72.0, 55.0, 48.0, 58.0, 62.0, 38.0, 27.0, 22.0, 28.0, 24.0, 18.0, 10.0, 7.0, 7.0, 8.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.88671875, -6.71258544921875, -6.5384521484375, -6.36431884765625, -6.190185546875, -6.01605224609375, -5.8419189453125, -5.66778564453125, -5.49365234375, -5.31951904296875, -5.1453857421875, -4.97125244140625, -4.797119140625, -4.62298583984375, -4.4488525390625, -4.27471923828125, -4.1005859375, -3.92645263671875, -3.7523193359375, -3.57818603515625, -3.404052734375, -3.22991943359375, -3.0557861328125, -2.88165283203125, -2.70751953125, -2.53338623046875, -2.3592529296875, -2.18511962890625, -2.010986328125, -1.83685302734375, -1.6627197265625, -1.48858642578125, -1.314453125, -1.14031982421875, -0.9661865234375, -0.79205322265625, -0.617919921875, -0.44378662109375, -0.2696533203125, -0.09552001953125, 0.07861328125, 0.25274658203125, 0.4268798828125, 0.60101318359375, 0.775146484375, 0.94927978515625, 1.1234130859375, 1.29754638671875, 1.4716796875, 1.64581298828125, 1.8199462890625, 1.99407958984375, 2.168212890625, 2.34234619140625, 2.5164794921875, 2.69061279296875, 2.86474609375, 3.03887939453125, 3.2130126953125, 3.38714599609375, 3.561279296875, 3.73541259765625, 3.9095458984375, 4.08367919921875, 4.2578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 10.0, 10.0, 12.0, 15.0, 24.0, 36.0, 45.0, 40.0, 86.0, 157.0, 282.0, 603.0, 1486.0, 3395.0, 9498.0, 30531.0, 128485.0, 1171253.0, 2531952.0, 243601.0, 49212.0, 14454.0, 5039.0, 2094.0, 908.0, 462.0, 239.0, 108.0, 95.0, 40.0, 37.0, 27.0, 15.0, 7.0, 7.0, 1.0, 6.0, 3.0, 2.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0625, -10.73876953125, -10.4150390625, -10.09130859375, -9.767578125, -9.44384765625, -9.1201171875, -8.79638671875, -8.47265625, -8.14892578125, -7.8251953125, -7.50146484375, -7.177734375, -6.85400390625, -6.5302734375, -6.20654296875, -5.8828125, -5.55908203125, -5.2353515625, -4.91162109375, -4.587890625, -4.26416015625, -3.9404296875, -3.61669921875, -3.29296875, -2.96923828125, -2.6455078125, -2.32177734375, -1.998046875, -1.67431640625, -1.3505859375, -1.02685546875, -0.703125, -0.37939453125, -0.0556640625, 0.26806640625, 0.591796875, 0.91552734375, 1.2392578125, 1.56298828125, 1.88671875, 2.21044921875, 2.5341796875, 2.85791015625, 3.181640625, 3.50537109375, 3.8291015625, 4.15283203125, 4.4765625, 4.80029296875, 5.1240234375, 5.44775390625, 5.771484375, 6.09521484375, 6.4189453125, 6.74267578125, 7.06640625, 7.39013671875, 7.7138671875, 8.03759765625, 8.361328125, 8.68505859375, 9.0087890625, 9.33251953125, 9.65625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 5.0, 6.0, 12.0, 7.0, 14.0, 13.0, 21.0, 37.0, 30.0, 34.0, 63.0, 101.0, 151.0, 237.0, 308.0, 421.0, 629.0, 590.0, 462.0, 270.0, 201.0, 117.0, 84.0, 68.0, 40.0, 28.0, 27.0, 27.0, 23.0, 13.0, 5.0, 8.0, 2.0, 7.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1484375, -9.7969970703125, -9.445556640625, -9.0941162109375, -8.74267578125, -8.3912353515625, -8.039794921875, -7.6883544921875, -7.3369140625, -6.9854736328125, -6.634033203125, -6.2825927734375, -5.93115234375, -5.5797119140625, -5.228271484375, -4.8768310546875, -4.525390625, -4.1739501953125, -3.822509765625, -3.4710693359375, -3.11962890625, -2.7681884765625, -2.416748046875, -2.0653076171875, -1.7138671875, -1.3624267578125, -1.010986328125, -0.6595458984375, -0.30810546875, 0.0433349609375, 0.394775390625, 0.7462158203125, 1.09765625, 1.4490966796875, 1.800537109375, 2.1519775390625, 2.50341796875, 2.8548583984375, 3.206298828125, 3.5577392578125, 3.9091796875, 4.2606201171875, 4.612060546875, 4.9635009765625, 5.31494140625, 5.6663818359375, 6.017822265625, 6.3692626953125, 6.720703125, 7.0721435546875, 7.423583984375, 7.7750244140625, 8.12646484375, 8.4779052734375, 8.829345703125, 9.1807861328125, 9.5322265625, 9.8836669921875, 10.235107421875, 10.5865478515625, 10.93798828125, 11.2894287109375, 11.640869140625, 11.9923095703125, 12.34375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 30.0, 114.0, 323.0, 322.0, 141.0, 35.0, 15.0, 7.0, 3.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-246.8511962890625, -238.32566833496094, -229.80014038085938, -221.2746124267578, -212.74908447265625, -204.2235565185547, -195.69802856445312, -187.1724853515625, -178.64697265625, -170.12144470214844, -161.59591674804688, -153.0703887939453, -144.54486083984375, -136.0193328857422, -127.4937973022461, -118.96826934814453, -110.44273376464844, -101.91720581054688, -93.39167785644531, -84.86614990234375, -76.34062194824219, -67.81509399414062, -59.28955841064453, -50.76403045654297, -42.238502502441406, -33.712974548339844, -25.18744468688965, -16.661914825439453, -8.13638687133789, 0.3891410827636719, 8.9146728515625, 17.440200805664062, 25.965728759765625, 34.49125671386719, 43.01678466796875, 51.54231643676758, 60.06784439086914, 68.59336853027344, 77.11890411376953, 85.6444320678711, 94.16996002197266, 102.69548797607422, 111.22101593017578, 119.74655151367188, 128.27207946777344, 136.797607421875, 145.32313537597656, 153.84866333007812, 162.3741912841797, 170.89971923828125, 179.4252471923828, 187.95077514648438, 196.47630310058594, 205.0018310546875, 213.52737426757812, 222.05288696289062, 230.57843017578125, 239.1039581298828, 247.62948608398438, 256.155029296875, 264.6805419921875, 273.2060852050781, 281.7315979003906, 290.25714111328125, 298.78265380859375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 11.0, 4.0, 5.0, 17.0, 11.0, 17.0, 9.0, 17.0, 21.0, 20.0, 30.0, 30.0, 26.0, 37.0, 38.0, 33.0, 45.0, 47.0, 42.0, 49.0, 49.0, 43.0, 54.0, 43.0, 39.0, 44.0, 33.0, 27.0, 36.0, 28.0, 14.0, 18.0, 10.0, 7.0, 15.0, 2.0, 11.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-57.165855407714844, -55.31768035888672, -53.469505310058594, -51.62133026123047, -49.773155212402344, -47.92498016357422, -46.076805114746094, -44.22863006591797, -42.380455017089844, -40.53227996826172, -38.684104919433594, -36.83592987060547, -34.987754821777344, -33.13957977294922, -31.29140281677246, -29.443227767944336, -27.595050811767578, -25.746875762939453, -23.898700714111328, -22.050525665283203, -20.202350616455078, -18.354175567626953, -16.505998611450195, -14.65782356262207, -12.809648513793945, -10.96147346496582, -9.113298416137695, -7.265122413635254, -5.416947364807129, -3.568772315979004, -1.7205963134765625, 0.1275787353515625, 1.9757537841796875, 3.8239290714263916, 5.672104358673096, 7.520279884338379, 9.368454933166504, 11.216629981994629, 13.06480598449707, 14.912981033325195, 16.76115608215332, 18.609331130981445, 20.45750617980957, 22.305683135986328, 24.153858184814453, 26.002033233642578, 27.850208282470703, 29.698383331298828, 31.546558380126953, 33.39473342895508, 35.2429084777832, 37.09108352661133, 38.93925857543945, 40.78743362426758, 42.63561248779297, 44.483787536621094, 46.33196258544922, 48.180137634277344, 50.02831268310547, 51.876487731933594, 53.72466278076172, 55.572837829589844, 57.42101287841797, 59.269187927246094, 61.11736297607422]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 10.0, 6.0, 15.0, 23.0, 29.0, 37.0, 63.0, 93.0, 120.0, 244.0, 376.0, 655.0, 1026.0, 1838.0, 3571.0, 7530.0, 16480.0, 38121.0, 91035.0, 220679.0, 351571.0, 181054.0, 75141.0, 31649.0, 13792.0, 6343.0, 3030.0, 1611.0, 908.0, 543.0, 360.0, 200.0, 132.0, 79.0, 44.0, 40.0, 26.0, 20.0, 15.0, 9.0, 8.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.953125, -9.655029296875, -9.35693359375, -9.058837890625, -8.7607421875, -8.462646484375, -8.16455078125, -7.866455078125, -7.568359375, -7.270263671875, -6.97216796875, -6.674072265625, -6.3759765625, -6.077880859375, -5.77978515625, -5.481689453125, -5.18359375, -4.885498046875, -4.58740234375, -4.289306640625, -3.9912109375, -3.693115234375, -3.39501953125, -3.096923828125, -2.798828125, -2.500732421875, -2.20263671875, -1.904541015625, -1.6064453125, -1.308349609375, -1.01025390625, -0.712158203125, -0.4140625, -0.115966796875, 0.18212890625, 0.480224609375, 0.7783203125, 1.076416015625, 1.37451171875, 1.672607421875, 1.970703125, 2.268798828125, 2.56689453125, 2.864990234375, 3.1630859375, 3.461181640625, 3.75927734375, 4.057373046875, 4.35546875, 4.653564453125, 4.95166015625, 5.249755859375, 5.5478515625, 5.845947265625, 6.14404296875, 6.442138671875, 6.740234375, 7.038330078125, 7.33642578125, 7.634521484375, 7.9326171875, 8.230712890625, 8.52880859375, 8.826904296875, 9.125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 10.0, 10.0, 15.0, 17.0, 20.0, 28.0, 32.0, 38.0, 33.0, 47.0, 56.0, 55.0, 42.0, 61.0, 55.0, 63.0, 62.0, 55.0, 48.0, 50.0, 40.0, 27.0, 29.0, 28.0, 16.0, 20.0, 7.0, 11.0, 8.0, 5.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.6875, -6.5133056640625, -6.339111328125, -6.1649169921875, -5.99072265625, -5.8165283203125, -5.642333984375, -5.4681396484375, -5.2939453125, -5.1197509765625, -4.945556640625, -4.7713623046875, -4.59716796875, -4.4229736328125, -4.248779296875, -4.0745849609375, -3.900390625, -3.7261962890625, -3.552001953125, -3.3778076171875, -3.20361328125, -3.0294189453125, -2.855224609375, -2.6810302734375, -2.5068359375, -2.3326416015625, -2.158447265625, -1.9842529296875, -1.81005859375, -1.6358642578125, -1.461669921875, -1.2874755859375, -1.11328125, -0.9390869140625, -0.764892578125, -0.5906982421875, -0.41650390625, -0.2423095703125, -0.068115234375, 0.1060791015625, 0.2802734375, 0.4544677734375, 0.628662109375, 0.8028564453125, 0.97705078125, 1.1512451171875, 1.325439453125, 1.4996337890625, 1.673828125, 1.8480224609375, 2.022216796875, 2.1964111328125, 2.37060546875, 2.5447998046875, 2.718994140625, 2.8931884765625, 3.0673828125, 3.2415771484375, 3.415771484375, 3.5899658203125, 3.76416015625, 3.9383544921875, 4.112548828125, 4.2867431640625, 4.4609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 14.0, 12.0, 18.0, 26.0, 24.0, 42.0, 77.0, 94.0, 139.0, 241.0, 374.0, 688.0, 1407.0, 3458.0, 15355.0, 238245.0, 744950.0, 34085.0, 5227.0, 1859.0, 866.0, 467.0, 286.0, 207.0, 103.0, 74.0, 53.0, 34.0, 31.0, 19.0, 13.0, 16.0, 6.0, 10.0, 7.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.09375, -26.0966796875, -25.099609375, -24.1025390625, -23.10546875, -22.1083984375, -21.111328125, -20.1142578125, -19.1171875, -18.1201171875, -17.123046875, -16.1259765625, -15.12890625, -14.1318359375, -13.134765625, -12.1376953125, -11.140625, -10.1435546875, -9.146484375, -8.1494140625, -7.15234375, -6.1552734375, -5.158203125, -4.1611328125, -3.1640625, -2.1669921875, -1.169921875, -0.1728515625, 0.82421875, 1.8212890625, 2.818359375, 3.8154296875, 4.8125, 5.8095703125, 6.806640625, 7.8037109375, 8.80078125, 9.7978515625, 10.794921875, 11.7919921875, 12.7890625, 13.7861328125, 14.783203125, 15.7802734375, 16.77734375, 17.7744140625, 18.771484375, 19.7685546875, 20.765625, 21.7626953125, 22.759765625, 23.7568359375, 24.75390625, 25.7509765625, 26.748046875, 27.7451171875, 28.7421875, 29.7392578125, 30.736328125, 31.7333984375, 32.73046875, 33.7275390625, 34.724609375, 35.7216796875, 36.71875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 10.0, 14.0, 14.0, 14.0, 22.0, 13.0, 32.0, 27.0, 34.0, 39.0, 35.0, 47.0, 40.0, 40.0, 51.0, 49.0, 48.0, 48.0, 53.0, 39.0, 44.0, 42.0, 44.0, 26.0, 20.0, 30.0, 24.0, 18.0, 16.0, 15.0, 9.0, 11.0, 6.0, 4.0, 9.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-22.859375, -22.209716796875, -21.56005859375, -20.910400390625, -20.2607421875, -19.611083984375, -18.96142578125, -18.311767578125, -17.662109375, -17.012451171875, -16.36279296875, -15.713134765625, -15.0634765625, -14.413818359375, -13.76416015625, -13.114501953125, -12.46484375, -11.815185546875, -11.16552734375, -10.515869140625, -9.8662109375, -9.216552734375, -8.56689453125, -7.917236328125, -7.267578125, -6.617919921875, -5.96826171875, -5.318603515625, -4.6689453125, -4.019287109375, -3.36962890625, -2.719970703125, -2.0703125, -1.420654296875, -0.77099609375, -0.121337890625, 0.5283203125, 1.177978515625, 1.82763671875, 2.477294921875, 3.126953125, 3.776611328125, 4.42626953125, 5.075927734375, 5.7255859375, 6.375244140625, 7.02490234375, 7.674560546875, 8.32421875, 8.973876953125, 9.62353515625, 10.273193359375, 10.9228515625, 11.572509765625, 12.22216796875, 12.871826171875, 13.521484375, 14.171142578125, 14.82080078125, 15.470458984375, 16.1201171875, 16.769775390625, 17.41943359375, 18.069091796875, 18.71875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 10.0, 11.0, 23.0, 22.0, 31.0, 51.0, 77.0, 149.0, 263.0, 527.0, 1732.0, 7142.0, 56543.0, 784221.0, 176974.0, 16054.0, 2977.0, 923.0, 340.0, 186.0, 98.0, 60.0, 29.0, 17.0, 16.0, 17.0, 9.0, 11.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.21875, -10.9046630859375, -10.590576171875, -10.2764892578125, -9.96240234375, -9.6483154296875, -9.334228515625, -9.0201416015625, -8.7060546875, -8.3919677734375, -8.077880859375, -7.7637939453125, -7.44970703125, -7.1356201171875, -6.821533203125, -6.5074462890625, -6.193359375, -5.8792724609375, -5.565185546875, -5.2510986328125, -4.93701171875, -4.6229248046875, -4.308837890625, -3.9947509765625, -3.6806640625, -3.3665771484375, -3.052490234375, -2.7384033203125, -2.42431640625, -2.1102294921875, -1.796142578125, -1.4820556640625, -1.16796875, -0.8538818359375, -0.539794921875, -0.2257080078125, 0.08837890625, 0.4024658203125, 0.716552734375, 1.0306396484375, 1.3447265625, 1.6588134765625, 1.972900390625, 2.2869873046875, 2.60107421875, 2.9151611328125, 3.229248046875, 3.5433349609375, 3.857421875, 4.1715087890625, 4.485595703125, 4.7996826171875, 5.11376953125, 5.4278564453125, 5.741943359375, 6.0560302734375, 6.3701171875, 6.6842041015625, 6.998291015625, 7.3123779296875, 7.62646484375, 7.9405517578125, 8.254638671875, 8.5687255859375, 8.8828125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 7.0, 13.0, 18.0, 31.0, 33.0, 52.0, 55.0, 98.0, 165.0, 182.0, 79.0, 75.0, 49.0, 23.0, 32.0, 15.0, 16.0, 17.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002140045166015625, -0.0020686984062194824, -0.00199735164642334, -0.0019260048866271973, -0.0018546581268310547, -0.0017833113670349121, -0.0017119646072387695, -0.001640617847442627, -0.0015692710876464844, -0.0014979243278503418, -0.0014265775680541992, -0.0013552308082580566, -0.001283884048461914, -0.0012125372886657715, -0.001141190528869629, -0.0010698437690734863, -0.0009984970092773438, -0.0009271502494812012, -0.0008558034896850586, -0.000784456729888916, -0.0007131099700927734, -0.0006417632102966309, -0.0005704164505004883, -0.0004990696907043457, -0.0004277229309082031, -0.00035637617111206055, -0.00028502941131591797, -0.0002136826515197754, -0.0001423358917236328, -7.098913192749023e-05, 3.5762786865234375e-07, 7.170438766479492e-05, 0.0001430511474609375, 0.00021439790725708008, 0.00028574466705322266, 0.00035709142684936523, 0.0004284381866455078, 0.0004997849464416504, 0.000571131706237793, 0.0006424784660339355, 0.0007138252258300781, 0.0007851719856262207, 0.0008565187454223633, 0.0009278655052185059, 0.0009992122650146484, 0.001070559024810791, 0.0011419057846069336, 0.0012132525444030762, 0.0012845993041992188, 0.0013559460639953613, 0.001427292823791504, 0.0014986395835876465, 0.001569986343383789, 0.0016413331031799316, 0.0017126798629760742, 0.0017840266227722168, 0.0018553733825683594, 0.001926720142364502, 0.0019980669021606445, 0.002069413661956787, 0.0021407604217529297, 0.0022121071815490723, 0.002283453941345215, 0.0023548007011413574, 0.0024261474609375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 7.0, 10.0, 22.0, 25.0, 32.0, 33.0, 73.0, 113.0, 188.0, 363.0, 685.0, 1412.0, 3950.0, 15950.0, 136435.0, 797670.0, 74790.0, 11315.0, 3037.0, 1130.0, 563.0, 283.0, 147.0, 99.0, 57.0, 52.0, 26.0, 19.0, 17.0, 19.0, 6.0, 3.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.5234375, -8.242919921875, -7.96240234375, -7.681884765625, -7.4013671875, -7.120849609375, -6.84033203125, -6.559814453125, -6.279296875, -5.998779296875, -5.71826171875, -5.437744140625, -5.1572265625, -4.876708984375, -4.59619140625, -4.315673828125, -4.03515625, -3.754638671875, -3.47412109375, -3.193603515625, -2.9130859375, -2.632568359375, -2.35205078125, -2.071533203125, -1.791015625, -1.510498046875, -1.22998046875, -0.949462890625, -0.6689453125, -0.388427734375, -0.10791015625, 0.172607421875, 0.453125, 0.733642578125, 1.01416015625, 1.294677734375, 1.5751953125, 1.855712890625, 2.13623046875, 2.416748046875, 2.697265625, 2.977783203125, 3.25830078125, 3.538818359375, 3.8193359375, 4.099853515625, 4.38037109375, 4.660888671875, 4.94140625, 5.221923828125, 5.50244140625, 5.782958984375, 6.0634765625, 6.343994140625, 6.62451171875, 6.905029296875, 7.185546875, 7.466064453125, 7.74658203125, 8.027099609375, 8.3076171875, 8.588134765625, 8.86865234375, 9.149169921875, 9.4296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 6.0, 2.0, 4.0, 6.0, 8.0, 12.0, 10.0, 16.0, 26.0, 22.0, 21.0, 27.0, 37.0, 36.0, 48.0, 54.0, 52.0, 71.0, 77.0, 72.0, 46.0, 54.0, 47.0, 37.0, 42.0, 29.0, 23.0, 15.0, 24.0, 12.0, 8.0, 5.0, 12.0, 7.0, 13.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.5234375, -4.37896728515625, -4.2344970703125, -4.09002685546875, -3.945556640625, -3.80108642578125, -3.6566162109375, -3.51214599609375, -3.36767578125, -3.22320556640625, -3.0787353515625, -2.93426513671875, -2.789794921875, -2.64532470703125, -2.5008544921875, -2.35638427734375, -2.2119140625, -2.06744384765625, -1.9229736328125, -1.77850341796875, -1.634033203125, -1.48956298828125, -1.3450927734375, -1.20062255859375, -1.05615234375, -0.91168212890625, -0.7672119140625, -0.62274169921875, -0.478271484375, -0.33380126953125, -0.1893310546875, -0.04486083984375, 0.099609375, 0.24407958984375, 0.3885498046875, 0.53302001953125, 0.677490234375, 0.82196044921875, 0.9664306640625, 1.11090087890625, 1.25537109375, 1.39984130859375, 1.5443115234375, 1.68878173828125, 1.833251953125, 1.97772216796875, 2.1221923828125, 2.26666259765625, 2.4111328125, 2.55560302734375, 2.7000732421875, 2.84454345703125, 2.989013671875, 3.13348388671875, 3.2779541015625, 3.42242431640625, 3.56689453125, 3.71136474609375, 3.8558349609375, 4.00030517578125, 4.144775390625, 4.28924560546875, 4.4337158203125, 4.57818603515625, 4.72265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 7.0, 13.0, 15.0, 35.0, 79.0, 123.0, 205.0, 244.0, 124.0, 81.0, 37.0, 14.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.18331909179688, -122.13169860839844, -117.08008575439453, -112.0284652709961, -106.97685241699219, -101.92523193359375, -96.87361145019531, -91.8219985961914, -86.7703857421875, -81.71876525878906, -76.66715240478516, -71.61553192138672, -66.56391906738281, -61.512298583984375, -56.4606819152832, -51.40906524658203, -46.357444763183594, -41.30582809448242, -36.25421142578125, -31.202592849731445, -26.150976181030273, -21.0993595123291, -16.047740936279297, -10.996124267578125, -5.944507598876953, -0.892890453338623, 4.158726692199707, 9.210344314575195, 14.261960983276367, 19.31357765197754, 24.365196228027344, 29.416812896728516, 34.46842956542969, 39.52004623413086, 44.57166290283203, 49.62328338623047, 54.674896240234375, 59.72651672363281, 64.77813720703125, 69.82975006103516, 74.88136291503906, 79.9329833984375, 84.9845962524414, 90.03621673583984, 95.08782958984375, 100.13945007324219, 105.19107055664062, 110.24268341064453, 115.29430389404297, 120.3459243774414, 125.39753723144531, 130.44915771484375, 135.5007781982422, 140.55238342285156, 145.60400390625, 150.65562438964844, 155.70724487304688, 160.7588653564453, 165.81048583984375, 170.86209106445312, 175.91371154785156, 180.96533203125, 186.01695251464844, 191.06857299804688, 196.12017822265625]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 15.0, 9.0, 12.0, 8.0, 17.0, 21.0, 26.0, 20.0, 31.0, 54.0, 36.0, 50.0, 58.0, 83.0, 78.0, 91.0, 65.0, 39.0, 33.0, 33.0, 34.0, 27.0, 26.0, 23.0, 25.0, 22.0, 13.0, 12.0, 6.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-77.29074096679688, -74.36323547363281, -71.43572998046875, -68.50822448730469, -65.58071899414062, -62.65321350097656, -59.7257080078125, -56.79820251464844, -53.870697021484375, -50.94319152832031, -48.01568603515625, -45.08818054199219, -42.160675048828125, -39.23316955566406, -36.3056640625, -33.37815856933594, -30.45065689086914, -27.523151397705078, -24.595645904541016, -21.668140411376953, -18.74063491821289, -15.813130378723145, -12.885625839233398, -9.958120346069336, -7.030614852905273, -4.103109359741211, -1.1756043434143066, 1.7519006729125977, 4.67940616607666, 7.606911659240723, 10.534416198730469, 13.461921691894531, 16.389427185058594, 19.316932678222656, 22.24443817138672, 25.17194366455078, 28.099449157714844, 31.026954650878906, 33.95446014404297, 36.88196563720703, 39.809471130371094, 42.736976623535156, 45.66448211669922, 48.59198760986328, 51.519493103027344, 54.446998596191406, 57.37450408935547, 60.30200958251953, 63.22951126098633, 66.15701293945312, 69.08451843261719, 72.01202392578125, 74.93952941894531, 77.86703491210938, 80.79454040527344, 83.7220458984375, 86.64955139160156, 89.57705688476562, 92.50456237792969, 95.43206787109375, 98.35957336425781, 101.28707885742188, 104.21458435058594, 107.14208984375, 110.06959533691406]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 15.0, 19.0, 33.0, 58.0, 80.0, 174.0, 324.0, 647.0, 1454.0, 3814.0, 12065.0, 51723.0, 484646.0, 3132719.0, 439709.0, 49175.0, 11404.0, 3646.0, 1339.0, 574.0, 295.0, 156.0, 82.0, 44.0, 29.0, 19.0, 13.0, 10.0, 5.0, 2.0, 6.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.90087890625, -7.5908203125, -7.28076171875, -6.970703125, -6.66064453125, -6.3505859375, -6.04052734375, -5.73046875, -5.42041015625, -5.1103515625, -4.80029296875, -4.490234375, -4.18017578125, -3.8701171875, -3.56005859375, -3.25, -2.93994140625, -2.6298828125, -2.31982421875, -2.009765625, -1.69970703125, -1.3896484375, -1.07958984375, -0.76953125, -0.45947265625, -0.1494140625, 0.16064453125, 0.470703125, 0.78076171875, 1.0908203125, 1.40087890625, 1.7109375, 2.02099609375, 2.3310546875, 2.64111328125, 2.951171875, 3.26123046875, 3.5712890625, 3.88134765625, 4.19140625, 4.50146484375, 4.8115234375, 5.12158203125, 5.431640625, 5.74169921875, 6.0517578125, 6.36181640625, 6.671875, 6.98193359375, 7.2919921875, 7.60205078125, 7.912109375, 8.22216796875, 8.5322265625, 8.84228515625, 9.15234375, 9.46240234375, 9.7724609375, 10.08251953125, 10.392578125, 10.70263671875, 11.0126953125, 11.32275390625, 11.6328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 9.0, 10.0, 18.0, 24.0, 24.0, 21.0, 34.0, 37.0, 42.0, 61.0, 76.0, 51.0, 57.0, 61.0, 54.0, 60.0, 64.0, 61.0, 46.0, 32.0, 35.0, 20.0, 28.0, 16.0, 14.0, 4.0, 13.0, 11.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -3.97509765625, -3.7900390625, -3.60498046875, -3.419921875, -3.23486328125, -3.0498046875, -2.86474609375, -2.6796875, -2.49462890625, -2.3095703125, -2.12451171875, -1.939453125, -1.75439453125, -1.5693359375, -1.38427734375, -1.19921875, -1.01416015625, -0.8291015625, -0.64404296875, -0.458984375, -0.27392578125, -0.0888671875, 0.09619140625, 0.28125, 0.46630859375, 0.6513671875, 0.83642578125, 1.021484375, 1.20654296875, 1.3916015625, 1.57666015625, 1.76171875, 1.94677734375, 2.1318359375, 2.31689453125, 2.501953125, 2.68701171875, 2.8720703125, 3.05712890625, 3.2421875, 3.42724609375, 3.6123046875, 3.79736328125, 3.982421875, 4.16748046875, 4.3525390625, 4.53759765625, 4.72265625, 4.90771484375, 5.0927734375, 5.27783203125, 5.462890625, 5.64794921875, 5.8330078125, 6.01806640625, 6.203125, 6.38818359375, 6.5732421875, 6.75830078125, 6.943359375, 7.12841796875, 7.3134765625, 7.49853515625, 7.68359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 7.0, 16.0, 38.0, 65.0, 107.0, 231.0, 671.0, 2224.0, 11850.0, 132969.0, 3788168.0, 235660.0, 17740.0, 3082.0, 907.0, 296.0, 132.0, 63.0, 24.0, 8.0, 11.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.421875, -16.766357421875, -16.11083984375, -15.455322265625, -14.7998046875, -14.144287109375, -13.48876953125, -12.833251953125, -12.177734375, -11.522216796875, -10.86669921875, -10.211181640625, -9.5556640625, -8.900146484375, -8.24462890625, -7.589111328125, -6.93359375, -6.278076171875, -5.62255859375, -4.967041015625, -4.3115234375, -3.656005859375, -3.00048828125, -2.344970703125, -1.689453125, -1.033935546875, -0.37841796875, 0.277099609375, 0.9326171875, 1.588134765625, 2.24365234375, 2.899169921875, 3.5546875, 4.210205078125, 4.86572265625, 5.521240234375, 6.1767578125, 6.832275390625, 7.48779296875, 8.143310546875, 8.798828125, 9.454345703125, 10.10986328125, 10.765380859375, 11.4208984375, 12.076416015625, 12.73193359375, 13.387451171875, 14.04296875, 14.698486328125, 15.35400390625, 16.009521484375, 16.6650390625, 17.320556640625, 17.97607421875, 18.631591796875, 19.287109375, 19.942626953125, 20.59814453125, 21.253662109375, 21.9091796875, 22.564697265625, 23.22021484375, 23.875732421875, 24.53125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 13.0, 17.0, 20.0, 36.0, 62.0, 81.0, 123.0, 279.0, 527.0, 962.0, 866.0, 461.0, 224.0, 127.0, 82.0, 59.0, 30.0, 26.0, 23.0, 14.0, 12.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.734375, -17.23974609375, -16.7451171875, -16.25048828125, -15.755859375, -15.26123046875, -14.7666015625, -14.27197265625, -13.77734375, -13.28271484375, -12.7880859375, -12.29345703125, -11.798828125, -11.30419921875, -10.8095703125, -10.31494140625, -9.8203125, -9.32568359375, -8.8310546875, -8.33642578125, -7.841796875, -7.34716796875, -6.8525390625, -6.35791015625, -5.86328125, -5.36865234375, -4.8740234375, -4.37939453125, -3.884765625, -3.39013671875, -2.8955078125, -2.40087890625, -1.90625, -1.41162109375, -0.9169921875, -0.42236328125, 0.072265625, 0.56689453125, 1.0615234375, 1.55615234375, 2.05078125, 2.54541015625, 3.0400390625, 3.53466796875, 4.029296875, 4.52392578125, 5.0185546875, 5.51318359375, 6.0078125, 6.50244140625, 6.9970703125, 7.49169921875, 7.986328125, 8.48095703125, 8.9755859375, 9.47021484375, 9.96484375, 10.45947265625, 10.9541015625, 11.44873046875, 11.943359375, 12.43798828125, 12.9326171875, 13.42724609375, 13.921875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 8.0, 26.0, 82.0, 198.0, 315.0, 224.0, 87.0, 29.0, 14.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.4720458984375, -174.14645385742188, -167.82086181640625, -161.49526977539062, -155.169677734375, -148.84408569335938, -142.51849365234375, -136.19290161132812, -129.8673095703125, -123.54171752929688, -117.21612548828125, -110.89053344726562, -104.56494140625, -98.23934936523438, -91.91375732421875, -85.58816528320312, -79.2625732421875, -72.93698120117188, -66.61138916015625, -60.285797119140625, -53.960205078125, -47.634613037109375, -41.30902099609375, -34.983428955078125, -28.6578369140625, -22.332244873046875, -16.00665283203125, -9.681060791015625, -3.35546875, 2.970123291015625, 9.29571533203125, 15.621307373046875, 21.946914672851562, 28.272506713867188, 34.59809875488281, 40.92369079589844, 47.24928283691406, 53.57487487792969, 59.90046691894531, 66.22605895996094, 72.55165100097656, 78.87724304199219, 85.20283508300781, 91.52842712402344, 97.85401916503906, 104.17961120605469, 110.50520324707031, 116.83079528808594, 123.15638732910156, 129.4819793701172, 135.8075714111328, 142.13316345214844, 148.45875549316406, 154.7843475341797, 161.1099395751953, 167.43553161621094, 173.76112365722656, 180.0867156982422, 186.4123077392578, 192.73789978027344, 199.06349182128906, 205.3890838623047, 211.7146759033203, 218.04026794433594, 224.36585998535156]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 2.0, 6.0, 8.0, 10.0, 16.0, 23.0, 19.0, 25.0, 26.0, 39.0, 26.0, 34.0, 38.0, 52.0, 50.0, 49.0, 67.0, 39.0, 42.0, 54.0, 49.0, 48.0, 50.0, 34.0, 29.0, 24.0, 24.0, 27.0, 15.0, 21.0, 11.0, 6.0, 6.0, 7.0, 4.0, 3.0, 2.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.355377197265625, -60.53413009643555, -58.712886810302734, -56.891639709472656, -55.07039260864258, -53.2491455078125, -51.42790222167969, -49.60665512084961, -47.78540802001953, -45.96416091918945, -44.14291763305664, -42.32167053222656, -40.500423431396484, -38.679176330566406, -36.857933044433594, -35.036685943603516, -33.2154426574707, -31.394197463989258, -29.57295036315918, -27.751705169677734, -25.930458068847656, -24.10921287536621, -22.287967681884766, -20.466720581054688, -18.645475387573242, -16.824230194091797, -15.002983093261719, -13.181737899780273, -11.360491752624512, -9.53924560546875, -7.718000411987305, -5.896754264831543, -4.075504302978516, -2.254258394241333, -0.4330124855041504, 1.3882331848144531, 3.209479331970215, 5.030725479125977, 6.851970672607422, 8.673216819763184, 10.494462966918945, 12.315709114074707, 14.136955261230469, 15.958200454711914, 17.77944564819336, 19.600692749023438, 21.421937942504883, 23.243183135986328, 25.064430236816406, 26.88567543029785, 28.70692253112793, 30.528167724609375, 32.34941482543945, 34.17066192626953, 35.991905212402344, 37.81315231323242, 39.6343994140625, 41.45564651489258, 43.27688980102539, 45.09813690185547, 46.91938400268555, 48.740631103515625, 50.56187438964844, 52.383121490478516, 54.20436477661133]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 4.0, 7.0, 8.0, 17.0, 24.0, 36.0, 57.0, 77.0, 92.0, 190.0, 268.0, 403.0, 724.0, 1280.0, 2298.0, 4203.0, 8083.0, 16293.0, 35068.0, 82466.0, 218229.0, 365207.0, 182493.0, 70507.0, 30319.0, 14310.0, 7268.0, 3697.0, 2020.0, 1124.0, 661.0, 387.0, 248.0, 151.0, 101.0, 70.0, 45.0, 24.0, 13.0, 20.0, 26.0, 8.0, 0.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.948486328125, -7.67822265625, -7.407958984375, -7.1376953125, -6.867431640625, -6.59716796875, -6.326904296875, -6.056640625, -5.786376953125, -5.51611328125, -5.245849609375, -4.9755859375, -4.705322265625, -4.43505859375, -4.164794921875, -3.89453125, -3.624267578125, -3.35400390625, -3.083740234375, -2.8134765625, -2.543212890625, -2.27294921875, -2.002685546875, -1.732421875, -1.462158203125, -1.19189453125, -0.921630859375, -0.6513671875, -0.381103515625, -0.11083984375, 0.159423828125, 0.4296875, 0.699951171875, 0.97021484375, 1.240478515625, 1.5107421875, 1.781005859375, 2.05126953125, 2.321533203125, 2.591796875, 2.862060546875, 3.13232421875, 3.402587890625, 3.6728515625, 3.943115234375, 4.21337890625, 4.483642578125, 4.75390625, 5.024169921875, 5.29443359375, 5.564697265625, 5.8349609375, 6.105224609375, 6.37548828125, 6.645751953125, 6.916015625, 7.186279296875, 7.45654296875, 7.726806640625, 7.9970703125, 8.267333984375, 8.53759765625, 8.807861328125, 9.078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 4.0, 6.0, 5.0, 10.0, 5.0, 10.0, 7.0, 15.0, 14.0, 14.0, 29.0, 17.0, 29.0, 20.0, 30.0, 31.0, 45.0, 38.0, 40.0, 46.0, 45.0, 46.0, 53.0, 40.0, 41.0, 45.0, 50.0, 31.0, 37.0, 31.0, 26.0, 17.0, 26.0, 18.0, 21.0, 14.0, 4.0, 7.0, 9.0, 6.0, 8.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.953125, -3.8155517578125, -3.677978515625, -3.5404052734375, -3.40283203125, -3.2652587890625, -3.127685546875, -2.9901123046875, -2.8525390625, -2.7149658203125, -2.577392578125, -2.4398193359375, -2.30224609375, -2.1646728515625, -2.027099609375, -1.8895263671875, -1.751953125, -1.6143798828125, -1.476806640625, -1.3392333984375, -1.20166015625, -1.0640869140625, -0.926513671875, -0.7889404296875, -0.6513671875, -0.5137939453125, -0.376220703125, -0.2386474609375, -0.10107421875, 0.0364990234375, 0.174072265625, 0.3116455078125, 0.44921875, 0.5867919921875, 0.724365234375, 0.8619384765625, 0.99951171875, 1.1370849609375, 1.274658203125, 1.4122314453125, 1.5498046875, 1.6873779296875, 1.824951171875, 1.9625244140625, 2.10009765625, 2.2376708984375, 2.375244140625, 2.5128173828125, 2.650390625, 2.7879638671875, 2.925537109375, 3.0631103515625, 3.20068359375, 3.3382568359375, 3.475830078125, 3.6134033203125, 3.7509765625, 3.8885498046875, 4.026123046875, 4.1636962890625, 4.30126953125, 4.4388427734375, 4.576416015625, 4.7139892578125, 4.8515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 6.0, 15.0, 15.0, 21.0, 29.0, 58.0, 82.0, 106.0, 178.0, 271.0, 516.0, 971.0, 2150.0, 6679.0, 44688.0, 776216.0, 193468.0, 16181.0, 3687.0, 1408.0, 725.0, 428.0, 204.0, 159.0, 100.0, 58.0, 44.0, 25.0, 16.0, 16.0, 9.0, 9.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.84375, -31.950439453125, -31.05712890625, -30.163818359375, -29.2705078125, -28.377197265625, -27.48388671875, -26.590576171875, -25.697265625, -24.803955078125, -23.91064453125, -23.017333984375, -22.1240234375, -21.230712890625, -20.33740234375, -19.444091796875, -18.55078125, -17.657470703125, -16.76416015625, -15.870849609375, -14.9775390625, -14.084228515625, -13.19091796875, -12.297607421875, -11.404296875, -10.510986328125, -9.61767578125, -8.724365234375, -7.8310546875, -6.937744140625, -6.04443359375, -5.151123046875, -4.2578125, -3.364501953125, -2.47119140625, -1.577880859375, -0.6845703125, 0.208740234375, 1.10205078125, 1.995361328125, 2.888671875, 3.781982421875, 4.67529296875, 5.568603515625, 6.4619140625, 7.355224609375, 8.24853515625, 9.141845703125, 10.03515625, 10.928466796875, 11.82177734375, 12.715087890625, 13.6083984375, 14.501708984375, 15.39501953125, 16.288330078125, 17.181640625, 18.074951171875, 18.96826171875, 19.861572265625, 20.7548828125, 21.648193359375, 22.54150390625, 23.434814453125, 24.328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 12.0, 10.0, 15.0, 29.0, 28.0, 38.0, 35.0, 38.0, 46.0, 57.0, 68.0, 54.0, 69.0, 71.0, 59.0, 50.0, 43.0, 42.0, 52.0, 42.0, 20.0, 27.0, 17.0, 21.0, 13.0, 13.0, 11.0, 4.0, 7.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.673828125, -17.92578125, -17.177734375, -16.4296875, -15.681640625, -14.93359375, -14.185546875, -13.4375, -12.689453125, -11.94140625, -11.193359375, -10.4453125, -9.697265625, -8.94921875, -8.201171875, -7.453125, -6.705078125, -5.95703125, -5.208984375, -4.4609375, -3.712890625, -2.96484375, -2.216796875, -1.46875, -0.720703125, 0.02734375, 0.775390625, 1.5234375, 2.271484375, 3.01953125, 3.767578125, 4.515625, 5.263671875, 6.01171875, 6.759765625, 7.5078125, 8.255859375, 9.00390625, 9.751953125, 10.5, 11.248046875, 11.99609375, 12.744140625, 13.4921875, 14.240234375, 14.98828125, 15.736328125, 16.484375, 17.232421875, 17.98046875, 18.728515625, 19.4765625, 20.224609375, 20.97265625, 21.720703125, 22.46875, 23.216796875, 23.96484375, 24.712890625, 25.4609375, 26.208984375, 26.95703125, 27.705078125, 28.453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 7.0, 11.0, 8.0, 14.0, 17.0, 11.0, 18.0, 37.0, 54.0, 92.0, 155.0, 374.0, 1013.0, 3885.0, 28594.0, 742841.0, 252117.0, 15242.0, 2585.0, 797.0, 269.0, 167.0, 78.0, 46.0, 28.0, 25.0, 16.0, 7.0, 8.0, 9.0, 3.0, 4.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8203125, -10.4580078125, -10.095703125, -9.7333984375, -9.37109375, -9.0087890625, -8.646484375, -8.2841796875, -7.921875, -7.5595703125, -7.197265625, -6.8349609375, -6.47265625, -6.1103515625, -5.748046875, -5.3857421875, -5.0234375, -4.6611328125, -4.298828125, -3.9365234375, -3.57421875, -3.2119140625, -2.849609375, -2.4873046875, -2.125, -1.7626953125, -1.400390625, -1.0380859375, -0.67578125, -0.3134765625, 0.048828125, 0.4111328125, 0.7734375, 1.1357421875, 1.498046875, 1.8603515625, 2.22265625, 2.5849609375, 2.947265625, 3.3095703125, 3.671875, 4.0341796875, 4.396484375, 4.7587890625, 5.12109375, 5.4833984375, 5.845703125, 6.2080078125, 6.5703125, 6.9326171875, 7.294921875, 7.6572265625, 8.01953125, 8.3818359375, 8.744140625, 9.1064453125, 9.46875, 9.8310546875, 10.193359375, 10.5556640625, 10.91796875, 11.2802734375, 11.642578125, 12.0048828125, 12.3671875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 6.0, 9.0, 7.0, 11.0, 18.0, 14.0, 12.0, 17.0, 26.0, 27.0, 38.0, 61.0, 87.0, 134.0, 117.0, 104.0, 66.0, 50.0, 36.0, 34.0, 22.0, 14.0, 23.0, 11.0, 14.0, 6.0, 10.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00121307373046875, -0.001171410083770752, -0.001129746437072754, -0.0010880827903747559, -0.0010464191436767578, -0.0010047554969787598, -0.0009630918502807617, -0.0009214282035827637, -0.0008797645568847656, -0.0008381009101867676, -0.0007964372634887695, -0.0007547736167907715, -0.0007131099700927734, -0.0006714463233947754, -0.0006297826766967773, -0.0005881190299987793, -0.0005464553833007812, -0.0005047917366027832, -0.00046312808990478516, -0.0004214644432067871, -0.00037980079650878906, -0.000338137149810791, -0.00029647350311279297, -0.0002548098564147949, -0.00021314620971679688, -0.00017148256301879883, -0.00012981891632080078, -8.815526962280273e-05, -4.649162292480469e-05, -4.827976226806641e-06, 3.6835670471191406e-05, 7.849931716918945e-05, 0.0001201629638671875, 0.00016182661056518555, 0.0002034902572631836, 0.00024515390396118164, 0.0002868175506591797, 0.00032848119735717773, 0.0003701448440551758, 0.00041180849075317383, 0.0004534721374511719, 0.0004951357841491699, 0.000536799430847168, 0.000578463077545166, 0.0006201267242431641, 0.0006617903709411621, 0.0007034540176391602, 0.0007451176643371582, 0.0007867813110351562, 0.0008284449577331543, 0.0008701086044311523, 0.0009117722511291504, 0.0009534358978271484, 0.0009950995445251465, 0.0010367631912231445, 0.0010784268379211426, 0.0011200904846191406, 0.0011617541313171387, 0.0012034177780151367, 0.0012450814247131348, 0.0012867450714111328, 0.0013284087181091309, 0.001370072364807129, 0.001411736011505127, 0.001453399658203125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 17.0, 16.0, 21.0, 46.0, 56.0, 98.0, 161.0, 306.0, 522.0, 1017.0, 2680.0, 9627.0, 65954.0, 790962.0, 153977.0, 16450.0, 3839.0, 1331.0, 634.0, 331.0, 178.0, 135.0, 62.0, 43.0, 34.0, 15.0, 16.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2890625, -8.0352783203125, -7.781494140625, -7.5277099609375, -7.27392578125, -7.0201416015625, -6.766357421875, -6.5125732421875, -6.2587890625, -6.0050048828125, -5.751220703125, -5.4974365234375, -5.24365234375, -4.9898681640625, -4.736083984375, -4.4822998046875, -4.228515625, -3.9747314453125, -3.720947265625, -3.4671630859375, -3.21337890625, -2.9595947265625, -2.705810546875, -2.4520263671875, -2.1982421875, -1.9444580078125, -1.690673828125, -1.4368896484375, -1.18310546875, -0.9293212890625, -0.675537109375, -0.4217529296875, -0.16796875, 0.0858154296875, 0.339599609375, 0.5933837890625, 0.84716796875, 1.1009521484375, 1.354736328125, 1.6085205078125, 1.8623046875, 2.1160888671875, 2.369873046875, 2.6236572265625, 2.87744140625, 3.1312255859375, 3.385009765625, 3.6387939453125, 3.892578125, 4.1463623046875, 4.400146484375, 4.6539306640625, 4.90771484375, 5.1614990234375, 5.415283203125, 5.6690673828125, 5.9228515625, 6.1766357421875, 6.430419921875, 6.6842041015625, 6.93798828125, 7.1917724609375, 7.445556640625, 7.6993408203125, 7.953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 7.0, 11.0, 14.0, 14.0, 24.0, 24.0, 30.0, 38.0, 49.0, 57.0, 82.0, 102.0, 93.0, 94.0, 73.0, 55.0, 54.0, 35.0, 25.0, 32.0, 17.0, 13.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.57421875, -5.402587890625, -5.23095703125, -5.059326171875, -4.8876953125, -4.716064453125, -4.54443359375, -4.372802734375, -4.201171875, -4.029541015625, -3.85791015625, -3.686279296875, -3.5146484375, -3.343017578125, -3.17138671875, -2.999755859375, -2.828125, -2.656494140625, -2.48486328125, -2.313232421875, -2.1416015625, -1.969970703125, -1.79833984375, -1.626708984375, -1.455078125, -1.283447265625, -1.11181640625, -0.940185546875, -0.7685546875, -0.596923828125, -0.42529296875, -0.253662109375, -0.08203125, 0.089599609375, 0.26123046875, 0.432861328125, 0.6044921875, 0.776123046875, 0.94775390625, 1.119384765625, 1.291015625, 1.462646484375, 1.63427734375, 1.805908203125, 1.9775390625, 2.149169921875, 2.32080078125, 2.492431640625, 2.6640625, 2.835693359375, 3.00732421875, 3.178955078125, 3.3505859375, 3.522216796875, 3.69384765625, 3.865478515625, 4.037109375, 4.208740234375, 4.38037109375, 4.552001953125, 4.7236328125, 4.895263671875, 5.06689453125, 5.238525390625, 5.41015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 7.0, 14.0, 27.0, 78.0, 142.0, 314.0, 203.0, 101.0, 49.0, 27.0, 8.0, 8.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.22621154785156, -149.6083526611328, -143.99050903320312, -138.37265014648438, -132.75479125976562, -127.1369400024414, -121.51908874511719, -115.90122985839844, -110.28337860107422, -104.66552734375, -99.04766845703125, -93.42981719970703, -87.81196594238281, -82.19410705566406, -76.57625579833984, -70.95840454101562, -65.34054565429688, -59.72269058227539, -54.104835510253906, -48.48698425292969, -42.8691291809082, -37.25127410888672, -31.6334228515625, -26.015567779541016, -20.39771270751953, -14.779858589172363, -9.162004470825195, -3.5441513061523438, 2.0737037658691406, 7.691558837890625, 13.309410095214844, 18.927265167236328, 24.54510498046875, 30.162960052490234, 35.78081512451172, 41.39866638183594, 47.01652145385742, 52.634376525878906, 58.252227783203125, 63.87008285522461, 69.4879379272461, 75.10578918457031, 80.72364807128906, 86.34149932861328, 91.9593505859375, 97.57720947265625, 103.19506072998047, 108.81291198730469, 114.43077087402344, 120.04862213134766, 125.6664810180664, 131.28433227539062, 136.90219116210938, 142.52005004882812, 148.1378936767578, 153.75575256347656, 159.37359619140625, 164.991455078125, 170.6092987060547, 176.22715759277344, 181.8450164794922, 187.46286010742188, 193.08071899414062, 198.69857788085938, 204.31643676757812]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 10.0, 11.0, 22.0, 12.0, 23.0, 30.0, 29.0, 32.0, 20.0, 29.0, 56.0, 59.0, 84.0, 82.0, 80.0, 50.0, 47.0, 42.0, 39.0, 37.0, 33.0, 41.0, 23.0, 17.0, 15.0, 9.0, 12.0, 7.0, 9.0, 11.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0], "bins": [-104.61738586425781, -102.0246810913086, -99.43196868896484, -96.83926391601562, -94.24655151367188, -91.65384674072266, -89.06114196777344, -86.46842956542969, -83.87572479248047, -81.28302001953125, -78.6903076171875, -76.09760284423828, -73.50489807128906, -70.91218566894531, -68.3194808959961, -65.72677612304688, -63.134063720703125, -60.54135513305664, -57.948646545410156, -55.35594177246094, -52.76323318481445, -50.17052459716797, -47.57781982421875, -44.985111236572266, -42.39240264892578, -39.7996940612793, -37.20698547363281, -34.614280700683594, -32.02157211303711, -29.428863525390625, -26.836156845092773, -24.243450164794922, -21.650741577148438, -19.058032989501953, -16.4653263092041, -13.872618675231934, -11.279911041259766, -8.687203407287598, -6.09449577331543, -3.501789093017578, -0.9090805053710938, 1.6836271286010742, 4.276334762573242, 6.86904239654541, 9.461750030517578, 12.054457664489746, 14.647165298461914, 17.239871978759766, 19.83258056640625, 22.425289154052734, 25.017995834350586, 27.610702514648438, 30.203411102294922, 32.796119689941406, 35.388824462890625, 37.98153305053711, 40.574241638183594, 43.16695022583008, 45.75965881347656, 48.35236358642578, 50.945072174072266, 53.53778076171875, 56.13048553466797, 58.72319412231445, 61.31590270996094]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 9.0, 3.0, 16.0, 16.0, 21.0, 30.0, 66.0, 91.0, 145.0, 271.0, 486.0, 1163.0, 2744.0, 8630.0, 42001.0, 742483.0, 3203506.0, 164209.0, 19792.0, 5186.0, 1825.0, 776.0, 368.0, 193.0, 105.0, 53.0, 35.0, 15.0, 14.0, 9.0, 11.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8984375, -11.5408935546875, -11.183349609375, -10.8258056640625, -10.46826171875, -10.1107177734375, -9.753173828125, -9.3956298828125, -9.0380859375, -8.6805419921875, -8.322998046875, -7.9654541015625, -7.60791015625, -7.2503662109375, -6.892822265625, -6.5352783203125, -6.177734375, -5.8201904296875, -5.462646484375, -5.1051025390625, -4.74755859375, -4.3900146484375, -4.032470703125, -3.6749267578125, -3.3173828125, -2.9598388671875, -2.602294921875, -2.2447509765625, -1.88720703125, -1.5296630859375, -1.172119140625, -0.8145751953125, -0.45703125, -0.0994873046875, 0.258056640625, 0.6156005859375, 0.97314453125, 1.3306884765625, 1.688232421875, 2.0457763671875, 2.4033203125, 2.7608642578125, 3.118408203125, 3.4759521484375, 3.83349609375, 4.1910400390625, 4.548583984375, 4.9061279296875, 5.263671875, 5.6212158203125, 5.978759765625, 6.3363037109375, 6.69384765625, 7.0513916015625, 7.408935546875, 7.7664794921875, 8.1240234375, 8.4815673828125, 8.839111328125, 9.1966552734375, 9.55419921875, 9.9117431640625, 10.269287109375, 10.6268310546875, 10.984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 9.0, 9.0, 12.0, 16.0, 8.0, 14.0, 27.0, 26.0, 31.0, 30.0, 37.0, 39.0, 42.0, 61.0, 46.0, 52.0, 59.0, 44.0, 48.0, 45.0, 45.0, 53.0, 37.0, 30.0, 31.0, 30.0, 20.0, 15.0, 14.0, 19.0, 10.0, 9.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -4.14654541015625, -4.0001220703125, -3.85369873046875, -3.707275390625, -3.56085205078125, -3.4144287109375, -3.26800537109375, -3.12158203125, -2.97515869140625, -2.8287353515625, -2.68231201171875, -2.535888671875, -2.38946533203125, -2.2430419921875, -2.09661865234375, -1.9501953125, -1.80377197265625, -1.6573486328125, -1.51092529296875, -1.364501953125, -1.21807861328125, -1.0716552734375, -0.92523193359375, -0.77880859375, -0.63238525390625, -0.4859619140625, -0.33953857421875, -0.193115234375, -0.04669189453125, 0.0997314453125, 0.24615478515625, 0.392578125, 0.53900146484375, 0.6854248046875, 0.83184814453125, 0.978271484375, 1.12469482421875, 1.2711181640625, 1.41754150390625, 1.56396484375, 1.71038818359375, 1.8568115234375, 2.00323486328125, 2.149658203125, 2.29608154296875, 2.4425048828125, 2.58892822265625, 2.7353515625, 2.88177490234375, 3.0281982421875, 3.17462158203125, 3.321044921875, 3.46746826171875, 3.6138916015625, 3.76031494140625, 3.90673828125, 4.05316162109375, 4.1995849609375, 4.34600830078125, 4.492431640625, 4.63885498046875, 4.7852783203125, 4.93170166015625, 5.078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 11.0, 6.0, 33.0, 57.0, 150.0, 342.0, 897.0, 4601.0, 124276.0, 4031977.0, 28044.0, 2685.0, 700.0, 279.0, 115.0, 53.0, 23.0, 16.0, 11.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.40625, -39.26220703125, -38.1181640625, -36.97412109375, -35.830078125, -34.68603515625, -33.5419921875, -32.39794921875, -31.25390625, -30.10986328125, -28.9658203125, -27.82177734375, -26.677734375, -25.53369140625, -24.3896484375, -23.24560546875, -22.1015625, -20.95751953125, -19.8134765625, -18.66943359375, -17.525390625, -16.38134765625, -15.2373046875, -14.09326171875, -12.94921875, -11.80517578125, -10.6611328125, -9.51708984375, -8.373046875, -7.22900390625, -6.0849609375, -4.94091796875, -3.796875, -2.65283203125, -1.5087890625, -0.36474609375, 0.779296875, 1.92333984375, 3.0673828125, 4.21142578125, 5.35546875, 6.49951171875, 7.6435546875, 8.78759765625, 9.931640625, 11.07568359375, 12.2197265625, 13.36376953125, 14.5078125, 15.65185546875, 16.7958984375, 17.93994140625, 19.083984375, 20.22802734375, 21.3720703125, 22.51611328125, 23.66015625, 24.80419921875, 25.9482421875, 27.09228515625, 28.236328125, 29.38037109375, 30.5244140625, 31.66845703125, 32.8125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 10.0, 6.0, 21.0, 51.0, 82.0, 190.0, 920.0, 1822.0, 635.0, 176.0, 83.0, 30.0, 20.0, 11.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.5, -28.615966796875, -27.73193359375, -26.847900390625, -25.9638671875, -25.079833984375, -24.19580078125, -23.311767578125, -22.427734375, -21.543701171875, -20.65966796875, -19.775634765625, -18.8916015625, -18.007568359375, -17.12353515625, -16.239501953125, -15.35546875, -14.471435546875, -13.58740234375, -12.703369140625, -11.8193359375, -10.935302734375, -10.05126953125, -9.167236328125, -8.283203125, -7.399169921875, -6.51513671875, -5.631103515625, -4.7470703125, -3.863037109375, -2.97900390625, -2.094970703125, -1.2109375, -0.326904296875, 0.55712890625, 1.441162109375, 2.3251953125, 3.209228515625, 4.09326171875, 4.977294921875, 5.861328125, 6.745361328125, 7.62939453125, 8.513427734375, 9.3974609375, 10.281494140625, 11.16552734375, 12.049560546875, 12.93359375, 13.817626953125, 14.70166015625, 15.585693359375, 16.4697265625, 17.353759765625, 18.23779296875, 19.121826171875, 20.005859375, 20.889892578125, 21.77392578125, 22.657958984375, 23.5419921875, 24.426025390625, 25.31005859375, 26.194091796875, 27.078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 10.0, 13.0, 25.0, 91.0, 285.0, 344.0, 165.0, 43.0, 12.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.77316284179688, -130.68785095214844, -122.60254669189453, -114.51724243164062, -106.43193054199219, -98.34661865234375, -90.26131439208984, -82.17601013183594, -74.0906982421875, -66.00538635253906, -57.920082092285156, -49.834774017333984, -41.74946594238281, -33.66415786743164, -25.57884979248047, -17.493541717529297, -9.408233642578125, -1.3229255676269531, 6.762382507324219, 14.84769058227539, 22.932998657226562, 31.018306732177734, 39.103614807128906, 47.18892288208008, 55.27423095703125, 63.35953903198242, 71.4448471069336, 79.5301513671875, 87.61546325683594, 95.70077514648438, 103.78607940673828, 111.87138366699219, 119.95672607421875, 128.0420379638672, 136.12734985351562, 144.212646484375, 152.29795837402344, 160.38327026367188, 168.46856689453125, 176.5538787841797, 184.63919067382812, 192.72450256347656, 200.809814453125, 208.89511108398438, 216.9804229736328, 225.06573486328125, 233.15103149414062, 241.23634338378906, 249.3216552734375, 257.4069519042969, 265.4922790527344, 273.57757568359375, 281.66290283203125, 289.7481994628906, 297.83349609375, 305.9188232421875, 314.0041198730469, 322.08941650390625, 330.17474365234375, 338.2600402832031, 346.3453369140625, 354.4306640625, 362.5159606933594, 370.6012878417969, 378.68658447265625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 8.0, 8.0, 17.0, 17.0, 24.0, 39.0, 41.0, 47.0, 46.0, 49.0, 55.0, 67.0, 66.0, 78.0, 56.0, 78.0, 63.0, 46.0, 42.0, 26.0, 32.0, 27.0, 18.0, 16.0, 10.0, 9.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-102.17898559570312, -99.54145812988281, -96.90392303466797, -94.26639556884766, -91.62886810302734, -88.9913330078125, -86.35380554199219, -83.71627807617188, -81.07874298095703, -78.44121551513672, -75.80368041992188, -73.16615295410156, -70.52862548828125, -67.8910903930664, -65.2535629272461, -62.616031646728516, -59.9785041809082, -57.340972900390625, -54.70344543457031, -52.065914154052734, -49.428382873535156, -46.790855407714844, -44.153324127197266, -41.51579284667969, -38.878265380859375, -36.2407341003418, -33.603206634521484, -30.965675354003906, -28.328144073486328, -25.690614700317383, -23.053085327148438, -20.41555404663086, -17.77802276611328, -15.14049243927002, -12.502962112426758, -9.865432739257812, -7.227902412414551, -4.590372085571289, -1.9528427124023438, 0.6846885681152344, 3.3222179412841797, 5.959748268127441, 8.597278594970703, 11.234807968139648, 13.87233829498291, 16.509868621826172, 19.147397994995117, 21.784929275512695, 24.42245864868164, 27.059988021850586, 29.697519302368164, 32.33504867553711, 34.97257995605469, 37.610107421875, 40.24763870239258, 42.885169982910156, 45.52269744873047, 48.16022872924805, 50.79775619506836, 53.43528747558594, 56.072818756103516, 58.710350036621094, 61.347877502441406, 63.985408782958984, 66.62294006347656]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 5.0, 5.0, 15.0, 18.0, 28.0, 44.0, 55.0, 101.0, 164.0, 297.0, 555.0, 984.0, 2089.0, 4274.0, 10290.0, 27474.0, 85241.0, 266090.0, 393718.0, 171970.0, 53431.0, 18260.0, 7083.0, 3051.0, 1533.0, 780.0, 391.0, 224.0, 145.0, 81.0, 58.0, 28.0, 21.0, 19.0, 16.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.640625, -7.37060546875, -7.1005859375, -6.83056640625, -6.560546875, -6.29052734375, -6.0205078125, -5.75048828125, -5.48046875, -5.21044921875, -4.9404296875, -4.67041015625, -4.400390625, -4.13037109375, -3.8603515625, -3.59033203125, -3.3203125, -3.05029296875, -2.7802734375, -2.51025390625, -2.240234375, -1.97021484375, -1.7001953125, -1.43017578125, -1.16015625, -0.89013671875, -0.6201171875, -0.35009765625, -0.080078125, 0.18994140625, 0.4599609375, 0.72998046875, 1.0, 1.27001953125, 1.5400390625, 1.81005859375, 2.080078125, 2.35009765625, 2.6201171875, 2.89013671875, 3.16015625, 3.43017578125, 3.7001953125, 3.97021484375, 4.240234375, 4.51025390625, 4.7802734375, 5.05029296875, 5.3203125, 5.59033203125, 5.8603515625, 6.13037109375, 6.400390625, 6.67041015625, 6.9404296875, 7.21044921875, 7.48046875, 7.75048828125, 8.0205078125, 8.29052734375, 8.560546875, 8.83056640625, 9.1005859375, 9.37060546875, 9.640625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 15.0, 15.0, 16.0, 19.0, 19.0, 36.0, 34.0, 43.0, 48.0, 39.0, 52.0, 57.0, 59.0, 54.0, 77.0, 40.0, 70.0, 47.0, 56.0, 37.0, 33.0, 25.0, 30.0, 16.0, 16.0, 11.0, 7.0, 5.0, 10.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.92578125, -7.7191162109375, -7.512451171875, -7.3057861328125, -7.09912109375, -6.8924560546875, -6.685791015625, -6.4791259765625, -6.2724609375, -6.0657958984375, -5.859130859375, -5.6524658203125, -5.44580078125, -5.2391357421875, -5.032470703125, -4.8258056640625, -4.619140625, -4.4124755859375, -4.205810546875, -3.9991455078125, -3.79248046875, -3.5858154296875, -3.379150390625, -3.1724853515625, -2.9658203125, -2.7591552734375, -2.552490234375, -2.3458251953125, -2.13916015625, -1.9324951171875, -1.725830078125, -1.5191650390625, -1.3125, -1.1058349609375, -0.899169921875, -0.6925048828125, -0.48583984375, -0.2791748046875, -0.072509765625, 0.1341552734375, 0.3408203125, 0.5474853515625, 0.754150390625, 0.9608154296875, 1.16748046875, 1.3741455078125, 1.580810546875, 1.7874755859375, 1.994140625, 2.2008056640625, 2.407470703125, 2.6141357421875, 2.82080078125, 3.0274658203125, 3.234130859375, 3.4407958984375, 3.6474609375, 3.8541259765625, 4.060791015625, 4.2674560546875, 4.47412109375, 4.6807861328125, 4.887451171875, 5.0941162109375, 5.30078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 10.0, 12.0, 17.0, 26.0, 20.0, 30.0, 60.0, 82.0, 137.0, 222.0, 420.0, 800.0, 1996.0, 5767.0, 21730.0, 127983.0, 691780.0, 160577.0, 26117.0, 6490.0, 2193.0, 944.0, 448.0, 259.0, 138.0, 93.0, 51.0, 40.0, 31.0, 23.0, 19.0, 4.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.2734375, -14.7894287109375, -14.305419921875, -13.8214111328125, -13.33740234375, -12.8533935546875, -12.369384765625, -11.8853759765625, -11.4013671875, -10.9173583984375, -10.433349609375, -9.9493408203125, -9.46533203125, -8.9813232421875, -8.497314453125, -8.0133056640625, -7.529296875, -7.0452880859375, -6.561279296875, -6.0772705078125, -5.59326171875, -5.1092529296875, -4.625244140625, -4.1412353515625, -3.6572265625, -3.1732177734375, -2.689208984375, -2.2052001953125, -1.72119140625, -1.2371826171875, -0.753173828125, -0.2691650390625, 0.21484375, 0.6988525390625, 1.182861328125, 1.6668701171875, 2.15087890625, 2.6348876953125, 3.118896484375, 3.6029052734375, 4.0869140625, 4.5709228515625, 5.054931640625, 5.5389404296875, 6.02294921875, 6.5069580078125, 6.990966796875, 7.4749755859375, 7.958984375, 8.4429931640625, 8.927001953125, 9.4110107421875, 9.89501953125, 10.3790283203125, 10.863037109375, 11.3470458984375, 11.8310546875, 12.3150634765625, 12.799072265625, 13.2830810546875, 13.76708984375, 14.2510986328125, 14.735107421875, 15.2191162109375, 15.703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 13.0, 15.0, 8.0, 10.0, 20.0, 25.0, 21.0, 36.0, 39.0, 45.0, 54.0, 54.0, 52.0, 52.0, 65.0, 55.0, 54.0, 49.0, 50.0, 51.0, 37.0, 21.0, 28.0, 26.0, 24.0, 16.0, 16.0, 14.0, 9.0, 6.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.390625, -25.673583984375, -24.95654296875, -24.239501953125, -23.5224609375, -22.805419921875, -22.08837890625, -21.371337890625, -20.654296875, -19.937255859375, -19.22021484375, -18.503173828125, -17.7861328125, -17.069091796875, -16.35205078125, -15.635009765625, -14.91796875, -14.200927734375, -13.48388671875, -12.766845703125, -12.0498046875, -11.332763671875, -10.61572265625, -9.898681640625, -9.181640625, -8.464599609375, -7.74755859375, -7.030517578125, -6.3134765625, -5.596435546875, -4.87939453125, -4.162353515625, -3.4453125, -2.728271484375, -2.01123046875, -1.294189453125, -0.5771484375, 0.139892578125, 0.85693359375, 1.573974609375, 2.291015625, 3.008056640625, 3.72509765625, 4.442138671875, 5.1591796875, 5.876220703125, 6.59326171875, 7.310302734375, 8.02734375, 8.744384765625, 9.46142578125, 10.178466796875, 10.8955078125, 11.612548828125, 12.32958984375, 13.046630859375, 13.763671875, 14.480712890625, 15.19775390625, 15.914794921875, 16.6318359375, 17.348876953125, 18.06591796875, 18.782958984375, 19.5]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 10.0, 9.0, 11.0, 35.0, 33.0, 53.0, 69.0, 101.0, 119.0, 216.0, 301.0, 458.0, 733.0, 1219.0, 2333.0, 5059.0, 12771.0, 43554.0, 239220.0, 632233.0, 75895.0, 19634.0, 7269.0, 3221.0, 1630.0, 875.0, 487.0, 327.0, 209.0, 141.0, 76.0, 66.0, 44.0, 44.0, 29.0, 19.0, 11.0, 11.0, 4.0, 4.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.82952880859375, -4.6746826171875, -4.51983642578125, -4.364990234375, -4.21014404296875, -4.0552978515625, -3.90045166015625, -3.74560546875, -3.59075927734375, -3.4359130859375, -3.28106689453125, -3.126220703125, -2.97137451171875, -2.8165283203125, -2.66168212890625, -2.5068359375, -2.35198974609375, -2.1971435546875, -2.04229736328125, -1.887451171875, -1.73260498046875, -1.5777587890625, -1.42291259765625, -1.26806640625, -1.11322021484375, -0.9583740234375, -0.80352783203125, -0.648681640625, -0.49383544921875, -0.3389892578125, -0.18414306640625, -0.029296875, 0.12554931640625, 0.2803955078125, 0.43524169921875, 0.590087890625, 0.74493408203125, 0.8997802734375, 1.05462646484375, 1.20947265625, 1.36431884765625, 1.5191650390625, 1.67401123046875, 1.828857421875, 1.98370361328125, 2.1385498046875, 2.29339599609375, 2.4482421875, 2.60308837890625, 2.7579345703125, 2.91278076171875, 3.067626953125, 3.22247314453125, 3.3773193359375, 3.53216552734375, 3.68701171875, 3.84185791015625, 3.9967041015625, 4.15155029296875, 4.306396484375, 4.46124267578125, 4.6160888671875, 4.77093505859375, 4.92578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 10.0, 24.0, 27.0, 74.0, 163.0, 330.0, 182.0, 90.0, 41.0, 17.0, 11.0, 5.0, 9.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00299072265625, -0.0029015839099884033, -0.0028124451637268066, -0.00272330641746521, -0.0026341676712036133, -0.0025450289249420166, -0.00245589017868042, -0.0023667514324188232, -0.0022776126861572266, -0.00218847393989563, -0.002099335193634033, -0.0020101964473724365, -0.0019210577011108398, -0.0018319189548492432, -0.0017427802085876465, -0.0016536414623260498, -0.0015645027160644531, -0.0014753639698028564, -0.0013862252235412598, -0.001297086477279663, -0.0012079477310180664, -0.0011188089847564697, -0.001029670238494873, -0.0009405314922332764, -0.0008513927459716797, -0.000762253999710083, -0.0006731152534484863, -0.0005839765071868896, -0.000494837760925293, -0.0004056990146636963, -0.0003165602684020996, -0.00022742152214050293, -0.00013828277587890625, -4.914402961730957e-05, 3.999471664428711e-05, 0.0001291334629058838, 0.00021827220916748047, 0.00030741095542907715, 0.00039654970169067383, 0.0004856884479522705, 0.0005748271942138672, 0.0006639659404754639, 0.0007531046867370605, 0.0008422434329986572, 0.0009313821792602539, 0.0010205209255218506, 0.0011096596717834473, 0.001198798418045044, 0.0012879371643066406, 0.0013770759105682373, 0.001466214656829834, 0.0015553534030914307, 0.0016444921493530273, 0.001733630895614624, 0.0018227696418762207, 0.0019119083881378174, 0.002001047134399414, 0.0020901858806610107, 0.0021793246269226074, 0.002268463373184204, 0.0023576021194458008, 0.0024467408657073975, 0.002535879611968994, 0.002625018358230591, 0.0027141571044921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 8.0, 7.0, 19.0, 24.0, 40.0, 73.0, 143.0, 405.0, 1040.0, 3237.0, 13338.0, 91813.0, 804966.0, 112503.0, 15328.0, 3649.0, 1134.0, 431.0, 170.0, 83.0, 55.0, 25.0, 21.0, 8.0, 7.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.17047119140625, -7.9268798828125, -7.68328857421875, -7.439697265625, -7.19610595703125, -6.9525146484375, -6.70892333984375, -6.46533203125, -6.22174072265625, -5.9781494140625, -5.73455810546875, -5.490966796875, -5.24737548828125, -5.0037841796875, -4.76019287109375, -4.5166015625, -4.27301025390625, -4.0294189453125, -3.78582763671875, -3.542236328125, -3.29864501953125, -3.0550537109375, -2.81146240234375, -2.56787109375, -2.32427978515625, -2.0806884765625, -1.83709716796875, -1.593505859375, -1.34991455078125, -1.1063232421875, -0.86273193359375, -0.619140625, -0.37554931640625, -0.1319580078125, 0.11163330078125, 0.355224609375, 0.59881591796875, 0.8424072265625, 1.08599853515625, 1.32958984375, 1.57318115234375, 1.8167724609375, 2.06036376953125, 2.303955078125, 2.54754638671875, 2.7911376953125, 3.03472900390625, 3.2783203125, 3.52191162109375, 3.7655029296875, 4.00909423828125, 4.252685546875, 4.49627685546875, 4.7398681640625, 4.98345947265625, 5.22705078125, 5.47064208984375, 5.7142333984375, 5.95782470703125, 6.201416015625, 6.44500732421875, 6.6885986328125, 6.93218994140625, 7.17578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 3.0, 9.0, 7.0, 15.0, 14.0, 17.0, 26.0, 38.0, 54.0, 72.0, 98.0, 120.0, 131.0, 100.0, 68.0, 71.0, 32.0, 19.0, 25.0, 21.0, 9.0, 6.0, 6.0, 7.0, 7.0, 10.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-8.3203125, -8.12255859375, -7.9248046875, -7.72705078125, -7.529296875, -7.33154296875, -7.1337890625, -6.93603515625, -6.73828125, -6.54052734375, -6.3427734375, -6.14501953125, -5.947265625, -5.74951171875, -5.5517578125, -5.35400390625, -5.15625, -4.95849609375, -4.7607421875, -4.56298828125, -4.365234375, -4.16748046875, -3.9697265625, -3.77197265625, -3.57421875, -3.37646484375, -3.1787109375, -2.98095703125, -2.783203125, -2.58544921875, -2.3876953125, -2.18994140625, -1.9921875, -1.79443359375, -1.5966796875, -1.39892578125, -1.201171875, -1.00341796875, -0.8056640625, -0.60791015625, -0.41015625, -0.21240234375, -0.0146484375, 0.18310546875, 0.380859375, 0.57861328125, 0.7763671875, 0.97412109375, 1.171875, 1.36962890625, 1.5673828125, 1.76513671875, 1.962890625, 2.16064453125, 2.3583984375, 2.55615234375, 2.75390625, 2.95166015625, 3.1494140625, 3.34716796875, 3.544921875, 3.74267578125, 3.9404296875, 4.13818359375, 4.3359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 15.0, 41.0, 210.0, 482.0, 177.0, 43.0, 20.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-359.50439453125, -351.2229309082031, -342.9414978027344, -334.6600341796875, -326.37860107421875, -318.0971374511719, -309.815673828125, -301.53424072265625, -293.2527770996094, -284.9713134765625, -276.68988037109375, -268.4084167480469, -260.1269836425781, -251.84552001953125, -243.56407165527344, -235.28262329101562, -227.0011749267578, -218.7197265625, -210.4382781982422, -202.15682983398438, -193.8753662109375, -185.5939178466797, -177.31246948242188, -169.03102111816406, -160.74957275390625, -152.46812438964844, -144.18667602539062, -135.90521240234375, -127.62376403808594, -119.34231567382812, -111.06086730957031, -102.7794189453125, -94.49795532226562, -86.21650695800781, -77.93505096435547, -69.65360260009766, -61.37215042114258, -53.0906982421875, -44.80924987792969, -36.52779769897461, -28.24634552001953, -19.964893341064453, -11.683443069458008, -3.4019927978515625, 4.879459381103516, 13.160911560058594, 21.442359924316406, 29.723812103271484, 38.00526428222656, 46.28671646118164, 54.56816864013672, 62.84961700439453, 71.13107299804688, 79.41252136230469, 87.6939697265625, 95.97541809082031, 104.25687408447266, 112.53832244873047, 120.81977844238281, 129.10122680664062, 137.38267517089844, 145.66412353515625, 153.94558715820312, 162.22703552246094, 170.50848388671875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 5.0, 16.0, 19.0, 16.0, 17.0, 26.0, 27.0, 30.0, 44.0, 48.0, 48.0, 80.0, 105.0, 95.0, 89.0, 52.0, 45.0, 44.0, 24.0, 34.0, 23.0, 28.0, 18.0, 14.0, 14.0, 10.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.67813110351562, -73.49794006347656, -70.3177490234375, -67.13755798339844, -63.95736312866211, -60.77717208862305, -57.596981048583984, -54.416786193847656, -51.236595153808594, -48.05640411376953, -44.87621307373047, -41.696022033691406, -38.51582717895508, -35.335636138916016, -32.15544509887695, -28.975252151489258, -25.795063018798828, -22.614871978759766, -19.43467903137207, -16.254487991333008, -13.074295997619629, -9.89410400390625, -6.7139129638671875, -3.533720016479492, -0.3535289764404297, 2.82666277885437, 6.00685453414917, 9.18704605102539, 12.36723804473877, 15.547430038452148, 18.72762107849121, 21.907814025878906, 25.08800506591797, 28.26819610595703, 31.448389053344727, 34.628578186035156, 37.808773040771484, 40.98896408081055, 44.16915512084961, 47.34934997558594, 50.529541015625, 53.70973205566406, 56.889923095703125, 60.07011413574219, 63.250308990478516, 66.43049621582031, 69.61068725585938, 72.79088592529297, 75.9710693359375, 79.15126037597656, 82.33145141601562, 85.51164245605469, 88.69183349609375, 91.87202453613281, 95.05221557617188, 98.23241424560547, 101.41260528564453, 104.5927963256836, 107.77298736572266, 110.95317840576172, 114.13336944580078, 117.31356811523438, 120.49375915527344, 123.6739501953125, 126.85414123535156]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 8.0, 10.0, 17.0, 15.0, 26.0, 36.0, 41.0, 57.0, 99.0, 130.0, 195.0, 256.0, 388.0, 521.0, 896.0, 1578.0, 2946.0, 6910.0, 20706.0, 96255.0, 663163.0, 2493862.0, 758812.0, 109318.0, 22972.0, 7460.0, 3163.0, 1684.0, 947.0, 596.0, 359.0, 252.0, 188.0, 117.0, 75.0, 62.0, 40.0, 31.0, 19.0, 17.0, 11.0, 10.0, 8.0, 3.0, 7.0, 3.0, 7.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.546875, -6.3572998046875, -6.167724609375, -5.9781494140625, -5.78857421875, -5.5989990234375, -5.409423828125, -5.2198486328125, -5.0302734375, -4.8406982421875, -4.651123046875, -4.4615478515625, -4.27197265625, -4.0823974609375, -3.892822265625, -3.7032470703125, -3.513671875, -3.3240966796875, -3.134521484375, -2.9449462890625, -2.75537109375, -2.5657958984375, -2.376220703125, -2.1866455078125, -1.9970703125, -1.8074951171875, -1.617919921875, -1.4283447265625, -1.23876953125, -1.0491943359375, -0.859619140625, -0.6700439453125, -0.48046875, -0.2908935546875, -0.101318359375, 0.0882568359375, 0.27783203125, 0.4674072265625, 0.656982421875, 0.8465576171875, 1.0361328125, 1.2257080078125, 1.415283203125, 1.6048583984375, 1.79443359375, 1.9840087890625, 2.173583984375, 2.3631591796875, 2.552734375, 2.7423095703125, 2.931884765625, 3.1214599609375, 3.31103515625, 3.5006103515625, 3.690185546875, 3.8797607421875, 4.0693359375, 4.2589111328125, 4.448486328125, 4.6380615234375, 4.82763671875, 5.0172119140625, 5.206787109375, 5.3963623046875, 5.5859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 9.0, 3.0, 11.0, 7.0, 10.0, 7.0, 14.0, 16.0, 19.0, 24.0, 34.0, 18.0, 24.0, 33.0, 46.0, 39.0, 40.0, 38.0, 51.0, 52.0, 43.0, 43.0, 40.0, 48.0, 34.0, 34.0, 29.0, 31.0, 32.0, 27.0, 36.0, 15.0, 14.0, 17.0, 10.0, 11.0, 15.0, 11.0, 4.0, 2.0, 6.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.95703125, -4.80810546875, -4.6591796875, -4.51025390625, -4.361328125, -4.21240234375, -4.0634765625, -3.91455078125, -3.765625, -3.61669921875, -3.4677734375, -3.31884765625, -3.169921875, -3.02099609375, -2.8720703125, -2.72314453125, -2.57421875, -2.42529296875, -2.2763671875, -2.12744140625, -1.978515625, -1.82958984375, -1.6806640625, -1.53173828125, -1.3828125, -1.23388671875, -1.0849609375, -0.93603515625, -0.787109375, -0.63818359375, -0.4892578125, -0.34033203125, -0.19140625, -0.04248046875, 0.1064453125, 0.25537109375, 0.404296875, 0.55322265625, 0.7021484375, 0.85107421875, 1.0, 1.14892578125, 1.2978515625, 1.44677734375, 1.595703125, 1.74462890625, 1.8935546875, 2.04248046875, 2.19140625, 2.34033203125, 2.4892578125, 2.63818359375, 2.787109375, 2.93603515625, 3.0849609375, 3.23388671875, 3.3828125, 3.53173828125, 3.6806640625, 3.82958984375, 3.978515625, 4.12744140625, 4.2763671875, 4.42529296875, 4.57421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 19.0, 27.0, 82.0, 254.0, 1078.0, 19614.0, 4142688.0, 28708.0, 1289.0, 326.0, 111.0, 46.0, 23.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.65625, -40.33544921875, -39.0146484375, -37.69384765625, -36.373046875, -35.05224609375, -33.7314453125, -32.41064453125, -31.08984375, -29.76904296875, -28.4482421875, -27.12744140625, -25.806640625, -24.48583984375, -23.1650390625, -21.84423828125, -20.5234375, -19.20263671875, -17.8818359375, -16.56103515625, -15.240234375, -13.91943359375, -12.5986328125, -11.27783203125, -9.95703125, -8.63623046875, -7.3154296875, -5.99462890625, -4.673828125, -3.35302734375, -2.0322265625, -0.71142578125, 0.609375, 1.93017578125, 3.2509765625, 4.57177734375, 5.892578125, 7.21337890625, 8.5341796875, 9.85498046875, 11.17578125, 12.49658203125, 13.8173828125, 15.13818359375, 16.458984375, 17.77978515625, 19.1005859375, 20.42138671875, 21.7421875, 23.06298828125, 24.3837890625, 25.70458984375, 27.025390625, 28.34619140625, 29.6669921875, 30.98779296875, 32.30859375, 33.62939453125, 34.9501953125, 36.27099609375, 37.591796875, 38.91259765625, 40.2333984375, 41.55419921875, 42.875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 3.0, 6.0, 6.0, 11.0, 12.0, 17.0, 34.0, 54.0, 109.0, 203.0, 440.0, 875.0, 1041.0, 590.0, 319.0, 145.0, 81.0, 43.0, 19.0, 26.0, 15.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8984375, -7.4649658203125, -7.031494140625, -6.5980224609375, -6.16455078125, -5.7310791015625, -5.297607421875, -4.8641357421875, -4.4306640625, -3.9971923828125, -3.563720703125, -3.1302490234375, -2.69677734375, -2.2633056640625, -1.829833984375, -1.3963623046875, -0.962890625, -0.5294189453125, -0.095947265625, 0.3375244140625, 0.77099609375, 1.2044677734375, 1.637939453125, 2.0714111328125, 2.5048828125, 2.9383544921875, 3.371826171875, 3.8052978515625, 4.23876953125, 4.6722412109375, 5.105712890625, 5.5391845703125, 5.97265625, 6.4061279296875, 6.839599609375, 7.2730712890625, 7.70654296875, 8.1400146484375, 8.573486328125, 9.0069580078125, 9.4404296875, 9.8739013671875, 10.307373046875, 10.7408447265625, 11.17431640625, 11.6077880859375, 12.041259765625, 12.4747314453125, 12.908203125, 13.3416748046875, 13.775146484375, 14.2086181640625, 14.64208984375, 15.0755615234375, 15.509033203125, 15.9425048828125, 16.3759765625, 16.8094482421875, 17.242919921875, 17.6763916015625, 18.10986328125, 18.5433349609375, 18.976806640625, 19.4102783203125, 19.84375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 12.0, 26.0, 110.0, 333.0, 313.0, 128.0, 48.0, 13.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.99601745605469, -77.53012084960938, -71.06421661376953, -64.59831237792969, -58.132415771484375, -51.6665153503418, -45.20061492919922, -38.73471450805664, -32.26881408691406, -25.802913665771484, -19.337013244628906, -12.871112823486328, -6.40521240234375, 0.060688018798828125, 6.526588439941406, 12.992488861083984, 19.458389282226562, 25.92428970336914, 32.39019012451172, 38.8560905456543, 45.321990966796875, 51.78789138793945, 58.25379180908203, 64.71969604492188, 71.18559265136719, 77.6514892578125, 84.11739349365234, 90.58329772949219, 97.0491943359375, 103.51509094238281, 109.98099517822266, 116.4468994140625, 122.91278076171875, 129.37867736816406, 135.84457397460938, 142.31048583984375, 148.77638244628906, 155.24227905273438, 161.70819091796875, 168.17408752441406, 174.63998413085938, 181.1058807373047, 187.57177734375, 194.03768920898438, 200.5035858154297, 206.969482421875, 213.43539428710938, 219.9012908935547, 226.3671875, 232.8330841064453, 239.29898071289062, 245.764892578125, 252.2307891845703, 258.6966857910156, 265.16259765625, 271.62847900390625, 278.0943908691406, 284.560302734375, 291.02618408203125, 297.4920959472656, 303.9580078125, 310.42388916015625, 316.8898010253906, 323.3556823730469, 329.82159423828125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 6.0, 11.0, 14.0, 15.0, 25.0, 22.0, 33.0, 37.0, 37.0, 45.0, 43.0, 64.0, 66.0, 60.0, 64.0, 46.0, 57.0, 51.0, 49.0, 45.0, 39.0, 48.0, 33.0, 30.0, 10.0, 11.0, 12.0, 12.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-68.43990325927734, -66.47781372070312, -64.5157241821289, -62.55363082885742, -60.5915412902832, -58.629451751708984, -56.6673583984375, -54.70526885986328, -52.74317932128906, -50.781089782714844, -48.819000244140625, -46.85690689086914, -44.89481735229492, -42.9327278137207, -40.97063446044922, -39.008544921875, -37.04645538330078, -35.08436584472656, -33.122276306152344, -31.16018295288086, -29.19809341430664, -27.236003875732422, -25.27391242980957, -23.31182098388672, -21.3497314453125, -19.38764190673828, -17.42555046081543, -15.463459968566895, -13.50136947631836, -11.539278984069824, -9.577188491821289, -7.615097999572754, -5.653011322021484, -3.690920829772949, -1.728830337524414, 0.2332601547241211, 2.1953506469726562, 4.157441139221191, 6.119531631469727, 8.081622123718262, 10.043712615966797, 12.005803108215332, 13.967893600463867, 15.929984092712402, 17.892074584960938, 19.854164123535156, 21.816255569458008, 23.77834701538086, 25.740436553955078, 27.702526092529297, 29.66461753845215, 31.626708984375, 33.58879852294922, 35.55088806152344, 37.512977600097656, 39.47507095336914, 41.43716049194336, 43.39925003051758, 45.36134338378906, 47.32343292236328, 49.2855224609375, 51.24761199951172, 53.20970153808594, 55.17179489135742, 57.13388442993164]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 12.0, 3.0, 8.0, 20.0, 31.0, 28.0, 30.0, 57.0, 103.0, 159.0, 262.0, 418.0, 712.0, 1280.0, 2398.0, 4608.0, 8989.0, 19458.0, 44098.0, 105905.0, 242760.0, 313887.0, 173316.0, 71582.0, 30382.0, 13844.0, 6628.0, 3377.0, 1775.0, 959.0, 600.0, 312.0, 212.0, 120.0, 65.0, 48.0, 37.0, 18.0, 16.0, 12.0, 11.0, 10.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.86328125, -4.68499755859375, -4.5067138671875, -4.32843017578125, -4.150146484375, -3.97186279296875, -3.7935791015625, -3.61529541015625, -3.43701171875, -3.25872802734375, -3.0804443359375, -2.90216064453125, -2.723876953125, -2.54559326171875, -2.3673095703125, -2.18902587890625, -2.0107421875, -1.83245849609375, -1.6541748046875, -1.47589111328125, -1.297607421875, -1.11932373046875, -0.9410400390625, -0.76275634765625, -0.58447265625, -0.40618896484375, -0.2279052734375, -0.04962158203125, 0.128662109375, 0.30694580078125, 0.4852294921875, 0.66351318359375, 0.841796875, 1.02008056640625, 1.1983642578125, 1.37664794921875, 1.554931640625, 1.73321533203125, 1.9114990234375, 2.08978271484375, 2.26806640625, 2.44635009765625, 2.6246337890625, 2.80291748046875, 2.981201171875, 3.15948486328125, 3.3377685546875, 3.51605224609375, 3.6943359375, 3.87261962890625, 4.0509033203125, 4.22918701171875, 4.407470703125, 4.58575439453125, 4.7640380859375, 4.94232177734375, 5.12060546875, 5.29888916015625, 5.4771728515625, 5.65545654296875, 5.833740234375, 6.01202392578125, 6.1903076171875, 6.36859130859375, 6.546875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 9.0, 9.0, 13.0, 11.0, 17.0, 17.0, 12.0, 19.0, 20.0, 18.0, 17.0, 26.0, 26.0, 40.0, 29.0, 34.0, 34.0, 30.0, 38.0, 43.0, 32.0, 41.0, 28.0, 43.0, 30.0, 37.0, 25.0, 27.0, 44.0, 27.0, 26.0, 25.0, 22.0, 10.0, 14.0, 13.0, 15.0, 10.0, 7.0, 14.0, 6.0, 4.0, 8.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.20703125, -4.07733154296875, -3.9476318359375, -3.81793212890625, -3.688232421875, -3.55853271484375, -3.4288330078125, -3.29913330078125, -3.16943359375, -3.03973388671875, -2.9100341796875, -2.78033447265625, -2.650634765625, -2.52093505859375, -2.3912353515625, -2.26153564453125, -2.1318359375, -2.00213623046875, -1.8724365234375, -1.74273681640625, -1.613037109375, -1.48333740234375, -1.3536376953125, -1.22393798828125, -1.09423828125, -0.96453857421875, -0.8348388671875, -0.70513916015625, -0.575439453125, -0.44573974609375, -0.3160400390625, -0.18634033203125, -0.056640625, 0.07305908203125, 0.2027587890625, 0.33245849609375, 0.462158203125, 0.59185791015625, 0.7215576171875, 0.85125732421875, 0.98095703125, 1.11065673828125, 1.2403564453125, 1.37005615234375, 1.499755859375, 1.62945556640625, 1.7591552734375, 1.88885498046875, 2.0185546875, 2.14825439453125, 2.2779541015625, 2.40765380859375, 2.537353515625, 2.66705322265625, 2.7967529296875, 2.92645263671875, 3.05615234375, 3.18585205078125, 3.3155517578125, 3.44525146484375, 3.574951171875, 3.70465087890625, 3.8343505859375, 3.96405029296875, 4.09375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 4.0, 5.0, 13.0, 16.0, 25.0, 38.0, 45.0, 79.0, 107.0, 148.0, 235.0, 386.0, 679.0, 1332.0, 3720.0, 14898.0, 102866.0, 767625.0, 131074.0, 17632.0, 4225.0, 1495.0, 696.0, 411.0, 265.0, 148.0, 96.0, 71.0, 53.0, 42.0, 27.0, 27.0, 21.0, 8.0, 14.0, 7.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.71875, -16.220458984375, -15.72216796875, -15.223876953125, -14.7255859375, -14.227294921875, -13.72900390625, -13.230712890625, -12.732421875, -12.234130859375, -11.73583984375, -11.237548828125, -10.7392578125, -10.240966796875, -9.74267578125, -9.244384765625, -8.74609375, -8.247802734375, -7.74951171875, -7.251220703125, -6.7529296875, -6.254638671875, -5.75634765625, -5.258056640625, -4.759765625, -4.261474609375, -3.76318359375, -3.264892578125, -2.7666015625, -2.268310546875, -1.77001953125, -1.271728515625, -0.7734375, -0.275146484375, 0.22314453125, 0.721435546875, 1.2197265625, 1.718017578125, 2.21630859375, 2.714599609375, 3.212890625, 3.711181640625, 4.20947265625, 4.707763671875, 5.2060546875, 5.704345703125, 6.20263671875, 6.700927734375, 7.19921875, 7.697509765625, 8.19580078125, 8.694091796875, 9.1923828125, 9.690673828125, 10.18896484375, 10.687255859375, 11.185546875, 11.683837890625, 12.18212890625, 12.680419921875, 13.1787109375, 13.677001953125, 14.17529296875, 14.673583984375, 15.171875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 12.0, 18.0, 18.0, 29.0, 25.0, 24.0, 31.0, 48.0, 59.0, 48.0, 59.0, 48.0, 69.0, 67.0, 51.0, 52.0, 54.0, 42.0, 32.0, 33.0, 39.0, 24.0, 22.0, 13.0, 11.0, 15.0, 8.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.296875, -21.594970703125, -20.89306640625, -20.191162109375, -19.4892578125, -18.787353515625, -18.08544921875, -17.383544921875, -16.681640625, -15.979736328125, -15.27783203125, -14.575927734375, -13.8740234375, -13.172119140625, -12.47021484375, -11.768310546875, -11.06640625, -10.364501953125, -9.66259765625, -8.960693359375, -8.2587890625, -7.556884765625, -6.85498046875, -6.153076171875, -5.451171875, -4.749267578125, -4.04736328125, -3.345458984375, -2.6435546875, -1.941650390625, -1.23974609375, -0.537841796875, 0.1640625, 0.865966796875, 1.56787109375, 2.269775390625, 2.9716796875, 3.673583984375, 4.37548828125, 5.077392578125, 5.779296875, 6.481201171875, 7.18310546875, 7.885009765625, 8.5869140625, 9.288818359375, 9.99072265625, 10.692626953125, 11.39453125, 12.096435546875, 12.79833984375, 13.500244140625, 14.2021484375, 14.904052734375, 15.60595703125, 16.307861328125, 17.009765625, 17.711669921875, 18.41357421875, 19.115478515625, 19.8173828125, 20.519287109375, 21.22119140625, 21.923095703125, 22.625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 13.0, 20.0, 25.0, 48.0, 95.0, 246.0, 826.0, 3844.0, 33458.0, 925655.0, 76146.0, 6418.0, 1185.0, 336.0, 114.0, 48.0, 24.0, 17.0, 5.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.1640625, -10.8321533203125, -10.500244140625, -10.1683349609375, -9.83642578125, -9.5045166015625, -9.172607421875, -8.8406982421875, -8.5087890625, -8.1768798828125, -7.844970703125, -7.5130615234375, -7.18115234375, -6.8492431640625, -6.517333984375, -6.1854248046875, -5.853515625, -5.5216064453125, -5.189697265625, -4.8577880859375, -4.52587890625, -4.1939697265625, -3.862060546875, -3.5301513671875, -3.1982421875, -2.8663330078125, -2.534423828125, -2.2025146484375, -1.87060546875, -1.5386962890625, -1.206787109375, -0.8748779296875, -0.54296875, -0.2110595703125, 0.120849609375, 0.4527587890625, 0.78466796875, 1.1165771484375, 1.448486328125, 1.7803955078125, 2.1123046875, 2.4442138671875, 2.776123046875, 3.1080322265625, 3.43994140625, 3.7718505859375, 4.103759765625, 4.4356689453125, 4.767578125, 5.0994873046875, 5.431396484375, 5.7633056640625, 6.09521484375, 6.4271240234375, 6.759033203125, 7.0909423828125, 7.4228515625, 7.7547607421875, 8.086669921875, 8.4185791015625, 8.75048828125, 9.0823974609375, 9.414306640625, 9.7462158203125, 10.078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 12.0, 13.0, 18.0, 23.0, 29.0, 39.0, 64.0, 129.0, 224.0, 182.0, 86.0, 55.0, 29.0, 18.0, 12.0, 15.0, 6.0, 6.0, 4.0, 10.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011968612670898438, -0.0011520981788635254, -0.001107335090637207, -0.0010625720024108887, -0.0010178089141845703, -0.000973045825958252, -0.0009282827377319336, -0.0008835196495056152, -0.0008387565612792969, -0.0007939934730529785, -0.0007492303848266602, -0.0007044672966003418, -0.0006597042083740234, -0.0006149411201477051, -0.0005701780319213867, -0.0005254149436950684, -0.00048065185546875, -0.00043588876724243164, -0.0003911256790161133, -0.0003463625907897949, -0.00030159950256347656, -0.0002568364143371582, -0.00021207332611083984, -0.00016731023788452148, -0.00012254714965820312, -7.778406143188477e-05, -3.3020973205566406e-05, 1.1742115020751953e-05, 5.650520324707031e-05, 0.00010126829147338867, 0.00014603137969970703, 0.0001907944679260254, 0.00023555755615234375, 0.0002803206443786621, 0.00032508373260498047, 0.00036984682083129883, 0.0004146099090576172, 0.00045937299728393555, 0.0005041360855102539, 0.0005488991737365723, 0.0005936622619628906, 0.000638425350189209, 0.0006831884384155273, 0.0007279515266418457, 0.0007727146148681641, 0.0008174777030944824, 0.0008622407913208008, 0.0009070038795471191, 0.0009517669677734375, 0.0009965300559997559, 0.0010412931442260742, 0.0010860562324523926, 0.001130819320678711, 0.0011755824089050293, 0.0012203454971313477, 0.001265108585357666, 0.0013098716735839844, 0.0013546347618103027, 0.001399397850036621, 0.0014441609382629395, 0.0014889240264892578, 0.0015336871147155762, 0.0015784502029418945, 0.0016232132911682129, 0.0016679763793945312]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 9.0, 16.0, 15.0, 48.0, 149.0, 442.0, 2295.0, 96934.0, 941833.0, 5782.0, 693.0, 193.0, 76.0, 29.0, 14.0, 8.0, 4.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.251220703125, -19.65869140625, -19.066162109375, -18.4736328125, -17.881103515625, -17.28857421875, -16.696044921875, -16.103515625, -15.510986328125, -14.91845703125, -14.325927734375, -13.7333984375, -13.140869140625, -12.54833984375, -11.955810546875, -11.36328125, -10.770751953125, -10.17822265625, -9.585693359375, -8.9931640625, -8.400634765625, -7.80810546875, -7.215576171875, -6.623046875, -6.030517578125, -5.43798828125, -4.845458984375, -4.2529296875, -3.660400390625, -3.06787109375, -2.475341796875, -1.8828125, -1.290283203125, -0.69775390625, -0.105224609375, 0.4873046875, 1.079833984375, 1.67236328125, 2.264892578125, 2.857421875, 3.449951171875, 4.04248046875, 4.635009765625, 5.2275390625, 5.820068359375, 6.41259765625, 7.005126953125, 7.59765625, 8.190185546875, 8.78271484375, 9.375244140625, 9.9677734375, 10.560302734375, 11.15283203125, 11.745361328125, 12.337890625, 12.930419921875, 13.52294921875, 14.115478515625, 14.7080078125, 15.300537109375, 15.89306640625, 16.485595703125, 17.078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 7.0, 23.0, 26.0, 80.0, 178.0, 334.0, 183.0, 71.0, 38.0, 15.0, 12.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8125, -12.418212890625, -12.02392578125, -11.629638671875, -11.2353515625, -10.841064453125, -10.44677734375, -10.052490234375, -9.658203125, -9.263916015625, -8.86962890625, -8.475341796875, -8.0810546875, -7.686767578125, -7.29248046875, -6.898193359375, -6.50390625, -6.109619140625, -5.71533203125, -5.321044921875, -4.9267578125, -4.532470703125, -4.13818359375, -3.743896484375, -3.349609375, -2.955322265625, -2.56103515625, -2.166748046875, -1.7724609375, -1.378173828125, -0.98388671875, -0.589599609375, -0.1953125, 0.198974609375, 0.59326171875, 0.987548828125, 1.3818359375, 1.776123046875, 2.17041015625, 2.564697265625, 2.958984375, 3.353271484375, 3.74755859375, 4.141845703125, 4.5361328125, 4.930419921875, 5.32470703125, 5.718994140625, 6.11328125, 6.507568359375, 6.90185546875, 7.296142578125, 7.6904296875, 8.084716796875, 8.47900390625, 8.873291015625, 9.267578125, 9.661865234375, 10.05615234375, 10.450439453125, 10.8447265625, 11.239013671875, 11.63330078125, 12.027587890625, 12.421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 12.0, 15.0, 17.0, 50.0, 87.0, 194.0, 379.0, 150.0, 50.0, 20.0, 10.0, 6.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-178.47137451171875, -174.04998779296875, -169.62860107421875, -165.2071990966797, -160.7858123779297, -156.3644256591797, -151.9430389404297, -147.52163696289062, -143.10025024414062, -138.67886352539062, -134.25747680664062, -129.83607482910156, -125.41468811035156, -120.99330139160156, -116.57191467285156, -112.15052032470703, -107.72913360595703, -103.30774688720703, -98.8863525390625, -94.4649658203125, -90.04357147216797, -85.62218475341797, -81.20079040527344, -76.77940368652344, -72.35801696777344, -67.93663024902344, -63.515235900878906, -59.093849182128906, -54.672454833984375, -50.251068115234375, -45.82967758178711, -41.408287048339844, -36.98689270019531, -32.56550216674805, -28.14411163330078, -23.72272300720215, -19.301332473754883, -14.879941940307617, -10.458553314208984, -6.037162780761719, -1.6157722473144531, 2.8056178092956543, 7.227007865905762, 11.648397445678711, 16.069787979125977, 20.491178512573242, 24.912567138671875, 29.33395767211914, 33.755348205566406, 38.17673873901367, 42.59812927246094, 47.01951599121094, 51.44091033935547, 55.86229705810547, 60.283687591552734, 64.705078125, 69.12646484375, 73.5478515625, 77.96924591064453, 82.39063262939453, 86.81202697753906, 91.23341369628906, 95.65480041503906, 100.0761947631836, 104.49758911132812]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 7.0, 4.0, 6.0, 9.0, 9.0, 9.0, 8.0, 23.0, 16.0, 17.0, 20.0, 22.0, 20.0, 37.0, 28.0, 32.0, 28.0, 53.0, 66.0, 99.0, 89.0, 69.0, 39.0, 31.0, 30.0, 35.0, 29.0, 20.0, 13.0, 16.0, 17.0, 9.0, 15.0, 16.0, 11.0, 7.0, 8.0, 3.0, 6.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-68.72903442382812, -66.56958770751953, -64.41014862060547, -62.250701904296875, -60.09125518798828, -57.93181228637695, -55.772369384765625, -53.61292266845703, -51.4534797668457, -49.294036865234375, -47.13459014892578, -44.97514724731445, -42.815704345703125, -40.65625762939453, -38.4968147277832, -36.337371826171875, -34.17792510986328, -32.01848220825195, -29.85903549194336, -27.69959259033203, -25.54014778137207, -23.38070297241211, -21.22126007080078, -19.06181526184082, -16.90237045288086, -14.742925643920898, -12.583481788635254, -10.42403793334961, -8.264593124389648, -6.1051483154296875, -3.945704460144043, -1.7862606048583984, 0.3731842041015625, 2.5326285362243652, 4.692072868347168, 6.851517200469971, 9.010961532592773, 11.170406341552734, 13.329850196838379, 15.489294052124023, 17.648738861083984, 19.808183670043945, 21.967628479003906, 24.127071380615234, 26.286516189575195, 28.445960998535156, 30.605403900146484, 32.76484680175781, 34.924293518066406, 37.083736419677734, 39.24318313598633, 41.402626037597656, 43.56207275390625, 45.72151565551758, 47.880958557128906, 50.0404052734375, 52.19984817504883, 54.359291076660156, 56.51873779296875, 58.67818069458008, 60.837623596191406, 62.9970703125, 65.1565170288086, 67.31595611572266, 69.47540283203125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 11.0, 13.0, 15.0, 29.0, 57.0, 95.0, 195.0, 387.0, 731.0, 1691.0, 4567.0, 16015.0, 97786.0, 1041812.0, 2605531.0, 371246.0, 40148.0, 8725.0, 2922.0, 1208.0, 513.0, 255.0, 143.0, 78.0, 45.0, 27.0, 16.0, 10.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.7071533203125, -8.445556640625, -8.1839599609375, -7.92236328125, -7.6607666015625, -7.399169921875, -7.1375732421875, -6.8759765625, -6.6143798828125, -6.352783203125, -6.0911865234375, -5.82958984375, -5.5679931640625, -5.306396484375, -5.0447998046875, -4.783203125, -4.5216064453125, -4.260009765625, -3.9984130859375, -3.73681640625, -3.4752197265625, -3.213623046875, -2.9520263671875, -2.6904296875, -2.4288330078125, -2.167236328125, -1.9056396484375, -1.64404296875, -1.3824462890625, -1.120849609375, -0.8592529296875, -0.59765625, -0.3360595703125, -0.074462890625, 0.1871337890625, 0.44873046875, 0.7103271484375, 0.971923828125, 1.2335205078125, 1.4951171875, 1.7567138671875, 2.018310546875, 2.2799072265625, 2.54150390625, 2.8031005859375, 3.064697265625, 3.3262939453125, 3.587890625, 3.8494873046875, 4.111083984375, 4.3726806640625, 4.63427734375, 4.8958740234375, 5.157470703125, 5.4190673828125, 5.6806640625, 5.9422607421875, 6.203857421875, 6.4654541015625, 6.72705078125, 6.9886474609375, 7.250244140625, 7.5118408203125, 7.7734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 7.0, 10.0, 12.0, 12.0, 17.0, 13.0, 21.0, 17.0, 32.0, 17.0, 24.0, 33.0, 42.0, 41.0, 32.0, 50.0, 38.0, 29.0, 43.0, 51.0, 47.0, 42.0, 46.0, 36.0, 40.0, 41.0, 33.0, 24.0, 23.0, 20.0, 15.0, 24.0, 19.0, 15.0, 4.0, 6.0, 6.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.45916748046875, -4.3050537109375, -4.15093994140625, -3.996826171875, -3.84271240234375, -3.6885986328125, -3.53448486328125, -3.38037109375, -3.22625732421875, -3.0721435546875, -2.91802978515625, -2.763916015625, -2.60980224609375, -2.4556884765625, -2.30157470703125, -2.1474609375, -1.99334716796875, -1.8392333984375, -1.68511962890625, -1.531005859375, -1.37689208984375, -1.2227783203125, -1.06866455078125, -0.91455078125, -0.76043701171875, -0.6063232421875, -0.45220947265625, -0.298095703125, -0.14398193359375, 0.0101318359375, 0.16424560546875, 0.318359375, 0.47247314453125, 0.6265869140625, 0.78070068359375, 0.934814453125, 1.08892822265625, 1.2430419921875, 1.39715576171875, 1.55126953125, 1.70538330078125, 1.8594970703125, 2.01361083984375, 2.167724609375, 2.32183837890625, 2.4759521484375, 2.63006591796875, 2.7841796875, 2.93829345703125, 3.0924072265625, 3.24652099609375, 3.400634765625, 3.55474853515625, 3.7088623046875, 3.86297607421875, 4.01708984375, 4.17120361328125, 4.3253173828125, 4.47943115234375, 4.633544921875, 4.78765869140625, 4.9417724609375, 5.09588623046875, 5.25]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 17.0, 62.0, 132.0, 371.0, 1944.0, 447515.0, 3739835.0, 3528.0, 541.0, 204.0, 72.0, 28.0, 18.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.9375, -38.4638671875, -36.990234375, -35.5166015625, -34.04296875, -32.5693359375, -31.095703125, -29.6220703125, -28.1484375, -26.6748046875, -25.201171875, -23.7275390625, -22.25390625, -20.7802734375, -19.306640625, -17.8330078125, -16.359375, -14.8857421875, -13.412109375, -11.9384765625, -10.46484375, -8.9912109375, -7.517578125, -6.0439453125, -4.5703125, -3.0966796875, -1.623046875, -0.1494140625, 1.32421875, 2.7978515625, 4.271484375, 5.7451171875, 7.21875, 8.6923828125, 10.166015625, 11.6396484375, 13.11328125, 14.5869140625, 16.060546875, 17.5341796875, 19.0078125, 20.4814453125, 21.955078125, 23.4287109375, 24.90234375, 26.3759765625, 27.849609375, 29.3232421875, 30.796875, 32.2705078125, 33.744140625, 35.2177734375, 36.69140625, 38.1650390625, 39.638671875, 41.1123046875, 42.5859375, 44.0595703125, 45.533203125, 47.0068359375, 48.48046875, 49.9541015625, 51.427734375, 52.9013671875, 54.375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 6.0, 12.0, 11.0, 17.0, 40.0, 80.0, 143.0, 364.0, 830.0, 1212.0, 753.0, 299.0, 149.0, 65.0, 44.0, 18.0, 17.0, 7.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.234375, -10.623779296875, -10.01318359375, -9.402587890625, -8.7919921875, -8.181396484375, -7.57080078125, -6.960205078125, -6.349609375, -5.739013671875, -5.12841796875, -4.517822265625, -3.9072265625, -3.296630859375, -2.68603515625, -2.075439453125, -1.46484375, -0.854248046875, -0.24365234375, 0.366943359375, 0.9775390625, 1.588134765625, 2.19873046875, 2.809326171875, 3.419921875, 4.030517578125, 4.64111328125, 5.251708984375, 5.8623046875, 6.472900390625, 7.08349609375, 7.694091796875, 8.3046875, 8.915283203125, 9.52587890625, 10.136474609375, 10.7470703125, 11.357666015625, 11.96826171875, 12.578857421875, 13.189453125, 13.800048828125, 14.41064453125, 15.021240234375, 15.6318359375, 16.242431640625, 16.85302734375, 17.463623046875, 18.07421875, 18.684814453125, 19.29541015625, 19.906005859375, 20.5166015625, 21.127197265625, 21.73779296875, 22.348388671875, 22.958984375, 23.569580078125, 24.18017578125, 24.790771484375, 25.4013671875, 26.011962890625, 26.62255859375, 27.233154296875, 27.84375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 11.0, 37.0, 125.0, 299.0, 326.0, 134.0, 33.0, 13.0, 8.0, 6.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-262.331298828125, -255.21958923339844, -248.1078643798828, -240.99615478515625, -233.8844451904297, -226.77273559570312, -219.6610107421875, -212.54930114746094, -205.43759155273438, -198.3258819580078, -191.2141571044922, -184.10244750976562, -176.99073791503906, -169.8790283203125, -162.76730346679688, -155.6555938720703, -148.5438690185547, -141.43215942382812, -134.3204345703125, -127.20872497558594, -120.09701538085938, -112.98529815673828, -105.87358093261719, -98.76187133789062, -91.65015411376953, -84.53843688964844, -77.42672729492188, -70.31501007080078, -63.20329666137695, -56.091583251953125, -48.97986602783203, -41.8681526184082, -34.75642395019531, -27.644710540771484, -20.532995223999023, -13.421279907226562, -6.309566497802734, 0.8021469116210938, 7.9138641357421875, 15.025577545166016, 22.137290954589844, 29.249004364013672, 36.3607177734375, 43.472434997558594, 50.58414840698242, 57.69586181640625, 64.80757904052734, 71.91929626464844, 79.031005859375, 86.1427230834961, 93.25443267822266, 100.36614990234375, 107.47785949707031, 114.5895767211914, 121.7012939453125, 128.81300354003906, 135.92471313476562, 143.0364227294922, 150.1481475830078, 157.25985717773438, 164.37156677246094, 171.4832763671875, 178.59500122070312, 185.7067108154297, 192.8184356689453]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 9.0, 12.0, 5.0, 7.0, 8.0, 6.0, 15.0, 20.0, 32.0, 21.0, 30.0, 32.0, 33.0, 38.0, 40.0, 43.0, 48.0, 46.0, 56.0, 53.0, 41.0, 48.0, 53.0, 28.0, 45.0, 30.0, 31.0, 27.0, 33.0, 27.0, 15.0, 12.0, 13.0, 11.0, 13.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-68.60537719726562, -66.64068603515625, -64.67599487304688, -62.711299896240234, -60.746604919433594, -58.78191375732422, -56.817222595214844, -54.8525276184082, -52.88783264160156, -50.92314147949219, -48.95844650268555, -46.99375534057617, -45.02906036376953, -43.064369201660156, -41.09967803955078, -39.13498306274414, -37.170291900634766, -35.20560073852539, -33.24090576171875, -31.276214599609375, -29.311519622802734, -27.34682846069336, -25.38213539123535, -23.417442321777344, -21.452749252319336, -19.488056182861328, -17.52336311340332, -15.558670997619629, -13.593977928161621, -11.629284858703613, -9.664592742919922, -7.699899673461914, -5.735206604003906, -3.7705137729644775, -1.8058209419250488, 0.15887165069580078, 2.1235647201538086, 4.088257789611816, 6.052949905395508, 8.017642974853516, 9.982336044311523, 11.947029113769531, 13.911722183227539, 15.87641429901123, 17.841106414794922, 19.805801391601562, 21.770492553710938, 23.735185623168945, 25.699878692626953, 27.66457176208496, 29.62926483154297, 31.593955993652344, 33.558650970458984, 35.52334213256836, 37.488037109375, 39.452728271484375, 41.41741943359375, 43.382110595703125, 45.346805572509766, 47.31149673461914, 49.27619171142578, 51.240882873535156, 53.20557403564453, 55.17026901245117, 57.13496398925781]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 9.0, 15.0, 12.0, 31.0, 50.0, 69.0, 100.0, 190.0, 276.0, 466.0, 914.0, 1909.0, 4264.0, 10600.0, 28629.0, 84386.0, 273120.0, 414397.0, 150997.0, 48725.0, 16838.0, 6728.0, 2861.0, 1361.0, 647.0, 355.0, 216.0, 122.0, 84.0, 50.0, 42.0, 19.0, 15.0, 12.0, 10.0, 8.0, 6.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.03125, -9.7545166015625, -9.477783203125, -9.2010498046875, -8.92431640625, -8.6475830078125, -8.370849609375, -8.0941162109375, -7.8173828125, -7.5406494140625, -7.263916015625, -6.9871826171875, -6.71044921875, -6.4337158203125, -6.156982421875, -5.8802490234375, -5.603515625, -5.3267822265625, -5.050048828125, -4.7733154296875, -4.49658203125, -4.2198486328125, -3.943115234375, -3.6663818359375, -3.3896484375, -3.1129150390625, -2.836181640625, -2.5594482421875, -2.28271484375, -2.0059814453125, -1.729248046875, -1.4525146484375, -1.17578125, -0.8990478515625, -0.622314453125, -0.3455810546875, -0.06884765625, 0.2078857421875, 0.484619140625, 0.7613525390625, 1.0380859375, 1.3148193359375, 1.591552734375, 1.8682861328125, 2.14501953125, 2.4217529296875, 2.698486328125, 2.9752197265625, 3.251953125, 3.5286865234375, 3.805419921875, 4.0821533203125, 4.35888671875, 4.6356201171875, 4.912353515625, 5.1890869140625, 5.4658203125, 5.7425537109375, 6.019287109375, 6.2960205078125, 6.57275390625, 6.8494873046875, 7.126220703125, 7.4029541015625, 7.6796875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 10.0, 8.0, 6.0, 6.0, 12.0, 15.0, 18.0, 22.0, 23.0, 40.0, 33.0, 38.0, 39.0, 36.0, 41.0, 47.0, 57.0, 48.0, 41.0, 53.0, 48.0, 41.0, 44.0, 38.0, 29.0, 29.0, 22.0, 32.0, 24.0, 19.0, 17.0, 15.0, 12.0, 12.0, 7.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.44384765625, -4.2744140625, -4.10498046875, -3.935546875, -3.76611328125, -3.5966796875, -3.42724609375, -3.2578125, -3.08837890625, -2.9189453125, -2.74951171875, -2.580078125, -2.41064453125, -2.2412109375, -2.07177734375, -1.90234375, -1.73291015625, -1.5634765625, -1.39404296875, -1.224609375, -1.05517578125, -0.8857421875, -0.71630859375, -0.546875, -0.37744140625, -0.2080078125, -0.03857421875, 0.130859375, 0.30029296875, 0.4697265625, 0.63916015625, 0.80859375, 0.97802734375, 1.1474609375, 1.31689453125, 1.486328125, 1.65576171875, 1.8251953125, 1.99462890625, 2.1640625, 2.33349609375, 2.5029296875, 2.67236328125, 2.841796875, 3.01123046875, 3.1806640625, 3.35009765625, 3.51953125, 3.68896484375, 3.8583984375, 4.02783203125, 4.197265625, 4.36669921875, 4.5361328125, 4.70556640625, 4.875, 5.04443359375, 5.2138671875, 5.38330078125, 5.552734375, 5.72216796875, 5.8916015625, 6.06103515625, 6.23046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 10.0, 9.0, 19.0, 16.0, 29.0, 30.0, 48.0, 76.0, 112.0, 163.0, 240.0, 379.0, 587.0, 1315.0, 2949.0, 10774.0, 89488.0, 853206.0, 73806.0, 9649.0, 2754.0, 1206.0, 659.0, 340.0, 213.0, 156.0, 98.0, 61.0, 44.0, 39.0, 16.0, 14.0, 19.0, 7.0, 6.0, 8.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.875, -23.22021484375, -22.5654296875, -21.91064453125, -21.255859375, -20.60107421875, -19.9462890625, -19.29150390625, -18.63671875, -17.98193359375, -17.3271484375, -16.67236328125, -16.017578125, -15.36279296875, -14.7080078125, -14.05322265625, -13.3984375, -12.74365234375, -12.0888671875, -11.43408203125, -10.779296875, -10.12451171875, -9.4697265625, -8.81494140625, -8.16015625, -7.50537109375, -6.8505859375, -6.19580078125, -5.541015625, -4.88623046875, -4.2314453125, -3.57666015625, -2.921875, -2.26708984375, -1.6123046875, -0.95751953125, -0.302734375, 0.35205078125, 1.0068359375, 1.66162109375, 2.31640625, 2.97119140625, 3.6259765625, 4.28076171875, 4.935546875, 5.59033203125, 6.2451171875, 6.89990234375, 7.5546875, 8.20947265625, 8.8642578125, 9.51904296875, 10.173828125, 10.82861328125, 11.4833984375, 12.13818359375, 12.79296875, 13.44775390625, 14.1025390625, 14.75732421875, 15.412109375, 16.06689453125, 16.7216796875, 17.37646484375, 18.03125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 10.0, 4.0, 4.0, 16.0, 9.0, 12.0, 15.0, 18.0, 28.0, 24.0, 42.0, 23.0, 43.0, 44.0, 48.0, 64.0, 61.0, 65.0, 65.0, 45.0, 51.0, 49.0, 33.0, 37.0, 29.0, 25.0, 31.0, 26.0, 11.0, 13.0, 11.0, 9.0, 3.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.921875, -21.26123046875, -20.6005859375, -19.93994140625, -19.279296875, -18.61865234375, -17.9580078125, -17.29736328125, -16.63671875, -15.97607421875, -15.3154296875, -14.65478515625, -13.994140625, -13.33349609375, -12.6728515625, -12.01220703125, -11.3515625, -10.69091796875, -10.0302734375, -9.36962890625, -8.708984375, -8.04833984375, -7.3876953125, -6.72705078125, -6.06640625, -5.40576171875, -4.7451171875, -4.08447265625, -3.423828125, -2.76318359375, -2.1025390625, -1.44189453125, -0.78125, -0.12060546875, 0.5400390625, 1.20068359375, 1.861328125, 2.52197265625, 3.1826171875, 3.84326171875, 4.50390625, 5.16455078125, 5.8251953125, 6.48583984375, 7.146484375, 7.80712890625, 8.4677734375, 9.12841796875, 9.7890625, 10.44970703125, 11.1103515625, 11.77099609375, 12.431640625, 13.09228515625, 13.7529296875, 14.41357421875, 15.07421875, 15.73486328125, 16.3955078125, 17.05615234375, 17.716796875, 18.37744140625, 19.0380859375, 19.69873046875, 20.359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 1.0, 7.0, 9.0, 10.0, 10.0, 38.0, 46.0, 67.0, 94.0, 200.0, 432.0, 1227.0, 5104.0, 55846.0, 950498.0, 29454.0, 3769.0, 925.0, 338.0, 188.0, 108.0, 57.0, 34.0, 24.0, 17.0, 20.0, 11.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.71875, -10.4071044921875, -10.095458984375, -9.7838134765625, -9.47216796875, -9.1605224609375, -8.848876953125, -8.5372314453125, -8.2255859375, -7.9139404296875, -7.602294921875, -7.2906494140625, -6.97900390625, -6.6673583984375, -6.355712890625, -6.0440673828125, -5.732421875, -5.4207763671875, -5.109130859375, -4.7974853515625, -4.48583984375, -4.1741943359375, -3.862548828125, -3.5509033203125, -3.2392578125, -2.9276123046875, -2.615966796875, -2.3043212890625, -1.99267578125, -1.6810302734375, -1.369384765625, -1.0577392578125, -0.74609375, -0.4344482421875, -0.122802734375, 0.1888427734375, 0.50048828125, 0.8121337890625, 1.123779296875, 1.4354248046875, 1.7470703125, 2.0587158203125, 2.370361328125, 2.6820068359375, 2.99365234375, 3.3052978515625, 3.616943359375, 3.9285888671875, 4.240234375, 4.5518798828125, 4.863525390625, 5.1751708984375, 5.48681640625, 5.7984619140625, 6.110107421875, 6.4217529296875, 6.7333984375, 7.0450439453125, 7.356689453125, 7.6683349609375, 7.97998046875, 8.2916259765625, 8.603271484375, 8.9149169921875, 9.2265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 6.0, 8.0, 9.0, 13.0, 14.0, 34.0, 49.0, 77.0, 154.0, 223.0, 138.0, 68.0, 51.0, 37.0, 22.0, 15.0, 7.0, 9.0, 7.0, 4.0, 9.0, 6.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0016536712646484375, -0.0016117841005325317, -0.001569896936416626, -0.0015280097723007202, -0.0014861226081848145, -0.0014442354440689087, -0.001402348279953003, -0.0013604611158370972, -0.0013185739517211914, -0.0012766867876052856, -0.0012347996234893799, -0.0011929124593734741, -0.0011510252952575684, -0.0011091381311416626, -0.0010672509670257568, -0.001025363802909851, -0.0009834766387939453, -0.0009415894746780396, -0.0008997023105621338, -0.000857815146446228, -0.0008159279823303223, -0.0007740408182144165, -0.0007321536540985107, -0.000690266489982605, -0.0006483793258666992, -0.0006064921617507935, -0.0005646049976348877, -0.0005227178335189819, -0.00048083066940307617, -0.0004389435052871704, -0.00039705634117126465, -0.0003551691770553589, -0.0003132820129394531, -0.00027139484882354736, -0.0002295076847076416, -0.00018762052059173584, -0.00014573335647583008, -0.00010384619235992432, -6.195902824401855e-05, -2.0071864128112793e-05, 2.181529998779297e-05, 6.370246410369873e-05, 0.00010558962821960449, 0.00014747679233551025, 0.00018936395645141602, 0.00023125112056732178, 0.00027313828468322754, 0.0003150254487991333, 0.00035691261291503906, 0.0003987997770309448, 0.0004406869411468506, 0.00048257410526275635, 0.0005244612693786621, 0.0005663484334945679, 0.0006082355976104736, 0.0006501227617263794, 0.0006920099258422852, 0.0007338970899581909, 0.0007757842540740967, 0.0008176714181900024, 0.0008595585823059082, 0.000901445746421814, 0.0009433329105377197, 0.0009852200746536255, 0.0010271072387695312]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 12.0, 9.0, 26.0, 28.0, 47.0, 95.0, 267.0, 609.0, 2214.0, 18985.0, 933759.0, 85650.0, 5180.0, 992.0, 360.0, 140.0, 77.0, 42.0, 28.0, 12.0, 10.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.9140625, -12.58056640625, -12.2470703125, -11.91357421875, -11.580078125, -11.24658203125, -10.9130859375, -10.57958984375, -10.24609375, -9.91259765625, -9.5791015625, -9.24560546875, -8.912109375, -8.57861328125, -8.2451171875, -7.91162109375, -7.578125, -7.24462890625, -6.9111328125, -6.57763671875, -6.244140625, -5.91064453125, -5.5771484375, -5.24365234375, -4.91015625, -4.57666015625, -4.2431640625, -3.90966796875, -3.576171875, -3.24267578125, -2.9091796875, -2.57568359375, -2.2421875, -1.90869140625, -1.5751953125, -1.24169921875, -0.908203125, -0.57470703125, -0.2412109375, 0.09228515625, 0.42578125, 0.75927734375, 1.0927734375, 1.42626953125, 1.759765625, 2.09326171875, 2.4267578125, 2.76025390625, 3.09375, 3.42724609375, 3.7607421875, 4.09423828125, 4.427734375, 4.76123046875, 5.0947265625, 5.42822265625, 5.76171875, 6.09521484375, 6.4287109375, 6.76220703125, 7.095703125, 7.42919921875, 7.7626953125, 8.09619140625, 8.4296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 8.0, 3.0, 3.0, 5.0, 4.0, 5.0, 14.0, 12.0, 17.0, 26.0, 34.0, 49.0, 60.0, 90.0, 118.0, 151.0, 94.0, 78.0, 53.0, 33.0, 38.0, 29.0, 17.0, 14.0, 11.0, 13.0, 4.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.6251220703125, -5.461181640625, -5.2972412109375, -5.13330078125, -4.9693603515625, -4.805419921875, -4.6414794921875, -4.4775390625, -4.3135986328125, -4.149658203125, -3.9857177734375, -3.82177734375, -3.6578369140625, -3.493896484375, -3.3299560546875, -3.166015625, -3.0020751953125, -2.838134765625, -2.6741943359375, -2.51025390625, -2.3463134765625, -2.182373046875, -2.0184326171875, -1.8544921875, -1.6905517578125, -1.526611328125, -1.3626708984375, -1.19873046875, -1.0347900390625, -0.870849609375, -0.7069091796875, -0.54296875, -0.3790283203125, -0.215087890625, -0.0511474609375, 0.11279296875, 0.2767333984375, 0.440673828125, 0.6046142578125, 0.7685546875, 0.9324951171875, 1.096435546875, 1.2603759765625, 1.42431640625, 1.5882568359375, 1.752197265625, 1.9161376953125, 2.080078125, 2.2440185546875, 2.407958984375, 2.5718994140625, 2.73583984375, 2.8997802734375, 3.063720703125, 3.2276611328125, 3.3916015625, 3.5555419921875, 3.719482421875, 3.8834228515625, 4.04736328125, 4.2113037109375, 4.375244140625, 4.5391845703125, 4.703125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 60.0, 656.0, 238.0, 32.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-693.8194580078125, -679.603271484375, -665.3870849609375, -651.1708984375, -636.9547119140625, -622.738525390625, -608.5223388671875, -594.30615234375, -580.0899658203125, -565.873779296875, -551.6575927734375, -537.44140625, -523.2252197265625, -509.009033203125, -494.7928466796875, -480.57666015625, -466.3605041503906, -452.1443176269531, -437.9281311035156, -423.7119445800781, -409.4957580566406, -395.2795715332031, -381.06341552734375, -366.84722900390625, -352.63104248046875, -338.41485595703125, -324.19866943359375, -309.98248291015625, -295.76629638671875, -281.55010986328125, -267.33392333984375, -253.1177520751953, -238.90151977539062, -224.68533325195312, -210.46914672851562, -196.25296020507812, -182.03677368164062, -167.82058715820312, -153.6044158935547, -139.3882293701172, -125.17204284667969, -110.95585632324219, -96.73966979980469, -82.52349090576172, -68.30730438232422, -54.09111785888672, -39.87493896484375, -25.65875244140625, -11.44256591796875, 2.773618698120117, 16.989803314208984, 31.20598602294922, 45.42217254638672, 59.63835906982422, 73.85453796386719, 88.07072448730469, 102.28691101074219, 116.50309753417969, 130.7192840576172, 144.93545532226562, 159.15164184570312, 173.36782836914062, 187.58401489257812, 201.80020141601562, 216.01638793945312]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 4.0, 6.0, 18.0, 14.0, 19.0, 25.0, 30.0, 31.0, 34.0, 28.0, 34.0, 50.0, 124.0, 170.0, 70.0, 39.0, 49.0, 37.0, 26.0, 24.0, 26.0, 28.0, 13.0, 15.0, 17.0, 7.0, 10.0, 8.0, 5.0, 1.0, 7.0, 3.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-101.43122863769531, -98.28334045410156, -95.13545989990234, -91.9875717163086, -88.83969116210938, -85.69180297851562, -82.54391479492188, -79.39603424072266, -76.24815368652344, -73.10026550292969, -69.95238494873047, -66.80449676513672, -63.6566162109375, -60.50872802734375, -57.360843658447266, -54.21295928955078, -51.06507110595703, -47.91718673706055, -44.76930236816406, -41.62141418457031, -38.473533630371094, -35.325645446777344, -32.17776107788086, -29.029876708984375, -25.88199234008789, -22.734107971191406, -19.586223602294922, -16.438337326049805, -13.29045295715332, -10.142568588256836, -6.994682312011719, -3.8467979431152344, -0.69891357421875, 2.4489712715148926, 5.596856117248535, 8.744741439819336, 11.89262580871582, 15.040510177612305, 18.188396453857422, 21.336280822753906, 24.48416519165039, 27.632049560546875, 30.77993392944336, 33.927818298339844, 37.075706481933594, 40.22358703613281, 43.37147521972656, 46.51935958862305, 49.66724395751953, 52.815128326416016, 55.9630126953125, 59.11090087890625, 62.25878143310547, 65.40666961669922, 68.55455017089844, 71.70243835449219, 74.85032653808594, 77.99821472167969, 81.1460952758789, 84.29398345947266, 87.44186401367188, 90.58975219726562, 93.73764038085938, 96.8855209350586, 100.03340148925781]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 8.0, 12.0, 12.0, 15.0, 28.0, 52.0, 85.0, 123.0, 203.0, 333.0, 569.0, 1087.0, 2200.0, 5725.0, 21654.0, 209384.0, 2352085.0, 1475914.0, 102566.0, 14152.0, 4260.0, 1719.0, 863.0, 480.0, 301.0, 165.0, 94.0, 74.0, 41.0, 34.0, 15.0, 8.0, 9.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.6641845703125, -11.273681640625, -10.8831787109375, -10.49267578125, -10.1021728515625, -9.711669921875, -9.3211669921875, -8.9306640625, -8.5401611328125, -8.149658203125, -7.7591552734375, -7.36865234375, -6.9781494140625, -6.587646484375, -6.1971435546875, -5.806640625, -5.4161376953125, -5.025634765625, -4.6351318359375, -4.24462890625, -3.8541259765625, -3.463623046875, -3.0731201171875, -2.6826171875, -2.2921142578125, -1.901611328125, -1.5111083984375, -1.12060546875, -0.7301025390625, -0.339599609375, 0.0509033203125, 0.44140625, 0.8319091796875, 1.222412109375, 1.6129150390625, 2.00341796875, 2.3939208984375, 2.784423828125, 3.1749267578125, 3.5654296875, 3.9559326171875, 4.346435546875, 4.7369384765625, 5.12744140625, 5.5179443359375, 5.908447265625, 6.2989501953125, 6.689453125, 7.0799560546875, 7.470458984375, 7.8609619140625, 8.25146484375, 8.6419677734375, 9.032470703125, 9.4229736328125, 9.8134765625, 10.2039794921875, 10.594482421875, 10.9849853515625, 11.37548828125, 11.7659912109375, 12.156494140625, 12.5469970703125, 12.9375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 10.0, 9.0, 5.0, 9.0, 13.0, 13.0, 12.0, 24.0, 22.0, 29.0, 27.0, 26.0, 26.0, 33.0, 37.0, 34.0, 42.0, 47.0, 47.0, 41.0, 50.0, 50.0, 37.0, 40.0, 34.0, 33.0, 35.0, 26.0, 32.0, 26.0, 19.0, 22.0, 23.0, 11.0, 16.0, 6.0, 9.0, 3.0, 3.0, 4.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30859375, -4.15789794921875, -4.0072021484375, -3.85650634765625, -3.705810546875, -3.55511474609375, -3.4044189453125, -3.25372314453125, -3.10302734375, -2.95233154296875, -2.8016357421875, -2.65093994140625, -2.500244140625, -2.34954833984375, -2.1988525390625, -2.04815673828125, -1.8974609375, -1.74676513671875, -1.5960693359375, -1.44537353515625, -1.294677734375, -1.14398193359375, -0.9932861328125, -0.84259033203125, -0.69189453125, -0.54119873046875, -0.3905029296875, -0.23980712890625, -0.089111328125, 0.06158447265625, 0.2122802734375, 0.36297607421875, 0.513671875, 0.66436767578125, 0.8150634765625, 0.96575927734375, 1.116455078125, 1.26715087890625, 1.4178466796875, 1.56854248046875, 1.71923828125, 1.86993408203125, 2.0206298828125, 2.17132568359375, 2.322021484375, 2.47271728515625, 2.6234130859375, 2.77410888671875, 2.9248046875, 3.07550048828125, 3.2261962890625, 3.37689208984375, 3.527587890625, 3.67828369140625, 3.8289794921875, 3.97967529296875, 4.13037109375, 4.28106689453125, 4.4317626953125, 4.58245849609375, 4.733154296875, 4.88385009765625, 5.0345458984375, 5.18524169921875, 5.3359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 11.0, 9.0, 14.0, 30.0, 65.0, 103.0, 207.0, 412.0, 1010.0, 3957.0, 362168.0, 3817162.0, 6768.0, 1358.0, 473.0, 255.0, 125.0, 62.0, 35.0, 24.0, 12.0, 11.0, 10.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.53125, -49.76123046875, -47.9912109375, -46.22119140625, -44.451171875, -42.68115234375, -40.9111328125, -39.14111328125, -37.37109375, -35.60107421875, -33.8310546875, -32.06103515625, -30.291015625, -28.52099609375, -26.7509765625, -24.98095703125, -23.2109375, -21.44091796875, -19.6708984375, -17.90087890625, -16.130859375, -14.36083984375, -12.5908203125, -10.82080078125, -9.05078125, -7.28076171875, -5.5107421875, -3.74072265625, -1.970703125, -0.20068359375, 1.5693359375, 3.33935546875, 5.109375, 6.87939453125, 8.6494140625, 10.41943359375, 12.189453125, 13.95947265625, 15.7294921875, 17.49951171875, 19.26953125, 21.03955078125, 22.8095703125, 24.57958984375, 26.349609375, 28.11962890625, 29.8896484375, 31.65966796875, 33.4296875, 35.19970703125, 36.9697265625, 38.73974609375, 40.509765625, 42.27978515625, 44.0498046875, 45.81982421875, 47.58984375, 49.35986328125, 51.1298828125, 52.89990234375, 54.669921875, 56.43994140625, 58.2099609375, 59.97998046875, 61.75]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 10.0, 14.0, 13.0, 24.0, 28.0, 63.0, 92.0, 102.0, 204.0, 347.0, 575.0, 703.0, 676.0, 427.0, 248.0, 162.0, 100.0, 78.0, 47.0, 43.0, 28.0, 20.0, 19.0, 10.0, 11.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.46875, -12.901611328125, -12.33447265625, -11.767333984375, -11.2001953125, -10.633056640625, -10.06591796875, -9.498779296875, -8.931640625, -8.364501953125, -7.79736328125, -7.230224609375, -6.6630859375, -6.095947265625, -5.52880859375, -4.961669921875, -4.39453125, -3.827392578125, -3.26025390625, -2.693115234375, -2.1259765625, -1.558837890625, -0.99169921875, -0.424560546875, 0.142578125, 0.709716796875, 1.27685546875, 1.843994140625, 2.4111328125, 2.978271484375, 3.54541015625, 4.112548828125, 4.6796875, 5.246826171875, 5.81396484375, 6.381103515625, 6.9482421875, 7.515380859375, 8.08251953125, 8.649658203125, 9.216796875, 9.783935546875, 10.35107421875, 10.918212890625, 11.4853515625, 12.052490234375, 12.61962890625, 13.186767578125, 13.75390625, 14.321044921875, 14.88818359375, 15.455322265625, 16.0224609375, 16.589599609375, 17.15673828125, 17.723876953125, 18.291015625, 18.858154296875, 19.42529296875, 19.992431640625, 20.5595703125, 21.126708984375, 21.69384765625, 22.260986328125, 22.828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 10.0, 9.0, 11.0, 12.0, 22.0, 56.0, 128.0, 202.0, 231.0, 150.0, 67.0, 38.0, 16.0, 12.0, 9.0, 8.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.5052947998047, -159.9416961669922, -152.3780975341797, -144.81448364257812, -137.25088500976562, -129.68728637695312, -122.12368774414062, -114.56008911132812, -106.9964828491211, -99.4328842163086, -91.86927795410156, -84.30567932128906, -76.74208068847656, -69.17847442626953, -61.61487579345703, -54.051273345947266, -46.4876708984375, -38.924068450927734, -31.3604679107666, -23.79686737060547, -16.233264923095703, -8.669662475585938, -1.1060638427734375, 6.457538604736328, 14.021141052246094, 21.58474349975586, 29.148344039916992, 36.711944580078125, 44.27554702758789, 51.839149475097656, 59.402748107910156, 66.96635437011719, 74.52996826171875, 82.09356689453125, 89.65717315673828, 97.22077178955078, 104.78437805175781, 112.34797668457031, 119.91157531738281, 127.47517395019531, 135.03878784179688, 142.60238647460938, 150.16598510742188, 157.72958374023438, 165.29319763183594, 172.85679626464844, 180.42039489746094, 187.98399353027344, 195.54759216308594, 203.11119079589844, 210.67478942871094, 218.2384033203125, 225.802001953125, 233.3656005859375, 240.92919921875, 248.4927978515625, 256.056396484375, 263.6199951171875, 271.18359375, 278.7471923828125, 286.310791015625, 293.8743896484375, 301.43798828125, 309.0016174316406, 316.5652160644531]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 6.0, 9.0, 7.0, 16.0, 25.0, 17.0, 32.0, 31.0, 48.0, 60.0, 53.0, 67.0, 55.0, 77.0, 91.0, 74.0, 56.0, 53.0, 41.0, 40.0, 29.0, 28.0, 14.0, 18.0, 8.0, 10.0, 3.0, 7.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.36074829101562, -152.4566650390625, -148.55259704589844, -144.6485137939453, -140.74444580078125, -136.84036254882812, -132.93629455566406, -129.03221130371094, -125.12814331054688, -121.22406768798828, -117.31999206542969, -113.4159164428711, -109.5118408203125, -105.6077651977539, -101.70368957519531, -97.79960632324219, -93.8955307006836, -89.991455078125, -86.0873794555664, -82.18330383300781, -78.27922821044922, -74.37515258789062, -70.4710693359375, -66.56700134277344, -62.66292190551758, -58.758846282958984, -54.85477066040039, -50.95069122314453, -47.04661560058594, -43.142539978027344, -39.23846435546875, -35.334388732910156, -31.430320739746094, -27.5262451171875, -23.622169494628906, -19.71809196472168, -15.814016342163086, -11.909940719604492, -8.005863189697266, -4.101787567138672, -0.19771194458007812, 3.706364154815674, 7.610440254211426, 11.514516830444336, 15.41859245300293, 19.322668075561523, 23.22674560546875, 27.130821228027344, 31.034896850585938, 34.93897247314453, 38.843048095703125, 42.74712371826172, 46.65119934082031, 50.555274963378906, 54.459354400634766, 58.36343002319336, 62.26750564575195, 66.17158508300781, 70.0756607055664, 73.979736328125, 77.8838119506836, 81.78788757324219, 85.69196319580078, 89.59603881835938, 93.50011444091797]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 3.0, 11.0, 13.0, 13.0, 22.0, 23.0, 54.0, 73.0, 116.0, 196.0, 347.0, 597.0, 1044.0, 2052.0, 4157.0, 9037.0, 23016.0, 67207.0, 248956.0, 492519.0, 131845.0, 39780.0, 14690.0, 6219.0, 2954.0, 1525.0, 830.0, 501.0, 262.0, 175.0, 106.0, 79.0, 40.0, 33.0, 21.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.2578125, -9.0025634765625, -8.747314453125, -8.4920654296875, -8.23681640625, -7.9815673828125, -7.726318359375, -7.4710693359375, -7.2158203125, -6.9605712890625, -6.705322265625, -6.4500732421875, -6.19482421875, -5.9395751953125, -5.684326171875, -5.4290771484375, -5.173828125, -4.9185791015625, -4.663330078125, -4.4080810546875, -4.15283203125, -3.8975830078125, -3.642333984375, -3.3870849609375, -3.1318359375, -2.8765869140625, -2.621337890625, -2.3660888671875, -2.11083984375, -1.8555908203125, -1.600341796875, -1.3450927734375, -1.08984375, -0.8345947265625, -0.579345703125, -0.3240966796875, -0.06884765625, 0.1864013671875, 0.441650390625, 0.6968994140625, 0.9521484375, 1.2073974609375, 1.462646484375, 1.7178955078125, 1.97314453125, 2.2283935546875, 2.483642578125, 2.7388916015625, 2.994140625, 3.2493896484375, 3.504638671875, 3.7598876953125, 4.01513671875, 4.2703857421875, 4.525634765625, 4.7808837890625, 5.0361328125, 5.2913818359375, 5.546630859375, 5.8018798828125, 6.05712890625, 6.3123779296875, 6.567626953125, 6.8228759765625, 7.078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 8.0, 16.0, 24.0, 19.0, 27.0, 31.0, 48.0, 38.0, 37.0, 52.0, 56.0, 65.0, 69.0, 58.0, 51.0, 56.0, 50.0, 60.0, 42.0, 32.0, 36.0, 24.0, 20.0, 12.0, 17.0, 12.0, 11.0, 7.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-10.1015625, -9.86602783203125, -9.6304931640625, -9.39495849609375, -9.159423828125, -8.92388916015625, -8.6883544921875, -8.45281982421875, -8.21728515625, -7.98175048828125, -7.7462158203125, -7.51068115234375, -7.275146484375, -7.03961181640625, -6.8040771484375, -6.56854248046875, -6.3330078125, -6.09747314453125, -5.8619384765625, -5.62640380859375, -5.390869140625, -5.15533447265625, -4.9197998046875, -4.68426513671875, -4.44873046875, -4.21319580078125, -3.9776611328125, -3.74212646484375, -3.506591796875, -3.27105712890625, -3.0355224609375, -2.79998779296875, -2.564453125, -2.32891845703125, -2.0933837890625, -1.85784912109375, -1.622314453125, -1.38677978515625, -1.1512451171875, -0.91571044921875, -0.68017578125, -0.44464111328125, -0.2091064453125, 0.02642822265625, 0.261962890625, 0.49749755859375, 0.7330322265625, 0.96856689453125, 1.2041015625, 1.43963623046875, 1.6751708984375, 1.91070556640625, 2.146240234375, 2.38177490234375, 2.6173095703125, 2.85284423828125, 3.08837890625, 3.32391357421875, 3.5594482421875, 3.79498291015625, 4.030517578125, 4.26605224609375, 4.5015869140625, 4.73712158203125, 4.97265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 8.0, 6.0, 3.0, 6.0, 11.0, 17.0, 18.0, 22.0, 25.0, 50.0, 60.0, 87.0, 142.0, 209.0, 325.0, 596.0, 1232.0, 3456.0, 16900.0, 309702.0, 683680.0, 24310.0, 4491.0, 1480.0, 686.0, 325.0, 209.0, 162.0, 91.0, 63.0, 45.0, 39.0, 27.0, 20.0, 9.0, 8.0, 7.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-15.59375, -15.16162109375, -14.7294921875, -14.29736328125, -13.865234375, -13.43310546875, -13.0009765625, -12.56884765625, -12.13671875, -11.70458984375, -11.2724609375, -10.84033203125, -10.408203125, -9.97607421875, -9.5439453125, -9.11181640625, -8.6796875, -8.24755859375, -7.8154296875, -7.38330078125, -6.951171875, -6.51904296875, -6.0869140625, -5.65478515625, -5.22265625, -4.79052734375, -4.3583984375, -3.92626953125, -3.494140625, -3.06201171875, -2.6298828125, -2.19775390625, -1.765625, -1.33349609375, -0.9013671875, -0.46923828125, -0.037109375, 0.39501953125, 0.8271484375, 1.25927734375, 1.69140625, 2.12353515625, 2.5556640625, 2.98779296875, 3.419921875, 3.85205078125, 4.2841796875, 4.71630859375, 5.1484375, 5.58056640625, 6.0126953125, 6.44482421875, 6.876953125, 7.30908203125, 7.7412109375, 8.17333984375, 8.60546875, 9.03759765625, 9.4697265625, 9.90185546875, 10.333984375, 10.76611328125, 11.1982421875, 11.63037109375, 12.0625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 6.0, 6.0, 13.0, 8.0, 8.0, 9.0, 22.0, 18.0, 15.0, 26.0, 26.0, 33.0, 44.0, 49.0, 69.0, 74.0, 95.0, 91.0, 69.0, 50.0, 43.0, 48.0, 30.0, 27.0, 15.0, 19.0, 19.0, 12.0, 12.0, 8.0, 11.0, 6.0, 5.0, 0.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.375, -27.554931640625, -26.73486328125, -25.914794921875, -25.0947265625, -24.274658203125, -23.45458984375, -22.634521484375, -21.814453125, -20.994384765625, -20.17431640625, -19.354248046875, -18.5341796875, -17.714111328125, -16.89404296875, -16.073974609375, -15.25390625, -14.433837890625, -13.61376953125, -12.793701171875, -11.9736328125, -11.153564453125, -10.33349609375, -9.513427734375, -8.693359375, -7.873291015625, -7.05322265625, -6.233154296875, -5.4130859375, -4.593017578125, -3.77294921875, -2.952880859375, -2.1328125, -1.312744140625, -0.49267578125, 0.327392578125, 1.1474609375, 1.967529296875, 2.78759765625, 3.607666015625, 4.427734375, 5.247802734375, 6.06787109375, 6.887939453125, 7.7080078125, 8.528076171875, 9.34814453125, 10.168212890625, 10.98828125, 11.808349609375, 12.62841796875, 13.448486328125, 14.2685546875, 15.088623046875, 15.90869140625, 16.728759765625, 17.548828125, 18.368896484375, 19.18896484375, 20.009033203125, 20.8291015625, 21.649169921875, 22.46923828125, 23.289306640625, 24.109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 12.0, 7.0, 11.0, 10.0, 15.0, 16.0, 21.0, 31.0, 36.0, 40.0, 89.0, 110.0, 187.0, 286.0, 432.0, 842.0, 1576.0, 3432.0, 8656.0, 28058.0, 236348.0, 716511.0, 34043.0, 9933.0, 3765.0, 1798.0, 858.0, 498.0, 275.0, 174.0, 133.0, 95.0, 40.0, 40.0, 38.0, 23.0, 24.0, 19.0, 9.0, 12.0, 9.0, 10.0, 7.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0], "bins": [-1.65234375, -1.6023712158203125, -1.552398681640625, -1.5024261474609375, -1.45245361328125, -1.4024810791015625, -1.352508544921875, -1.3025360107421875, -1.2525634765625, -1.2025909423828125, -1.152618408203125, -1.1026458740234375, -1.05267333984375, -1.0027008056640625, -0.952728271484375, -0.9027557373046875, -0.852783203125, -0.8028106689453125, -0.752838134765625, -0.7028656005859375, -0.65289306640625, -0.6029205322265625, -0.552947998046875, -0.5029754638671875, -0.4530029296875, -0.4030303955078125, -0.353057861328125, -0.3030853271484375, -0.25311279296875, -0.2031402587890625, -0.153167724609375, -0.1031951904296875, -0.05322265625, -0.0032501220703125, 0.046722412109375, 0.0966949462890625, 0.14666748046875, 0.1966400146484375, 0.246612548828125, 0.2965850830078125, 0.3465576171875, 0.3965301513671875, 0.446502685546875, 0.4964752197265625, 0.54644775390625, 0.5964202880859375, 0.646392822265625, 0.6963653564453125, 0.746337890625, 0.7963104248046875, 0.846282958984375, 0.8962554931640625, 0.94622802734375, 0.9962005615234375, 1.046173095703125, 1.0961456298828125, 1.1461181640625, 1.1960906982421875, 1.246063232421875, 1.2960357666015625, 1.34600830078125, 1.3959808349609375, 1.445953369140625, 1.4959259033203125, 1.5458984375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 10.0, 12.0, 29.0, 28.0, 37.0, 62.0, 110.0, 192.0, 192.0, 119.0, 59.0, 34.0, 21.0, 18.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008893013000488281, -0.0008623376488685608, -0.0008353739976882935, -0.0008084103465080261, -0.0007814466953277588, -0.0007544830441474915, -0.0007275193929672241, -0.0007005557417869568, -0.0006735920906066895, -0.0006466284394264221, -0.0006196647882461548, -0.0005927011370658875, -0.0005657374858856201, -0.0005387738347053528, -0.0005118101835250854, -0.0004848465323448181, -0.0004578828811645508, -0.00043091922998428345, -0.0004039555788040161, -0.0003769919276237488, -0.00035002827644348145, -0.0003230646252632141, -0.0002961009740829468, -0.00026913732290267944, -0.0002421736717224121, -0.00021521002054214478, -0.00018824636936187744, -0.0001612827181816101, -0.00013431906700134277, -0.00010735541582107544, -8.03917646408081e-05, -5.342811346054077e-05, -2.6464462280273438e-05, 4.991888999938965e-07, 2.746284008026123e-05, 5.4426491260528564e-05, 8.13901424407959e-05, 0.00010835379362106323, 0.00013531744480133057, 0.0001622810959815979, 0.00018924474716186523, 0.00021620839834213257, 0.0002431720495223999, 0.00027013570070266724, 0.00029709935188293457, 0.0003240630030632019, 0.00035102665424346924, 0.00037799030542373657, 0.0004049539566040039, 0.00043191760778427124, 0.0004588812589645386, 0.0004858449101448059, 0.0005128085613250732, 0.0005397722125053406, 0.0005667358636856079, 0.0005936995148658752, 0.0006206631660461426, 0.0006476268172264099, 0.0006745904684066772, 0.0007015541195869446, 0.0007285177707672119, 0.0007554814219474792, 0.0007824450731277466, 0.0008094087243080139, 0.0008363723754882812]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 12.0, 12.0, 18.0, 34.0, 55.0, 84.0, 127.0, 214.0, 419.0, 809.0, 1682.0, 3844.0, 10577.0, 35167.0, 507871.0, 435746.0, 34371.0, 10183.0, 3868.0, 1687.0, 782.0, 401.0, 229.0, 132.0, 67.0, 53.0, 34.0, 16.0, 14.0, 8.0, 10.0, 7.0, 6.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.787109375, -1.7294464111328125, -1.671783447265625, -1.6141204833984375, -1.55645751953125, -1.4987945556640625, -1.441131591796875, -1.3834686279296875, -1.3258056640625, -1.2681427001953125, -1.210479736328125, -1.1528167724609375, -1.09515380859375, -1.0374908447265625, -0.979827880859375, -0.9221649169921875, -0.864501953125, -0.8068389892578125, -0.749176025390625, -0.6915130615234375, -0.63385009765625, -0.5761871337890625, -0.518524169921875, -0.4608612060546875, -0.4031982421875, -0.3455352783203125, -0.287872314453125, -0.2302093505859375, -0.17254638671875, -0.1148834228515625, -0.057220458984375, 0.0004425048828125, 0.05810546875, 0.1157684326171875, 0.173431396484375, 0.2310943603515625, 0.28875732421875, 0.3464202880859375, 0.404083251953125, 0.4617462158203125, 0.5194091796875, 0.5770721435546875, 0.634735107421875, 0.6923980712890625, 0.75006103515625, 0.8077239990234375, 0.865386962890625, 0.9230499267578125, 0.980712890625, 1.0383758544921875, 1.096038818359375, 1.1537017822265625, 1.21136474609375, 1.2690277099609375, 1.326690673828125, 1.3843536376953125, 1.4420166015625, 1.4996795654296875, 1.557342529296875, 1.6150054931640625, 1.67266845703125, 1.7303314208984375, 1.787994384765625, 1.8456573486328125, 1.9033203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 10.0, 5.0, 3.0, 12.0, 5.0, 6.0, 19.0, 22.0, 17.0, 37.0, 45.0, 64.0, 107.0, 106.0, 119.0, 113.0, 81.0, 58.0, 34.0, 28.0, 17.0, 18.0, 21.0, 12.0, 8.0, 6.0, 7.0, 2.0, 6.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.107421875, -2.0442047119140625, -1.980987548828125, -1.9177703857421875, -1.85455322265625, -1.7913360595703125, -1.728118896484375, -1.6649017333984375, -1.6016845703125, -1.5384674072265625, -1.475250244140625, -1.4120330810546875, -1.34881591796875, -1.2855987548828125, -1.222381591796875, -1.1591644287109375, -1.095947265625, -1.0327301025390625, -0.969512939453125, -0.9062957763671875, -0.84307861328125, -0.7798614501953125, -0.716644287109375, -0.6534271240234375, -0.5902099609375, -0.5269927978515625, -0.463775634765625, -0.4005584716796875, -0.33734130859375, -0.2741241455078125, -0.210906982421875, -0.1476898193359375, -0.08447265625, -0.0212554931640625, 0.041961669921875, 0.1051788330078125, 0.16839599609375, 0.2316131591796875, 0.294830322265625, 0.3580474853515625, 0.4212646484375, 0.4844818115234375, 0.547698974609375, 0.6109161376953125, 0.67413330078125, 0.7373504638671875, 0.800567626953125, 0.8637847900390625, 0.927001953125, 0.9902191162109375, 1.053436279296875, 1.1166534423828125, 1.17987060546875, 1.2430877685546875, 1.306304931640625, 1.3695220947265625, 1.4327392578125, 1.4959564208984375, 1.559173583984375, 1.6223907470703125, 1.68560791015625, 1.7488250732421875, 1.812042236328125, 1.8752593994140625, 1.9384765625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 11.0, 19.0, 37.0, 70.0, 160.0, 493.0, 98.0, 41.0, 32.0, 18.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-153.13253784179688, -149.51748657226562, -145.90245056152344, -142.2873992919922, -138.67236328125, -135.05731201171875, -131.4422607421875, -127.82722473144531, -124.21217346191406, -120.59712982177734, -116.98208618164062, -113.36703491210938, -109.75199127197266, -106.13694763183594, -102.52190399169922, -98.9068603515625, -95.29181671142578, -91.67677307128906, -88.06172943115234, -84.44668579101562, -80.83163452148438, -77.21659088134766, -73.60154724121094, -69.98650360107422, -66.3714599609375, -62.75641632080078, -59.1413688659668, -55.52632522583008, -51.911277770996094, -48.296234130859375, -44.681190490722656, -41.06614685058594, -37.45109558105469, -33.83605194091797, -30.221004486083984, -26.605960845947266, -22.990915298461914, -19.375869750976562, -15.760826110839844, -12.145780563354492, -8.53073501586914, -4.915689945220947, -1.300644874572754, 2.3143997192382812, 5.929445266723633, 9.544490814208984, 13.159534454345703, 16.774580001831055, 20.389625549316406, 24.004671096801758, 27.61971664428711, 31.234760284423828, 34.84980773925781, 38.46485137939453, 42.07989501953125, 45.69493865966797, 49.30998611450195, 52.92502975463867, 56.540077209472656, 60.155120849609375, 63.770164489746094, 67.38520812988281, 71.00025939941406, 74.61530303955078, 78.2303466796875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 7.0, 8.0, 5.0, 7.0, 9.0, 8.0, 10.0, 15.0, 20.0, 19.0, 15.0, 17.0, 24.0, 18.0, 39.0, 102.0, 137.0, 152.0, 124.0, 42.0, 26.0, 22.0, 24.0, 17.0, 24.0, 13.0, 14.0, 10.0, 8.0, 14.0, 8.0, 7.0, 6.0, 3.0, 7.0, 2.0, 7.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-70.59358215332031, -68.57595825195312, -66.55833435058594, -64.54070281982422, -62.52307891845703, -60.505455017089844, -58.48782730102539, -56.47019958496094, -54.45257568359375, -52.43495178222656, -50.41732406616211, -48.399696350097656, -46.38207244873047, -44.36444854736328, -42.34682083129883, -40.329193115234375, -38.31156921386719, -36.2939453125, -34.27631759643555, -32.258689880371094, -30.241065979003906, -28.223440170288086, -26.205814361572266, -24.188188552856445, -22.170562744140625, -20.152936935424805, -18.135311126708984, -16.117685317993164, -14.100059509277344, -12.082433700561523, -10.064807891845703, -8.047182083129883, -6.029563903808594, -4.011938095092773, -1.9943122863769531, 0.023313522338867188, 2.0409393310546875, 4.058565139770508, 6.076190948486328, 8.093816757202148, 10.111442565917969, 12.129068374633789, 14.14669418334961, 16.16431999206543, 18.18194580078125, 20.19957160949707, 22.21719741821289, 24.23482322692871, 26.25244903564453, 28.27007484436035, 30.287700653076172, 32.305328369140625, 34.32295227050781, 36.340576171875, 38.35820388793945, 40.375831604003906, 42.393455505371094, 44.41107940673828, 46.428707122802734, 48.44633483886719, 50.463958740234375, 52.48158264160156, 54.499210357666016, 56.51683807373047, 58.534461975097656]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 15.0, 16.0, 23.0, 30.0, 38.0, 53.0, 63.0, 180.0, 282.0, 62.0, 50.0, 49.0, 31.0, 35.0, 13.0, 17.0, 7.0, 3.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.890625, -14.5601806640625, -14.229736328125, -13.8992919921875, -13.56884765625, -13.2384033203125, -12.907958984375, -12.5775146484375, -12.2470703125, -11.9166259765625, -11.586181640625, -11.2557373046875, -10.92529296875, -10.5948486328125, -10.264404296875, -9.9339599609375, -9.603515625, -9.2730712890625, -8.942626953125, -8.6121826171875, -8.28173828125, -7.9512939453125, -7.620849609375, -7.2904052734375, -6.9599609375, -6.6295166015625, -6.299072265625, -5.9686279296875, -5.63818359375, -5.3077392578125, -4.977294921875, -4.6468505859375, -4.31640625, -3.9859619140625, -3.655517578125, -3.3250732421875, -2.99462890625, -2.6641845703125, -2.333740234375, -2.0032958984375, -1.6728515625, -1.3424072265625, -1.011962890625, -0.6815185546875, -0.35107421875, -0.0206298828125, 0.309814453125, 0.6402587890625, 0.970703125, 1.3011474609375, 1.631591796875, 1.9620361328125, 2.29248046875, 2.6229248046875, 2.953369140625, 3.2838134765625, 3.6142578125, 3.9447021484375, 4.275146484375, 4.6055908203125, 4.93603515625, 5.2664794921875, 5.596923828125, 5.9273681640625, 6.2578125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 10.0, 4.0, 10.0, 18.0, 27.0, 38.0, 63.0, 114.0, 211.0, 444.0, 1582.0, 9004.0, 8345523.0, 27309.0, 2810.0, 760.0, 259.0, 137.0, 78.0, 44.0, 53.0, 18.0, 20.0, 9.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0, 2.0, 6.0, 2.0, 1.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.94425201416016, -85.2537841796875, -82.56331634521484, -79.87284851074219, -77.18238067626953, -74.49191284179688, -71.80144500732422, -69.11097717285156, -66.4205093383789, -63.73004150390625, -61.039573669433594, -58.34910583496094, -55.65863800048828, -52.968170166015625, -50.27770233154297, -47.58723449707031, -44.896766662597656, -42.206298828125, -39.515830993652344, -36.82536315917969, -34.13489532470703, -31.444427490234375, -28.75395965576172, -26.063491821289062, -23.373023986816406, -20.68255615234375, -17.992088317871094, -15.301620483398438, -12.611152648925781, -9.920684814453125, -7.230216979980469, -4.5397491455078125, -1.849273681640625, 0.8411941528320312, 3.5316619873046875, 6.222129821777344, 8.91259765625, 11.603065490722656, 14.293533325195312, 16.98400115966797, 19.674468994140625, 22.36493682861328, 25.055404663085938, 27.745872497558594, 30.43634033203125, 33.126808166503906, 35.81727600097656, 38.50774383544922, 41.198211669921875, 43.88867950439453, 46.57914733886719, 49.269615173339844, 51.9600830078125, 54.650550842285156, 57.34101867675781, 60.03148651123047, 62.721954345703125, 65.41242218017578, 68.10289001464844, 70.7933578491211, 73.48382568359375, 76.1742935180664, 78.86476135253906, 81.55522918701172, 84.24569702148438]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 7.0, 5.0, 9.0, 5.0, 3.0, 5.0, 6.0, 4.0, 3.0, 5.0, 2.0, 5.0, 3.0, 7.0, 2.0, 0.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.10792541503906, -154.2130584716797, -149.31817626953125, -144.42330932617188, -139.5284423828125, -134.63357543945312, -129.7386932373047, -124.84382629394531, -119.9489517211914, -115.0540771484375, -110.15921020507812, -105.26433563232422, -100.36946105957031, -95.47459411621094, -90.57971954345703, -85.68484497070312, -80.78997802734375, -75.89510345458984, -71.00023651123047, -66.10536193847656, -61.21049118041992, -56.31562042236328, -51.420745849609375, -46.525875091552734, -41.631004333496094, -36.73613357543945, -31.84126091003418, -26.946388244628906, -22.051517486572266, -17.156646728515625, -12.261774063110352, -7.366901397705078, -2.4720458984375, 2.422825813293457, 7.317697525024414, 12.212569236755371, 17.107440948486328, 22.00231170654297, 26.897184371948242, 31.792057037353516, 36.686927795410156, 41.5817985534668, 46.47666931152344, 51.371543884277344, 56.266414642333984, 61.161285400390625, 66.05615997314453, 70.95103454589844, 75.84590148925781, 80.74077606201172, 85.6356430053711, 90.530517578125, 95.42538452148438, 100.32025909423828, 105.21513366699219, 110.11000061035156, 115.00487518310547, 119.89974975585938, 124.79461669921875, 129.68948364257812, 134.58436584472656, 139.47923278808594, 144.3740997314453, 149.26898193359375, 154.16384887695312]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 13.0, 21.0, 28.0, 36.0, 78.0, 73.0, 176.0, 270.0, 476.0, 902.0, 1887.0, 4420.0, 12349.0, 37975.0, 125270.0, 212674.0, 85924.0, 26423.0, 8819.0, 3320.0, 1504.0, 699.0, 372.0, 201.0, 134.0, 67.0, 50.0, 29.0, 23.0, 17.0, 5.0, 9.0, 1.0, 0.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-62.90625, -61.1259765625, -59.345703125, -57.5654296875, -55.78515625, -54.0048828125, -52.224609375, -50.4443359375, -48.6640625, -46.8837890625, -45.103515625, -43.3232421875, -41.54296875, -39.7626953125, -37.982421875, -36.2021484375, -34.421875, -32.6416015625, -30.861328125, -29.0810546875, -27.30078125, -25.5205078125, -23.740234375, -21.9599609375, -20.1796875, -18.3994140625, -16.619140625, -14.8388671875, -13.05859375, -11.2783203125, -9.498046875, -7.7177734375, -5.9375, -4.1572265625, -2.376953125, -0.5966796875, 1.18359375, 2.9638671875, 4.744140625, 6.5244140625, 8.3046875, 10.0849609375, 11.865234375, 13.6455078125, 15.42578125, 17.2060546875, 18.986328125, 20.7666015625, 22.546875, 24.3271484375, 26.107421875, 27.8876953125, 29.66796875, 31.4482421875, 33.228515625, 35.0087890625, 36.7890625, 38.5693359375, 40.349609375, 42.1298828125, 43.91015625, 45.6904296875, 47.470703125, 49.2509765625, 51.03125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 15.0, 20.0, 29.0, 45.0, 59.0, 80.0, 100.0, 127.0, 133.0, 81.0, 78.0, 63.0, 45.0, 37.0, 20.0, 24.0, 11.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.611328125, -10.24609375, -9.880859375, -9.515625, -9.150390625, -8.78515625, -8.419921875, -8.0546875, -7.689453125, -7.32421875, -6.958984375, -6.59375, -6.228515625, -5.86328125, -5.498046875, -5.1328125, -4.767578125, -4.40234375, -4.037109375, -3.671875, -3.306640625, -2.94140625, -2.576171875, -2.2109375, -1.845703125, -1.48046875, -1.115234375, -0.75, -0.384765625, -0.01953125, 0.345703125, 0.7109375, 1.076171875, 1.44140625, 1.806640625, 2.171875, 2.537109375, 2.90234375, 3.267578125, 3.6328125, 3.998046875, 4.36328125, 4.728515625, 5.09375, 5.458984375, 5.82421875, 6.189453125, 6.5546875, 6.919921875, 7.28515625, 7.650390625, 8.015625, 8.380859375, 8.74609375, 9.111328125, 9.4765625, 9.841796875, 10.20703125, 10.572265625, 10.9375, 11.302734375, 11.66796875, 12.033203125, 12.3984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 4.0, 1.0, 6.0, 7.0, 4.0, 15.0, 25.0, 14.0, 31.0, 65.0, 58.0, 75.0, 59.0, 34.0, 27.0, 18.0, 3.0, 8.0, 4.0, 4.0, 2.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.72188949584961, -53.93724060058594, -52.152591705322266, -50.367942810058594, -48.58329391479492, -46.79864501953125, -45.01399230957031, -43.229347229003906, -41.44469451904297, -39.6600456237793, -37.875396728515625, -36.09074783325195, -34.30609893798828, -32.52145004272461, -30.736799240112305, -28.952150344848633, -27.167503356933594, -25.382854461669922, -23.59820556640625, -21.813556671142578, -20.028907775878906, -18.244258880615234, -16.45960807800293, -14.674959182739258, -12.890310287475586, -11.105661392211914, -9.321012496948242, -7.536362648010254, -5.751713752746582, -3.96706485748291, -2.182415008544922, -0.39776611328125, 1.3868827819824219, 3.171531915664673, 4.956181049346924, 6.740830421447754, 8.525479316711426, 10.310128211975098, 12.094778060913086, 13.879426956176758, 15.66407585144043, 17.4487247467041, 19.233373641967773, 21.018024444580078, 22.80267333984375, 24.587322235107422, 26.371971130371094, 28.156620025634766, 29.941268920898438, 31.72591781616211, 33.51056671142578, 35.29521560668945, 37.079864501953125, 38.8645133972168, 40.64916229248047, 42.433815002441406, 44.21846008300781, 46.003108978271484, 47.787757873535156, 49.57240676879883, 51.3570556640625, 53.14170455932617, 54.926353454589844, 56.71100616455078, 58.49565505981445]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 7.0, 4.0, 8.0, 16.0, 9.0, 19.0, 37.0, 55.0, 71.0, 70.0, 65.0, 43.0, 17.0, 15.0, 9.0, 5.0, 7.0, 6.0, 2.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.547569274902344, -40.342533111572266, -39.13750076293945, -37.932464599609375, -36.72743225097656, -35.522396087646484, -34.317359924316406, -33.112327575683594, -31.907291412353516, -30.70225715637207, -29.497222900390625, -28.292186737060547, -27.0871524810791, -25.882118225097656, -24.677082061767578, -23.472047805786133, -22.267013549804688, -21.061979293823242, -19.856945037841797, -18.65190887451172, -17.446874618530273, -16.241840362548828, -15.036805152893066, -13.831769943237305, -12.62673568725586, -11.421701431274414, -10.216666221618652, -9.01163101196289, -7.806596755981445, -6.601562023162842, -5.396527290344238, -4.191492080688477, -2.9864578247070312, -1.7814230918884277, -0.5763883590698242, 0.6286463737487793, 1.8336811065673828, 3.0387158393859863, 4.24375057220459, 5.448785781860352, 6.653820037841797, 7.8588547706604, 9.063889503479004, 10.268924713134766, 11.473958969116211, 12.678993225097656, 13.884028434753418, 15.08906364440918, 16.294097900390625, 17.49913215637207, 18.704166412353516, 19.909202575683594, 21.11423683166504, 22.319271087646484, 23.524307250976562, 24.729341506958008, 25.934375762939453, 27.1394100189209, 28.344444274902344, 29.549480438232422, 30.754514694213867, 31.959548950195312, 33.16458511352539, 34.36962127685547, 35.57465362548828]}, "eval/loss": 1.818001627922058, "eval/wer": 0.2663625545418485, "eval/runtime": 915.1002, "eval/samples_per_second": 2.887, "eval/steps_per_second": 0.362, "train/train_runtime": 108037.8512, "train/train_samples_per_second": 5.283, "train/train_steps_per_second": 0.165, "train/total_flos": 0.0, "train/train_loss": 2.302149100206905} \ No newline at end of file